diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.0396, "train/learning_rate": 0.00018623309263299647, "train/epoch": 1.39, "train/global_step": 4500, "_runtime": 42345, "_timestamp": 1651716434, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 132.0, 854.0, 28.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.91638946533203, -36.24909591674805, -35.58180618286133, -34.914512634277344, -34.24721908569336, -33.579925537109375, -32.912635803222656, -32.24534225463867, -31.57805061340332, -30.91075897216797, -30.243465423583984, -29.576173782348633, -28.90888023376465, -28.241588592529297, -27.574295043945312, -26.90700340270996, -26.23971176147461, -25.572420120239258, -24.905126571655273, -24.237834930419922, -23.570541381835938, -22.903249740600586, -22.235958099365234, -21.56866455078125, -20.901371002197266, -20.234079360961914, -19.56678581237793, -18.899494171142578, -18.232200622558594, -17.564908981323242, -16.89761734008789, -16.230323791503906, -15.563033103942871, -14.895740509033203, -14.228447914123535, -13.561155319213867, -12.893863677978516, -12.226571083068848, -11.55927848815918, -10.891986846923828, -10.224693298339844, -9.557400703430176, -8.890108108520508, -8.222816467285156, -7.555523872375488, -6.88823127746582, -6.220938682556152, -5.553646564483643, -4.886354446411133, -4.219061851501465, -3.551769733428955, -2.884477138519287, -2.2171847820281982, -1.5498924255371094, -0.8825998306274414, -0.21530771255493164, 0.45198488235473633, 1.1192772388458252, 1.7865697145462036, 2.453862190246582, 3.121154546737671, 3.7884469032287598, 4.455739498138428, 5.1230316162109375, 5.7903242111206055]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 12.0, 14.0, 22.0, 22.0, 21.0, 28.0, 36.0, 40.0, 41.0, 66.0, 46.0, 66.0, 55.0, 72.0, 52.0, 63.0, 52.0, 50.0, 39.0, 28.0, 46.0, 35.0, 22.0, 22.0, 14.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4424476623535156, -2.321978807449341, -2.201509952545166, -2.0810413360595703, -1.9605724811553955, -1.8401036262512207, -1.719634771347046, -1.599165916442871, -1.4786971807479858, -1.358228325843811, -1.2377595901489258, -1.117290735244751, -0.996821939945221, -0.8763531446456909, -0.7558842897415161, -0.6354154944419861, -0.514946699142456, -0.394477903842926, -0.2740090787410736, -0.1535402536392212, -0.03307145833969116, 0.08739733695983887, 0.20786619186401367, 0.3283349871635437, 0.44880378246307373, 0.5692725777626038, 0.6897413730621338, 0.8102102279663086, 0.9306790232658386, 1.0511478185653687, 1.1716166734695435, 1.2920854091644287, 1.4125542640686035, 1.5330231189727783, 1.6534918546676636, 1.7739607095718384, 1.8944294452667236, 2.0148983001708984, 2.1353671550750732, 2.255836009979248, 2.3763046264648438, 2.4967734813690186, 2.6172423362731934, 2.737710952758789, 2.858179807662964, 2.9786486625671387, 3.0991175174713135, 3.2195863723754883, 3.340055227279663, 3.460524082183838, 3.5809929370880127, 3.7014617919921875, 3.821930408477783, 3.942399263381958, 4.062868118286133, 4.1833367347717285, 4.303805828094482, 4.424274444580078, 4.544743537902832, 4.665212154388428, 4.785681247711182, 4.906149864196777, 5.026618957519531, 5.147087574005127, 5.267556190490723]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 10.0, 12.0, 13.0, 32.0, 51.0, 85.0, 135.0, 263.0, 454.0, 835.0, 1586.0, 2992.0, 6175.0, 13390.0, 30167.0, 69830.0, 196738.0, 2490394.0, 1116467.0, 156262.0, 60251.0, 25884.0, 11364.0, 5408.0, 2577.0, 1338.0, 696.0, 364.0, 209.0, 112.0, 85.0, 45.0, 21.0, 12.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.052734375, -1.9921722412109375, -1.931610107421875, -1.8710479736328125, -1.81048583984375, -1.7499237060546875, -1.689361572265625, -1.6287994384765625, -1.5682373046875, -1.5076751708984375, -1.447113037109375, -1.3865509033203125, -1.32598876953125, -1.2654266357421875, -1.204864501953125, -1.1443023681640625, -1.083740234375, -1.0231781005859375, -0.962615966796875, -0.9020538330078125, -0.84149169921875, -0.7809295654296875, -0.720367431640625, -0.6598052978515625, -0.5992431640625, -0.5386810302734375, -0.478118896484375, -0.4175567626953125, -0.35699462890625, -0.2964324951171875, -0.235870361328125, -0.1753082275390625, -0.11474609375, -0.0541839599609375, 0.006378173828125, 0.0669403076171875, 0.12750244140625, 0.1880645751953125, 0.248626708984375, 0.3091888427734375, 0.3697509765625, 0.4303131103515625, 0.490875244140625, 0.5514373779296875, 0.61199951171875, 0.6725616455078125, 0.733123779296875, 0.7936859130859375, 0.854248046875, 0.9148101806640625, 0.975372314453125, 1.0359344482421875, 1.09649658203125, 1.1570587158203125, 1.217620849609375, 1.2781829833984375, 1.3387451171875, 1.3993072509765625, 1.459869384765625, 1.5204315185546875, 1.58099365234375, 1.6415557861328125, 1.702117919921875, 1.7626800537109375, 1.8232421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 13.0, 11.0, 15.0, 26.0, 21.0, 21.0, 32.0, 42.0, 48.0, 50.0, 71.0, 56.0, 78.0, 68.0, 57.0, 59.0, 50.0, 54.0, 47.0, 30.0, 38.0, 32.0, 16.0, 23.0, 16.0, 7.0, 5.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.794891357421875, -2.68548583984375, -2.576080322265625, -2.4666748046875, -2.357269287109375, -2.24786376953125, -2.138458251953125, -2.029052734375, -1.919647216796875, -1.81024169921875, -1.700836181640625, -1.5914306640625, -1.482025146484375, -1.37261962890625, -1.263214111328125, -1.15380859375, -1.044403076171875, -0.93499755859375, -0.825592041015625, -0.7161865234375, -0.606781005859375, -0.49737548828125, -0.387969970703125, -0.278564453125, -0.169158935546875, -0.05975341796875, 0.049652099609375, 0.1590576171875, 0.268463134765625, 0.37786865234375, 0.487274169921875, 0.5966796875, 0.706085205078125, 0.81549072265625, 0.924896240234375, 1.0343017578125, 1.143707275390625, 1.25311279296875, 1.362518310546875, 1.471923828125, 1.581329345703125, 1.69073486328125, 1.800140380859375, 1.9095458984375, 2.018951416015625, 2.12835693359375, 2.237762451171875, 2.34716796875, 2.456573486328125, 2.56597900390625, 2.675384521484375, 2.7847900390625, 2.894195556640625, 3.00360107421875, 3.113006591796875, 3.222412109375, 3.331817626953125, 3.44122314453125, 3.550628662109375, 3.6600341796875, 3.769439697265625, 3.87884521484375, 3.988250732421875, 4.09765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 25.0, 35.0, 53.0, 83.0, 207.0, 4789.0, 4188374.0, 355.0, 110.0, 58.0, 45.0, 34.0, 13.0, 22.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.4375, -78.0126953125, -75.587890625, -73.1630859375, -70.73828125, -68.3134765625, -65.888671875, -63.4638671875, -61.0390625, -58.6142578125, -56.189453125, -53.7646484375, -51.33984375, -48.9150390625, -46.490234375, -44.0654296875, -41.640625, -39.2158203125, -36.791015625, -34.3662109375, -31.94140625, -29.5166015625, -27.091796875, -24.6669921875, -22.2421875, -19.8173828125, -17.392578125, -14.9677734375, -12.54296875, -10.1181640625, -7.693359375, -5.2685546875, -2.84375, -0.4189453125, 2.005859375, 4.4306640625, 6.85546875, 9.2802734375, 11.705078125, 14.1298828125, 16.5546875, 18.9794921875, 21.404296875, 23.8291015625, 26.25390625, 28.6787109375, 31.103515625, 33.5283203125, 35.953125, 38.3779296875, 40.802734375, 43.2275390625, 45.65234375, 48.0771484375, 50.501953125, 52.9267578125, 55.3515625, 57.7763671875, 60.201171875, 62.6259765625, 65.05078125, 67.4755859375, 69.900390625, 72.3251953125, 74.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 16.0, 17.0, 27.0, 33.0, 53.0, 87.0, 171.0, 855.0, 2177.0, 276.0, 116.0, 54.0, 46.0, 31.0, 25.0, 17.0, 8.0, 14.0, 6.0, 6.0, 3.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.38470458984375, -1.3416748046875, -1.29864501953125, -1.255615234375, -1.21258544921875, -1.1695556640625, -1.12652587890625, -1.08349609375, -1.04046630859375, -0.9974365234375, -0.95440673828125, -0.911376953125, -0.86834716796875, -0.8253173828125, -0.78228759765625, -0.7392578125, -0.69622802734375, -0.6531982421875, -0.61016845703125, -0.567138671875, -0.52410888671875, -0.4810791015625, -0.43804931640625, -0.39501953125, -0.35198974609375, -0.3089599609375, -0.26593017578125, -0.222900390625, -0.17987060546875, -0.1368408203125, -0.09381103515625, -0.05078125, -0.00775146484375, 0.0352783203125, 0.07830810546875, 0.121337890625, 0.16436767578125, 0.2073974609375, 0.25042724609375, 0.29345703125, 0.33648681640625, 0.3795166015625, 0.42254638671875, 0.465576171875, 0.50860595703125, 0.5516357421875, 0.59466552734375, 0.6376953125, 0.68072509765625, 0.7237548828125, 0.76678466796875, 0.809814453125, 0.85284423828125, 0.8958740234375, 0.93890380859375, 0.98193359375, 1.02496337890625, 1.0679931640625, 1.11102294921875, 1.154052734375, 1.19708251953125, 1.2401123046875, 1.28314208984375, 1.326171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 9.0, 16.0, 22.0, 42.0, 78.0, 77.0, 98.0, 115.0, 139.0, 104.0, 87.0, 58.0, 43.0, 32.0, 24.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0522964000701904, -2.92010498046875, -2.7879137992858887, -2.6557223796844482, -2.523530960083008, -2.3913397789001465, -2.259148359298706, -2.1269569396972656, -1.9947656393051147, -1.8625743389129639, -1.7303829193115234, -1.5981916189193726, -1.4660003185272217, -1.3338088989257812, -1.2016175985336304, -1.0694262981414795, -0.9372348785400391, -0.8050435185432434, -0.6728521585464478, -0.5406608581542969, -0.4084694981575012, -0.27627813816070557, -0.1440868377685547, -0.011895477771759033, 0.12029588222503662, 0.2524872422218323, 0.38467857241630554, 0.5168699026107788, 0.6490612626075745, 0.7812526226043701, 0.913443922996521, 1.0456352233886719, 1.1778268814086914, 1.3100181818008423, 1.4422096014022827, 1.5744009017944336, 1.706592321395874, 1.838783621788025, 1.9709749221801758, 2.103166341781616, 2.2353577613830566, 2.367549180984497, 2.4997403621673584, 2.631931781768799, 2.7641232013702393, 2.8963146209716797, 3.028505802154541, 3.1606972217559814, 3.2928884029388428, 3.425079822540283, 3.5572710037231445, 3.689462423324585, 3.8216538429260254, 3.9538450241088867, 4.086036682128906, 4.218227863311768, 4.350419044494629, 4.48261022567749, 4.61480188369751, 4.746993064880371, 4.879184246063232, 5.011375904083252, 5.143567085266113, 5.275758266448975, 5.407949924468994]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 4.0, 5.0, 6.0, 12.0, 14.0, 22.0, 15.0, 43.0, 29.0, 26.0, 29.0, 47.0, 50.0, 43.0, 45.0, 53.0, 34.0, 47.0, 58.0, 36.0, 46.0, 44.0, 38.0, 36.0, 38.0, 36.0, 36.0, 19.0, 22.0, 18.0, 14.0, 10.0, 3.0, 8.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.438009262084961, -2.351890802383423, -2.2657723426818848, -2.1796538829803467, -2.0935354232788086, -2.0074169635772705, -1.921298623085022, -1.8351801633834839, -1.7490617036819458, -1.6629432439804077, -1.5768247842788696, -1.490706443786621, -1.404587984085083, -1.318469524383545, -1.2323510646820068, -1.1462326049804688, -1.0601141452789307, -0.9739956855773926, -0.8878772258758545, -0.8017588257789612, -0.7156403660774231, -0.629521906375885, -0.5434035062789917, -0.4572850465774536, -0.3711665868759155, -0.28504812717437744, -0.19892969727516174, -0.11281126737594604, -0.02669280767440796, 0.05942565202713013, 0.14554405212402344, 0.23166251182556152, 0.3177812099456787, 0.4038996696472168, 0.4900180995464325, 0.5761365294456482, 0.6622549891471863, 0.7483734488487244, 0.8344918489456177, 0.9206103086471558, 1.0067287683486938, 1.092847228050232, 1.17896568775177, 1.2650840282440186, 1.3512024879455566, 1.4373209476470947, 1.5234394073486328, 1.609557867050171, 1.695676326751709, 1.781794786453247, 1.8679132461547852, 1.9540317058563232, 2.0401501655578613, 2.1262686252593994, 2.2123870849609375, 2.2985053062438965, 2.3846240043640137, 2.4707424640655518, 2.55686092376709, 2.642979383468628, 2.729097843170166, 2.815216302871704, 2.901334762573242, 2.987452983856201, 3.0735714435577393]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 16.0, 15.0, 13.0, 19.0, 26.0, 34.0, 51.0, 87.0, 107.0, 176.0, 231.0, 350.0, 575.0, 987.0, 1727.0, 3410.0, 7745.0, 19143.0, 53209.0, 160161.0, 399956.0, 261177.0, 87290.0, 29925.0, 11608.0, 4885.0, 2328.0, 1199.0, 706.0, 425.0, 323.0, 198.0, 127.0, 81.0, 55.0, 33.0, 39.0, 24.0, 25.0, 15.0, 4.0, 6.0, 10.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3616142272949219, -0.34944915771484375, -0.3372840881347656, -0.3251190185546875, -0.3129539489746094, -0.30078887939453125, -0.2886238098144531, -0.276458740234375, -0.2642936706542969, -0.25212860107421875, -0.23996353149414062, -0.2277984619140625, -0.21563339233398438, -0.20346832275390625, -0.19130325317382812, -0.17913818359375, -0.16697311401367188, -0.15480804443359375, -0.14264297485351562, -0.1304779052734375, -0.11831283569335938, -0.10614776611328125, -0.09398269653320312, -0.081817626953125, -0.06965255737304688, -0.05748748779296875, -0.045322418212890625, -0.0331573486328125, -0.020992279052734375, -0.00882720947265625, 0.003337860107421875, 0.0155029296875, 0.027667999267578125, 0.03983306884765625, 0.051998138427734375, 0.0641632080078125, 0.07632827758789062, 0.08849334716796875, 0.10065841674804688, 0.112823486328125, 0.12498855590820312, 0.13715362548828125, 0.14931869506835938, 0.1614837646484375, 0.17364883422851562, 0.18581390380859375, 0.19797897338867188, 0.21014404296875, 0.22230911254882812, 0.23447418212890625, 0.24663925170898438, 0.2588043212890625, 0.2709693908691406, 0.28313446044921875, 0.2952995300292969, 0.307464599609375, 0.3196296691894531, 0.33179473876953125, 0.3439598083496094, 0.3561248779296875, 0.3682899475097656, 0.38045501708984375, 0.3926200866699219, 0.40478515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 4.0, 3.0, 5.0, 6.0, 9.0, 11.0, 23.0, 26.0, 28.0, 24.0, 23.0, 38.0, 49.0, 38.0, 31.0, 55.0, 49.0, 48.0, 42.0, 37.0, 35.0, 56.0, 50.0, 23.0, 39.0, 35.0, 42.0, 35.0, 23.0, 23.0, 18.0, 16.0, 10.0, 14.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8449249267578125, -1.782623291015625, -1.7203216552734375, -1.65802001953125, -1.5957183837890625, -1.533416748046875, -1.4711151123046875, -1.4088134765625, -1.3465118408203125, -1.284210205078125, -1.2219085693359375, -1.15960693359375, -1.0973052978515625, -1.035003662109375, -0.9727020263671875, -0.910400390625, -0.8480987548828125, -0.785797119140625, -0.7234954833984375, -0.66119384765625, -0.5988922119140625, -0.536590576171875, -0.4742889404296875, -0.4119873046875, -0.3496856689453125, -0.287384033203125, -0.2250823974609375, -0.16278076171875, -0.1004791259765625, -0.038177490234375, 0.0241241455078125, 0.08642578125, 0.1487274169921875, 0.211029052734375, 0.2733306884765625, 0.33563232421875, 0.3979339599609375, 0.460235595703125, 0.5225372314453125, 0.5848388671875, 0.6471405029296875, 0.709442138671875, 0.7717437744140625, 0.83404541015625, 0.8963470458984375, 0.958648681640625, 1.0209503173828125, 1.083251953125, 1.1455535888671875, 1.207855224609375, 1.2701568603515625, 1.33245849609375, 1.3947601318359375, 1.457061767578125, 1.5193634033203125, 1.5816650390625, 1.6439666748046875, 1.706268310546875, 1.7685699462890625, 1.83087158203125, 1.8931732177734375, 1.955474853515625, 2.0177764892578125, 2.080078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 4.0, 11.0, 20.0, 12.0, 27.0, 42.0, 30.0, 56.0, 70.0, 87.0, 98.0, 148.0, 154.0, 203.0, 302.0, 336.0, 415.0, 804.0, 2427.0, 26081.0, 430114.0, 547936.0, 33229.0, 2965.0, 789.0, 489.0, 348.0, 275.0, 205.0, 190.0, 162.0, 103.0, 89.0, 66.0, 77.0, 53.0, 25.0, 25.0, 18.0, 15.0, 12.0, 14.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5255966186523438, -0.5092010498046875, -0.49280548095703125, -0.476409912109375, -0.46001434326171875, -0.4436187744140625, -0.42722320556640625, -0.41082763671875, -0.39443206787109375, -0.3780364990234375, -0.36164093017578125, -0.345245361328125, -0.32884979248046875, -0.3124542236328125, -0.29605865478515625, -0.2796630859375, -0.26326751708984375, -0.2468719482421875, -0.23047637939453125, -0.214080810546875, -0.19768524169921875, -0.1812896728515625, -0.16489410400390625, -0.14849853515625, -0.13210296630859375, -0.1157073974609375, -0.09931182861328125, -0.082916259765625, -0.06652069091796875, -0.0501251220703125, -0.03372955322265625, -0.017333984375, -0.00093841552734375, 0.0154571533203125, 0.03185272216796875, 0.048248291015625, 0.06464385986328125, 0.0810394287109375, 0.09743499755859375, 0.11383056640625, 0.13022613525390625, 0.1466217041015625, 0.16301727294921875, 0.179412841796875, 0.19580841064453125, 0.2122039794921875, 0.22859954833984375, 0.2449951171875, 0.26139068603515625, 0.2777862548828125, 0.29418182373046875, 0.310577392578125, 0.32697296142578125, 0.3433685302734375, 0.35976409912109375, 0.37615966796875, 0.39255523681640625, 0.4089508056640625, 0.42534637451171875, 0.441741943359375, 0.45813751220703125, 0.4745330810546875, 0.49092864990234375, 0.50732421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 11.0, 10.0, 12.0, 7.0, 12.0, 12.0, 13.0, 20.0, 22.0, 18.0, 24.0, 37.0, 45.0, 32.0, 31.0, 45.0, 57.0, 46.0, 54.0, 39.0, 47.0, 44.0, 35.0, 34.0, 36.0, 33.0, 38.0, 25.0, 33.0, 29.0, 20.0, 12.0, 15.0, 12.0, 15.0, 9.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.208984375, -3.0859375, -2.962890625, -2.83984375, -2.716796875, -2.59375, -2.470703125, -2.34765625, -2.224609375, -2.1015625, -1.978515625, -1.85546875, -1.732421875, -1.609375, -1.486328125, -1.36328125, -1.240234375, -1.1171875, -0.994140625, -0.87109375, -0.748046875, -0.625, -0.501953125, -0.37890625, -0.255859375, -0.1328125, -0.009765625, 0.11328125, 0.236328125, 0.359375, 0.482421875, 0.60546875, 0.728515625, 0.8515625, 0.974609375, 1.09765625, 1.220703125, 1.34375, 1.466796875, 1.58984375, 1.712890625, 1.8359375, 1.958984375, 2.08203125, 2.205078125, 2.328125, 2.451171875, 2.57421875, 2.697265625, 2.8203125, 2.943359375, 3.06640625, 3.189453125, 3.3125, 3.435546875, 3.55859375, 3.681640625, 3.8046875, 3.927734375, 4.05078125, 4.173828125, 4.296875, 4.419921875, 4.54296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 12.0, 10.0, 18.0, 22.0, 48.0, 74.0, 104.0, 220.0, 431.0, 1301.0, 11208.0, 1014973.0, 17526.0, 1597.0, 457.0, 220.0, 130.0, 68.0, 41.0, 23.0, 14.0, 11.0, 7.0, 7.0, 3.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.1294574737548828, -0.12475967407226562, -0.12006187438964844, -0.11536407470703125, -0.11066627502441406, -0.10596847534179688, -0.10127067565917969, -0.0965728759765625, -0.09187507629394531, -0.08717727661132812, -0.08247947692871094, -0.07778167724609375, -0.07308387756347656, -0.06838607788085938, -0.06368827819824219, -0.058990478515625, -0.05429267883300781, -0.049594879150390625, -0.04489707946777344, -0.04019927978515625, -0.03550148010253906, -0.030803680419921875, -0.026105880737304688, -0.0214080810546875, -0.016710281372070312, -0.012012481689453125, -0.0073146820068359375, -0.00261688232421875, 0.0020809173583984375, 0.006778717041015625, 0.011476516723632812, 0.01617431640625, 0.020872116088867188, 0.025569915771484375, 0.030267715454101562, 0.03496551513671875, 0.03966331481933594, 0.044361114501953125, 0.04905891418457031, 0.0537567138671875, 0.05845451354980469, 0.06315231323242188, 0.06785011291503906, 0.07254791259765625, 0.07724571228027344, 0.08194351196289062, 0.08664131164550781, 0.091339111328125, 0.09603691101074219, 0.10073471069335938, 0.10543251037597656, 0.11013031005859375, 0.11482810974121094, 0.11952590942382812, 0.12422370910644531, 0.1289215087890625, 0.1336193084716797, 0.13831710815429688, 0.14301490783691406, 0.14771270751953125, 0.15241050720214844, 0.15710830688476562, 0.1618061065673828, 0.16650390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 9.0, 17.0, 12.0, 24.0, 30.0, 44.0, 54.0, 75.0, 84.0, 65.0, 94.0, 80.0, 82.0, 62.0, 70.0, 56.0, 32.0, 25.0, 15.0, 13.0, 10.0, 4.0, 9.0, 5.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1054019927978516e-05, -3.0104070901870728e-05, -2.915412187576294e-05, -2.820417284965515e-05, -2.7254223823547363e-05, -2.6304274797439575e-05, -2.5354325771331787e-05, -2.4404376745224e-05, -2.345442771911621e-05, -2.2504478693008423e-05, -2.1554529666900635e-05, -2.0604580640792847e-05, -1.965463161468506e-05, -1.870468258857727e-05, -1.7754733562469482e-05, -1.6804784536361694e-05, -1.5854835510253906e-05, -1.4904886484146118e-05, -1.395493745803833e-05, -1.3004988431930542e-05, -1.2055039405822754e-05, -1.1105090379714966e-05, -1.0155141353607178e-05, -9.20519232749939e-06, -8.255243301391602e-06, -7.3052942752838135e-06, -6.355345249176025e-06, -5.405396223068237e-06, -4.455447196960449e-06, -3.505498170852661e-06, -2.555549144744873e-06, -1.605600118637085e-06, -6.556510925292969e-07, 2.942979335784912e-07, 1.2442469596862793e-06, 2.1941959857940674e-06, 3.1441450119018555e-06, 4.0940940380096436e-06, 5.044043064117432e-06, 5.99399209022522e-06, 6.943941116333008e-06, 7.893890142440796e-06, 8.843839168548584e-06, 9.793788194656372e-06, 1.074373722076416e-05, 1.1693686246871948e-05, 1.2643635272979736e-05, 1.3593584299087524e-05, 1.4543533325195312e-05, 1.54934823513031e-05, 1.644343137741089e-05, 1.7393380403518677e-05, 1.8343329429626465e-05, 1.9293278455734253e-05, 2.024322748184204e-05, 2.119317650794983e-05, 2.2143125534057617e-05, 2.3093074560165405e-05, 2.4043023586273193e-05, 2.499297261238098e-05, 2.594292163848877e-05, 2.6892870664596558e-05, 2.7842819690704346e-05, 2.8792768716812134e-05, 2.9742717742919922e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 1.0, 6.0, 3.0, 2.0, 10.0, 13.0, 23.0, 30.0, 74.0, 189.0, 1136.0, 865146.0, 180771.0, 830.0, 138.0, 55.0, 37.0, 23.0, 12.0, 13.0, 4.0, 5.0, 11.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64013671875, -0.6232643127441406, -0.6063919067382812, -0.5895195007324219, -0.5726470947265625, -0.5557746887207031, -0.5389022827148438, -0.5220298767089844, -0.505157470703125, -0.4882850646972656, -0.47141265869140625, -0.4545402526855469, -0.4376678466796875, -0.4207954406738281, -0.40392303466796875, -0.3870506286621094, -0.37017822265625, -0.3533058166503906, -0.33643341064453125, -0.3195610046386719, -0.3026885986328125, -0.2858161926269531, -0.26894378662109375, -0.2520713806152344, -0.235198974609375, -0.21832656860351562, -0.20145416259765625, -0.18458175659179688, -0.1677093505859375, -0.15083694458007812, -0.13396453857421875, -0.11709213256835938, -0.1002197265625, -0.08334732055664062, -0.06647491455078125, -0.049602508544921875, -0.0327301025390625, -0.015857696533203125, 0.00101470947265625, 0.017887115478515625, 0.034759521484375, 0.051631927490234375, 0.06850433349609375, 0.08537673950195312, 0.1022491455078125, 0.11912155151367188, 0.13599395751953125, 0.15286636352539062, 0.16973876953125, 0.18661117553710938, 0.20348358154296875, 0.22035598754882812, 0.2372283935546875, 0.2541007995605469, 0.27097320556640625, 0.2878456115722656, 0.304718017578125, 0.3215904235839844, 0.33846282958984375, 0.3553352355957031, 0.3722076416015625, 0.3890800476074219, 0.40595245361328125, 0.4228248596191406, 0.439697265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 1.0, 9.0, 15.0, 12.0, 24.0, 38.0, 65.0, 85.0, 186.0, 201.0, 135.0, 54.0, 43.0, 26.0, 27.0, 11.0, 11.0, 7.0, 5.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.039794921875, -0.0386965274810791, -0.0375981330871582, -0.036499738693237305, -0.035401344299316406, -0.03430294990539551, -0.03320455551147461, -0.03210616111755371, -0.031007766723632812, -0.029909372329711914, -0.028810977935791016, -0.027712583541870117, -0.02661418914794922, -0.02551579475402832, -0.024417400360107422, -0.023319005966186523, -0.022220611572265625, -0.021122217178344727, -0.020023822784423828, -0.01892542839050293, -0.01782703399658203, -0.016728639602661133, -0.015630245208740234, -0.014531850814819336, -0.013433456420898438, -0.012335062026977539, -0.01123666763305664, -0.010138273239135742, -0.009039878845214844, -0.007941484451293945, -0.006843090057373047, -0.0057446956634521484, -0.00464630126953125, -0.0035479068756103516, -0.002449512481689453, -0.0013511180877685547, -0.00025272369384765625, 0.0008456707000732422, 0.0019440650939941406, 0.003042459487915039, 0.0041408538818359375, 0.005239248275756836, 0.006337642669677734, 0.007436037063598633, 0.008534431457519531, 0.00963282585144043, 0.010731220245361328, 0.011829614639282227, 0.012928009033203125, 0.014026403427124023, 0.015124797821044922, 0.01622319221496582, 0.01732158660888672, 0.018419981002807617, 0.019518375396728516, 0.020616769790649414, 0.021715164184570312, 0.02281355857849121, 0.02391195297241211, 0.025010347366333008, 0.026108741760253906, 0.027207136154174805, 0.028305530548095703, 0.0294039249420166, 0.0305023193359375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 7.0, 50.0, 171.0, 341.0, 274.0, 94.0, 30.0, 14.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.264389991760254, -12.961758613586426, -12.659126281738281, -12.356494903564453, -12.053863525390625, -11.75123119354248, -11.448599815368652, -11.145967483520508, -10.84333610534668, -10.540704727172852, -10.238072395324707, -9.935441017150879, -9.632808685302734, -9.330177307128906, -9.027545928955078, -8.72491455078125, -8.422282218933105, -8.119650840759277, -7.817018508911133, -7.514387130737305, -7.211755275726318, -6.909123420715332, -6.606492042541504, -6.303860187530518, -6.001228332519531, -5.698596477508545, -5.395964622497559, -5.0933332443237305, -4.790701389312744, -4.488069534301758, -4.18543815612793, -3.8828063011169434, -3.580173969268799, -3.2775421142578125, -2.9749104976654053, -2.672278881072998, -2.3696470260620117, -2.0670151710510254, -1.7643835544586182, -1.461751937866211, -1.1591200828552246, -0.8564883470535278, -0.553856611251831, -0.2512248754501343, 0.0514068603515625, 0.3540385961532593, 0.656670331954956, 0.9593019485473633, 1.2619338035583496, 1.5645655393600464, 1.8671972751617432, 2.1698288917541504, 2.4724607467651367, 2.775092601776123, 3.0777242183685303, 3.3803558349609375, 3.682987689971924, 3.98561954498291, 4.288250923156738, 4.590882778167725, 4.893514633178711, 5.196146488189697, 5.498778343200684, 5.801409721374512, 6.104041576385498]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 11.0, 16.0, 16.0, 14.0, 38.0, 33.0, 29.0, 33.0, 42.0, 57.0, 46.0, 50.0, 43.0, 49.0, 55.0, 58.0, 37.0, 52.0, 42.0, 48.0, 45.0, 34.0, 37.0, 24.0, 21.0, 20.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880835771560669, -1.813689947128296, -1.7465442419052124, -1.6793984174728394, -1.6122527122497559, -1.5451068878173828, -1.4779610633850098, -1.4108152389526367, -1.3436695337295532, -1.2765237092971802, -1.2093780040740967, -1.1422321796417236, -1.0750863552093506, -1.007940649986267, -0.940794825553894, -0.8736490607261658, -0.8065032958984375, -0.7393575310707092, -0.672211766242981, -0.6050659418106079, -0.5379201769828796, -0.47077441215515137, -0.4036286175251007, -0.33648282289505005, -0.2693370580673218, -0.2021912783384323, -0.13504549860954285, -0.06789971888065338, -0.000753939151763916, 0.06639182567596436, 0.13353762030601501, 0.20068341493606567, 0.26782894134521484, 0.3349747061729431, 0.4021205008029938, 0.46926629543304443, 0.5364120602607727, 0.603557825088501, 0.670703649520874, 0.7378494143486023, 0.8049951791763306, 0.8721409440040588, 0.9392867088317871, 1.0064325332641602, 1.0735783576965332, 1.1407240629196167, 1.2078698873519897, 1.2750155925750732, 1.3421614170074463, 1.4093072414398193, 1.4764529466629028, 1.5435987710952759, 1.6107444763183594, 1.6778903007507324, 1.7450361251831055, 1.8121819496154785, 1.879327654838562, 1.946473479270935, 2.0136191844940186, 2.0807650089263916, 2.1479108333587646, 2.2150564193725586, 2.2822022438049316, 2.3493480682373047, 2.4164938926696777]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 11.0, 6.0, 14.0, 8.0, 30.0, 44.0, 59.0, 89.0, 151.0, 305.0, 498.0, 928.0, 1760.0, 3359.0, 7088.0, 17495.0, 61316.0, 291386.0, 488149.0, 125693.0, 29619.0, 10673.0, 4759.0, 2363.0, 1214.0, 626.0, 347.0, 213.0, 132.0, 76.0, 50.0, 30.0, 21.0, 19.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.425506591796875, -1.37835693359375, -1.331207275390625, -1.2840576171875, -1.236907958984375, -1.18975830078125, -1.142608642578125, -1.095458984375, -1.048309326171875, -1.00115966796875, -0.954010009765625, -0.9068603515625, -0.859710693359375, -0.81256103515625, -0.765411376953125, -0.71826171875, -0.671112060546875, -0.62396240234375, -0.576812744140625, -0.5296630859375, -0.482513427734375, -0.43536376953125, -0.388214111328125, -0.341064453125, -0.293914794921875, -0.24676513671875, -0.199615478515625, -0.1524658203125, -0.105316162109375, -0.05816650390625, -0.011016845703125, 0.0361328125, 0.083282470703125, 0.13043212890625, 0.177581787109375, 0.2247314453125, 0.271881103515625, 0.31903076171875, 0.366180419921875, 0.413330078125, 0.460479736328125, 0.50762939453125, 0.554779052734375, 0.6019287109375, 0.649078369140625, 0.69622802734375, 0.743377685546875, 0.79052734375, 0.837677001953125, 0.88482666015625, 0.931976318359375, 0.9791259765625, 1.026275634765625, 1.07342529296875, 1.120574951171875, 1.167724609375, 1.214874267578125, 1.26202392578125, 1.309173583984375, 1.3563232421875, 1.403472900390625, 1.45062255859375, 1.497772216796875, 1.544921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 8.0, 10.0, 15.0, 24.0, 39.0, 54.0, 56.0, 62.0, 71.0, 64.0, 72.0, 92.0, 83.0, 81.0, 57.0, 55.0, 50.0, 29.0, 20.0, 19.0, 14.0, 8.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2325439453125, -8.847900390625, -8.4632568359375, -8.07861328125, -7.6939697265625, -7.309326171875, -6.9246826171875, -6.5400390625, -6.1553955078125, -5.770751953125, -5.3861083984375, -5.00146484375, -4.6168212890625, -4.232177734375, -3.8475341796875, -3.462890625, -3.0782470703125, -2.693603515625, -2.3089599609375, -1.92431640625, -1.5396728515625, -1.155029296875, -0.7703857421875, -0.3857421875, -0.0010986328125, 0.383544921875, 0.7681884765625, 1.15283203125, 1.5374755859375, 1.922119140625, 2.3067626953125, 2.69140625, 3.0760498046875, 3.460693359375, 3.8453369140625, 4.22998046875, 4.6146240234375, 4.999267578125, 5.3839111328125, 5.7685546875, 6.1531982421875, 6.537841796875, 6.9224853515625, 7.30712890625, 7.6917724609375, 8.076416015625, 8.4610595703125, 8.845703125, 9.2303466796875, 9.614990234375, 9.9996337890625, 10.38427734375, 10.7689208984375, 11.153564453125, 11.5382080078125, 11.9228515625, 12.3074951171875, 12.692138671875, 13.0767822265625, 13.46142578125, 13.8460693359375, 14.230712890625, 14.6153564453125, 15.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 12.0, 16.0, 20.0, 23.0, 31.0, 44.0, 77.0, 100.0, 236.0, 717.0, 24768.0, 1019443.0, 2207.0, 353.0, 160.0, 108.0, 50.0, 54.0, 27.0, 21.0, 22.0, 18.0, 10.0, 3.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.26123046875, -11.8271484375, -11.39306640625, -10.958984375, -10.52490234375, -10.0908203125, -9.65673828125, -9.22265625, -8.78857421875, -8.3544921875, -7.92041015625, -7.486328125, -7.05224609375, -6.6181640625, -6.18408203125, -5.75, -5.31591796875, -4.8818359375, -4.44775390625, -4.013671875, -3.57958984375, -3.1455078125, -2.71142578125, -2.27734375, -1.84326171875, -1.4091796875, -0.97509765625, -0.541015625, -0.10693359375, 0.3271484375, 0.76123046875, 1.1953125, 1.62939453125, 2.0634765625, 2.49755859375, 2.931640625, 3.36572265625, 3.7998046875, 4.23388671875, 4.66796875, 5.10205078125, 5.5361328125, 5.97021484375, 6.404296875, 6.83837890625, 7.2724609375, 7.70654296875, 8.140625, 8.57470703125, 9.0087890625, 9.44287109375, 9.876953125, 10.31103515625, 10.7451171875, 11.17919921875, 11.61328125, 12.04736328125, 12.4814453125, 12.91552734375, 13.349609375, 13.78369140625, 14.2177734375, 14.65185546875, 15.0859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 8.0, 15.0, 16.0, 33.0, 27.0, 56.0, 52.0, 63.0, 78.0, 69.0, 97.0, 71.0, 79.0, 70.0, 55.0, 61.0, 31.0, 25.0, 17.0, 22.0, 13.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.13232421875, -9.7490234375, -9.36572265625, -8.982421875, -8.59912109375, -8.2158203125, -7.83251953125, -7.44921875, -7.06591796875, -6.6826171875, -6.29931640625, -5.916015625, -5.53271484375, -5.1494140625, -4.76611328125, -4.3828125, -3.99951171875, -3.6162109375, -3.23291015625, -2.849609375, -2.46630859375, -2.0830078125, -1.69970703125, -1.31640625, -0.93310546875, -0.5498046875, -0.16650390625, 0.216796875, 0.60009765625, 0.9833984375, 1.36669921875, 1.75, 2.13330078125, 2.5166015625, 2.89990234375, 3.283203125, 3.66650390625, 4.0498046875, 4.43310546875, 4.81640625, 5.19970703125, 5.5830078125, 5.96630859375, 6.349609375, 6.73291015625, 7.1162109375, 7.49951171875, 7.8828125, 8.26611328125, 8.6494140625, 9.03271484375, 9.416015625, 9.79931640625, 10.1826171875, 10.56591796875, 10.94921875, 11.33251953125, 11.7158203125, 12.09912109375, 12.482421875, 12.86572265625, 13.2490234375, 13.63232421875, 14.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 13.0, 8.0, 18.0, 29.0, 54.0, 124.0, 293.0, 972.0, 4341.0, 39233.0, 958648.0, 38984.0, 4280.0, 976.0, 318.0, 119.0, 67.0, 42.0, 5.0, 10.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1757354736328125, -1.139556884765625, -1.1033782958984375, -1.06719970703125, -1.0310211181640625, -0.994842529296875, -0.9586639404296875, -0.9224853515625, -0.8863067626953125, -0.850128173828125, -0.8139495849609375, -0.77777099609375, -0.7415924072265625, -0.705413818359375, -0.6692352294921875, -0.633056640625, -0.5968780517578125, -0.560699462890625, -0.5245208740234375, -0.48834228515625, -0.4521636962890625, -0.415985107421875, -0.3798065185546875, -0.3436279296875, -0.3074493408203125, -0.271270751953125, -0.2350921630859375, -0.19891357421875, -0.1627349853515625, -0.126556396484375, -0.0903778076171875, -0.05419921875, -0.0180206298828125, 0.018157958984375, 0.0543365478515625, 0.09051513671875, 0.1266937255859375, 0.162872314453125, 0.1990509033203125, 0.2352294921875, 0.2714080810546875, 0.307586669921875, 0.3437652587890625, 0.37994384765625, 0.4161224365234375, 0.452301025390625, 0.4884796142578125, 0.524658203125, 0.5608367919921875, 0.597015380859375, 0.6331939697265625, 0.66937255859375, 0.7055511474609375, 0.741729736328125, 0.7779083251953125, 0.8140869140625, 0.8502655029296875, 0.886444091796875, 0.9226226806640625, 0.95880126953125, 0.9949798583984375, 1.031158447265625, 1.0673370361328125, 1.103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 13.0, 21.0, 36.0, 67.0, 111.0, 331.0, 211.0, 74.0, 46.0, 22.0, 14.0, 14.0, 6.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018167495727539062, -0.00017672404646873474, -0.00017177313566207886, -0.00016682222485542297, -0.0001618713140487671, -0.0001569204032421112, -0.00015196949243545532, -0.00014701858162879944, -0.00014206767082214355, -0.00013711676001548767, -0.0001321658492088318, -0.0001272149384021759, -0.00012226402759552002, -0.00011731311678886414, -0.00011236220598220825, -0.00010741129517555237, -0.00010246038436889648, -9.75094735622406e-05, -9.255856275558472e-05, -8.760765194892883e-05, -8.265674114227295e-05, -7.770583033561707e-05, -7.275491952896118e-05, -6.78040087223053e-05, -6.285309791564941e-05, -5.790218710899353e-05, -5.2951276302337646e-05, -4.800036549568176e-05, -4.304945468902588e-05, -3.8098543882369995e-05, -3.314763307571411e-05, -2.8196722269058228e-05, -2.3245811462402344e-05, -1.829490065574646e-05, -1.3343989849090576e-05, -8.393079042434692e-06, -3.4421682357788086e-06, 1.5087425708770752e-06, 6.459653377532959e-06, 1.1410564184188843e-05, 1.6361474990844727e-05, 2.131238579750061e-05, 2.6263296604156494e-05, 3.121420741081238e-05, 3.616511821746826e-05, 4.1116029024124146e-05, 4.606693983078003e-05, 5.101785063743591e-05, 5.59687614440918e-05, 6.091967225074768e-05, 6.587058305740356e-05, 7.082149386405945e-05, 7.577240467071533e-05, 8.072331547737122e-05, 8.56742262840271e-05, 9.062513709068298e-05, 9.557604789733887e-05, 0.00010052695870399475, 0.00010547786951065063, 0.00011042878031730652, 0.0001153796911239624, 0.00012033060193061829, 0.00012528151273727417, 0.00013023242354393005, 0.00013518333435058594]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 13.0, 10.0, 10.0, 18.0, 18.0, 27.0, 66.0, 112.0, 234.0, 630.0, 2214.0, 12797.0, 671016.0, 346361.0, 11746.0, 2154.0, 633.0, 194.0, 97.0, 65.0, 30.0, 18.0, 21.0, 16.0, 7.0, 3.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0673828125, -1.032928466796875, -0.99847412109375, -0.964019775390625, -0.9295654296875, -0.895111083984375, -0.86065673828125, -0.826202392578125, -0.791748046875, -0.757293701171875, -0.72283935546875, -0.688385009765625, -0.6539306640625, -0.619476318359375, -0.58502197265625, -0.550567626953125, -0.51611328125, -0.481658935546875, -0.44720458984375, -0.412750244140625, -0.3782958984375, -0.343841552734375, -0.30938720703125, -0.274932861328125, -0.240478515625, -0.206024169921875, -0.17156982421875, -0.137115478515625, -0.1026611328125, -0.068206787109375, -0.03375244140625, 0.000701904296875, 0.03515625, 0.069610595703125, 0.10406494140625, 0.138519287109375, 0.1729736328125, 0.207427978515625, 0.24188232421875, 0.276336669921875, 0.310791015625, 0.345245361328125, 0.37969970703125, 0.414154052734375, 0.4486083984375, 0.483062744140625, 0.51751708984375, 0.551971435546875, 0.58642578125, 0.620880126953125, 0.65533447265625, 0.689788818359375, 0.7242431640625, 0.758697509765625, 0.79315185546875, 0.827606201171875, 0.862060546875, 0.896514892578125, 0.93096923828125, 0.965423583984375, 0.9998779296875, 1.034332275390625, 1.06878662109375, 1.103240966796875, 1.1376953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 15.0, 11.0, 12.0, 25.0, 27.0, 47.0, 61.0, 88.0, 343.0, 87.0, 60.0, 49.0, 30.0, 16.0, 13.0, 11.0, 18.0, 14.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.1877593994140625, -0.180694580078125, -0.1736297607421875, -0.16656494140625, -0.1595001220703125, -0.152435302734375, -0.1453704833984375, -0.1383056640625, -0.1312408447265625, -0.124176025390625, -0.1171112060546875, -0.11004638671875, -0.1029815673828125, -0.095916748046875, -0.0888519287109375, -0.081787109375, -0.0747222900390625, -0.067657470703125, -0.0605926513671875, -0.05352783203125, -0.0464630126953125, -0.039398193359375, -0.0323333740234375, -0.0252685546875, -0.0182037353515625, -0.011138916015625, -0.0040740966796875, 0.00299072265625, 0.0100555419921875, 0.017120361328125, 0.0241851806640625, 0.03125, 0.0383148193359375, 0.045379638671875, 0.0524444580078125, 0.05950927734375, 0.0665740966796875, 0.073638916015625, 0.0807037353515625, 0.0877685546875, 0.0948333740234375, 0.101898193359375, 0.1089630126953125, 0.11602783203125, 0.1230926513671875, 0.130157470703125, 0.1372222900390625, 0.144287109375, 0.1513519287109375, 0.158416748046875, 0.1654815673828125, 0.17254638671875, 0.1796112060546875, 0.186676025390625, 0.1937408447265625, 0.2008056640625, 0.2078704833984375, 0.214935302734375, 0.2220001220703125, 0.22906494140625, 0.2361297607421875, 0.243194580078125, 0.2502593994140625, 0.25732421875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 70.0, 491.0, 376.0, 53.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.29172134399414, -49.37619400024414, -48.46066665649414, -47.54513931274414, -46.629615783691406, -45.714088439941406, -44.798561096191406, -43.883033752441406, -42.967506408691406, -42.051979064941406, -41.136451721191406, -40.220924377441406, -39.30540084838867, -38.38987350463867, -37.47434616088867, -36.55881881713867, -35.64329147338867, -34.72776412963867, -33.81223678588867, -32.89670944213867, -31.981184005737305, -31.065658569335938, -30.150131225585938, -29.234603881835938, -28.31907844543457, -27.40355110168457, -26.488025665283203, -25.572498321533203, -24.656970977783203, -23.741443634033203, -22.825918197631836, -21.910390853881836, -20.99486541748047, -20.07933807373047, -19.1638126373291, -18.2482852935791, -17.3327579498291, -16.417232513427734, -15.501705169677734, -14.586177825927734, -13.670650482177734, -12.75512409210205, -11.83959674835205, -10.924070358276367, -10.008543014526367, -9.093016624450684, -8.177490234375, -7.261962890625, -6.346435546875, -5.430908679962158, -4.515381813049316, -3.5998551845550537, -2.684328317642212, -1.7688016891479492, -0.8532748222351074, 0.062252044677734375, 0.9777789115905762, 1.893305778503418, 2.8088326454162598, 3.7243592739105225, 4.639885902404785, 5.555412769317627, 6.470939636230469, 7.3864665031433105, 8.301993370056152]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 9.0, 5.0, 12.0, 7.0, 6.0, 12.0, 19.0, 10.0, 29.0, 21.0, 26.0, 21.0, 23.0, 29.0, 27.0, 32.0, 34.0, 48.0, 39.0, 32.0, 45.0, 35.0, 49.0, 45.0, 42.0, 35.0, 31.0, 24.0, 35.0, 27.0, 21.0, 24.0, 26.0, 21.0, 15.0, 17.0, 11.0, 7.0, 8.0, 11.0, 6.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.610380172729492, -9.327811241149902, -9.045243263244629, -8.762674331665039, -8.48010540008545, -8.19753646850586, -7.914968490600586, -7.632399559020996, -7.3498311042785645, -7.067262649536133, -6.784693717956543, -6.502125263214111, -6.21955680847168, -5.93698787689209, -5.654419422149658, -5.371850967407227, -5.089282035827637, -4.806713581085205, -4.524144649505615, -4.241576194763184, -3.959007501602173, -3.676438808441162, -3.3938703536987305, -3.1113016605377197, -2.828732967376709, -2.5461642742156982, -2.2635955810546875, -1.9810271263122559, -1.6984584331512451, -1.4158897399902344, -1.1333211660385132, -0.850752592086792, -0.5681829452514648, -0.2856143116950989, -0.00304567813873291, 0.27952295541763306, 0.562091588973999, 0.8446602821350098, 1.127228856086731, 1.4097974300384521, 1.692366123199463, 1.9749348163604736, 2.2575035095214844, 2.540071964263916, 2.8226406574249268, 3.1052093505859375, 3.387777805328369, 3.67034649848938, 3.9529151916503906, 4.235483646392822, 4.518052577972412, 4.800621032714844, 5.083189964294434, 5.365758419036865, 5.648326873779297, 5.930895805358887, 6.213464260101318, 6.49603271484375, 6.77860164642334, 7.0611701011657715, 7.343738555908203, 7.626307487487793, 7.908875942230225, 8.191444396972656, 8.474013328552246]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 11.0, 16.0, 21.0, 37.0, 51.0, 80.0, 121.0, 208.0, 474.0, 1400.0, 5452.0, 28731.0, 375639.0, 3621025.0, 138828.0, 16768.0, 3492.0, 1038.0, 381.0, 182.0, 114.0, 56.0, 49.0, 27.0, 23.0, 16.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.94921875, -4.81304931640625, -4.6768798828125, -4.54071044921875, -4.404541015625, -4.26837158203125, -4.1322021484375, -3.99603271484375, -3.85986328125, -3.72369384765625, -3.5875244140625, -3.45135498046875, -3.315185546875, -3.17901611328125, -3.0428466796875, -2.90667724609375, -2.7705078125, -2.63433837890625, -2.4981689453125, -2.36199951171875, -2.225830078125, -2.08966064453125, -1.9534912109375, -1.81732177734375, -1.68115234375, -1.54498291015625, -1.4088134765625, -1.27264404296875, -1.136474609375, -1.00030517578125, -0.8641357421875, -0.72796630859375, -0.591796875, -0.45562744140625, -0.3194580078125, -0.18328857421875, -0.047119140625, 0.08905029296875, 0.2252197265625, 0.36138916015625, 0.49755859375, 0.63372802734375, 0.7698974609375, 0.90606689453125, 1.042236328125, 1.17840576171875, 1.3145751953125, 1.45074462890625, 1.5869140625, 1.72308349609375, 1.8592529296875, 1.99542236328125, 2.131591796875, 2.26776123046875, 2.4039306640625, 2.54010009765625, 2.67626953125, 2.81243896484375, 2.9486083984375, 3.08477783203125, 3.220947265625, 3.35711669921875, 3.4932861328125, 3.62945556640625, 3.765625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 5.0, 7.0, 10.0, 17.0, 9.0, 14.0, 13.0, 24.0, 24.0, 28.0, 25.0, 25.0, 36.0, 38.0, 41.0, 54.0, 52.0, 40.0, 40.0, 42.0, 36.0, 37.0, 31.0, 45.0, 37.0, 39.0, 30.0, 26.0, 28.0, 27.0, 29.0, 14.0, 8.0, 12.0, 12.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.7255859375, -1.674560546875, -1.62353515625, -1.572509765625, -1.521484375, -1.470458984375, -1.41943359375, -1.368408203125, -1.3173828125, -1.266357421875, -1.21533203125, -1.164306640625, -1.11328125, -1.062255859375, -1.01123046875, -0.960205078125, -0.9091796875, -0.858154296875, -0.80712890625, -0.756103515625, -0.705078125, -0.654052734375, -0.60302734375, -0.552001953125, -0.5009765625, -0.449951171875, -0.39892578125, -0.347900390625, -0.296875, -0.245849609375, -0.19482421875, -0.143798828125, -0.0927734375, -0.041748046875, 0.00927734375, 0.060302734375, 0.111328125, 0.162353515625, 0.21337890625, 0.264404296875, 0.3154296875, 0.366455078125, 0.41748046875, 0.468505859375, 0.51953125, 0.570556640625, 0.62158203125, 0.672607421875, 0.7236328125, 0.774658203125, 0.82568359375, 0.876708984375, 0.927734375, 0.978759765625, 1.02978515625, 1.080810546875, 1.1318359375, 1.182861328125, 1.23388671875, 1.284912109375, 1.3359375, 1.386962890625, 1.43798828125, 1.489013671875, 1.5400390625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 15.0, 16.0, 31.0, 78.0, 313.0, 47126.0, 4146125.0, 377.0, 111.0, 52.0, 12.0, 9.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.8720703125, -40.525390625, -39.1787109375, -37.83203125, -36.4853515625, -35.138671875, -33.7919921875, -32.4453125, -31.0986328125, -29.751953125, -28.4052734375, -27.05859375, -25.7119140625, -24.365234375, -23.0185546875, -21.671875, -20.3251953125, -18.978515625, -17.6318359375, -16.28515625, -14.9384765625, -13.591796875, -12.2451171875, -10.8984375, -9.5517578125, -8.205078125, -6.8583984375, -5.51171875, -4.1650390625, -2.818359375, -1.4716796875, -0.125, 1.2216796875, 2.568359375, 3.9150390625, 5.26171875, 6.6083984375, 7.955078125, 9.3017578125, 10.6484375, 11.9951171875, 13.341796875, 14.6884765625, 16.03515625, 17.3818359375, 18.728515625, 20.0751953125, 21.421875, 22.7685546875, 24.115234375, 25.4619140625, 26.80859375, 28.1552734375, 29.501953125, 30.8486328125, 32.1953125, 33.5419921875, 34.888671875, 36.2353515625, 37.58203125, 38.9287109375, 40.275390625, 41.6220703125, 42.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 3.0, 6.0, 10.0, 20.0, 17.0, 40.0, 44.0, 79.0, 133.0, 186.0, 368.0, 952.0, 1139.0, 462.0, 204.0, 121.0, 96.0, 57.0, 35.0, 26.0, 17.0, 16.0, 8.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8556671142578125, -0.829010009765625, -0.8023529052734375, -0.77569580078125, -0.7490386962890625, -0.722381591796875, -0.6957244873046875, -0.6690673828125, -0.6424102783203125, -0.615753173828125, -0.5890960693359375, -0.56243896484375, -0.5357818603515625, -0.509124755859375, -0.4824676513671875, -0.455810546875, -0.4291534423828125, -0.402496337890625, -0.3758392333984375, -0.34918212890625, -0.3225250244140625, -0.295867919921875, -0.2692108154296875, -0.2425537109375, -0.2158966064453125, -0.189239501953125, -0.1625823974609375, -0.13592529296875, -0.1092681884765625, -0.082611083984375, -0.0559539794921875, -0.029296875, -0.0026397705078125, 0.024017333984375, 0.0506744384765625, 0.07733154296875, 0.1039886474609375, 0.130645751953125, 0.1573028564453125, 0.1839599609375, 0.2106170654296875, 0.237274169921875, 0.2639312744140625, 0.29058837890625, 0.3172454833984375, 0.343902587890625, 0.3705596923828125, 0.397216796875, 0.4238739013671875, 0.450531005859375, 0.4771881103515625, 0.50384521484375, 0.5305023193359375, 0.557159423828125, 0.5838165283203125, 0.6104736328125, 0.6371307373046875, 0.663787841796875, 0.6904449462890625, 0.71710205078125, 0.7437591552734375, 0.770416259765625, 0.7970733642578125, 0.82373046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 14.0, 16.0, 82.0, 246.0, 376.0, 190.0, 48.0, 16.0, 6.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.284709930419922, -16.941699981689453, -16.598691940307617, -16.25568199157715, -15.912673950195312, -15.56966495513916, -15.226655960083008, -14.883646011352539, -14.540637969970703, -14.19762897491455, -13.854619979858398, -13.511610984802246, -13.168601989746094, -12.825592994689941, -12.482583999633789, -12.13957405090332, -11.796565055847168, -11.453556060791016, -11.110547065734863, -10.767538070678711, -10.424529075622559, -10.081520080566406, -9.738510131835938, -9.395502090454102, -9.052492141723633, -8.70948314666748, -8.366474151611328, -8.023465156555176, -7.680456161499023, -7.337447166442871, -6.9944376945495605, -6.651428699493408, -6.3084211349487305, -5.965412139892578, -5.622403144836426, -5.279394149780273, -4.936385154724121, -4.593376159667969, -4.250366687774658, -3.907357692718506, -3.5643486976623535, -3.221339702606201, -2.878330707550049, -2.5353214740753174, -2.192312479019165, -1.8493034839630127, -1.5062942504882812, -1.163285255432129, -0.8202762603759766, -0.47726720571517944, -0.13425815105438232, 0.20875096321105957, 0.5517599582672119, 0.8947689533233643, 1.2377781867980957, 1.580787181854248, 1.9237961769104004, 2.2668051719665527, 2.609814167022705, 2.9528234004974365, 3.295832395553589, 3.638841390609741, 3.9818506240844727, 4.324859619140625, 4.667868614196777]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 14.0, 17.0, 21.0, 15.0, 15.0, 30.0, 21.0, 35.0, 27.0, 33.0, 33.0, 32.0, 44.0, 32.0, 47.0, 43.0, 46.0, 45.0, 40.0, 48.0, 29.0, 25.0, 27.0, 38.0, 38.0, 24.0, 17.0, 31.0, 20.0, 18.0, 9.0, 12.0, 9.0, 11.0, 6.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8065723180770874, -1.7518330812454224, -1.6970938444137573, -1.6423547267913818, -1.5876154899597168, -1.5328762531280518, -1.4781370162963867, -1.4233977794647217, -1.3686585426330566, -1.3139193058013916, -1.2591800689697266, -1.2044408321380615, -1.149701714515686, -1.094962477684021, -1.040223240852356, -0.9854840040206909, -0.9307448863983154, -0.8760056495666504, -0.8212664723396301, -0.7665272355079651, -0.7117880582809448, -0.6570488214492798, -0.6023095846176147, -0.5475703477859497, -0.49283117055892944, -0.4380919635295868, -0.38335275650024414, -0.3286135196685791, -0.27387431263923645, -0.2191351056098938, -0.16439586877822876, -0.10965666174888611, -0.054917335510253906, -0.00017812103033065796, 0.05456109344959259, 0.10930031538009644, 0.1640395224094391, 0.21877872943878174, 0.2735179662704468, 0.32825717329978943, 0.3829963803291321, 0.43773558735847473, 0.4924747943878174, 0.5472140312194824, 0.6019532680511475, 0.6566924452781677, 0.7114316821098328, 0.766170859336853, 0.8209100961685181, 0.8756493330001831, 0.9303885102272034, 0.9851277470588684, 1.0398669242858887, 1.0946061611175537, 1.1493453979492188, 1.2040846347808838, 1.2588238716125488, 1.3135631084442139, 1.368302345275879, 1.423041582107544, 1.4777806997299194, 1.5325199365615845, 1.5872591733932495, 1.6419984102249146, 1.69673752784729]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 12.0, 11.0, 10.0, 28.0, 43.0, 62.0, 75.0, 108.0, 148.0, 231.0, 351.0, 504.0, 787.0, 1185.0, 2220.0, 5506.0, 23307.0, 186925.0, 695014.0, 107119.0, 15576.0, 4244.0, 1810.0, 1121.0, 684.0, 463.0, 303.0, 194.0, 157.0, 107.0, 61.0, 54.0, 36.0, 17.0, 17.0, 16.0, 10.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.429931640625, -0.41811370849609375, -0.4062957763671875, -0.39447784423828125, -0.382659912109375, -0.37084197998046875, -0.3590240478515625, -0.34720611572265625, -0.33538818359375, -0.32357025146484375, -0.3117523193359375, -0.29993438720703125, -0.288116455078125, -0.27629852294921875, -0.2644805908203125, -0.25266265869140625, -0.2408447265625, -0.22902679443359375, -0.2172088623046875, -0.20539093017578125, -0.193572998046875, -0.18175506591796875, -0.1699371337890625, -0.15811920166015625, -0.14630126953125, -0.13448333740234375, -0.1226654052734375, -0.11084747314453125, -0.099029541015625, -0.08721160888671875, -0.0753936767578125, -0.06357574462890625, -0.0517578125, -0.03993988037109375, -0.0281219482421875, -0.01630401611328125, -0.004486083984375, 0.00733184814453125, 0.0191497802734375, 0.03096771240234375, 0.04278564453125, 0.05460357666015625, 0.0664215087890625, 0.07823944091796875, 0.090057373046875, 0.10187530517578125, 0.1136932373046875, 0.12551116943359375, 0.1373291015625, 0.14914703369140625, 0.1609649658203125, 0.17278289794921875, 0.184600830078125, 0.19641876220703125, 0.2082366943359375, 0.22005462646484375, 0.23187255859375, 0.24369049072265625, 0.2555084228515625, 0.26732635498046875, 0.279144287109375, 0.29096221923828125, 0.3027801513671875, 0.31459808349609375, 0.326416015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 3.0, 4.0, 10.0, 14.0, 20.0, 14.0, 18.0, 26.0, 22.0, 26.0, 41.0, 41.0, 32.0, 31.0, 52.0, 49.0, 39.0, 57.0, 42.0, 39.0, 53.0, 37.0, 48.0, 43.0, 25.0, 31.0, 26.0, 21.0, 24.0, 19.0, 18.0, 11.0, 10.0, 10.0, 11.0, 5.0, 8.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4951171875, -1.453369140625, -1.41162109375, -1.369873046875, -1.328125, -1.286376953125, -1.24462890625, -1.202880859375, -1.1611328125, -1.119384765625, -1.07763671875, -1.035888671875, -0.994140625, -0.952392578125, -0.91064453125, -0.868896484375, -0.8271484375, -0.785400390625, -0.74365234375, -0.701904296875, -0.66015625, -0.618408203125, -0.57666015625, -0.534912109375, -0.4931640625, -0.451416015625, -0.40966796875, -0.367919921875, -0.326171875, -0.284423828125, -0.24267578125, -0.200927734375, -0.1591796875, -0.117431640625, -0.07568359375, -0.033935546875, 0.0078125, 0.049560546875, 0.09130859375, 0.133056640625, 0.1748046875, 0.216552734375, 0.25830078125, 0.300048828125, 0.341796875, 0.383544921875, 0.42529296875, 0.467041015625, 0.5087890625, 0.550537109375, 0.59228515625, 0.634033203125, 0.67578125, 0.717529296875, 0.75927734375, 0.801025390625, 0.8427734375, 0.884521484375, 0.92626953125, 0.968017578125, 1.009765625, 1.051513671875, 1.09326171875, 1.135009765625, 1.1767578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 5.0, 13.0, 15.0, 21.0, 23.0, 22.0, 44.0, 48.0, 67.0, 74.0, 96.0, 125.0, 175.0, 208.0, 254.0, 364.0, 581.0, 1256.0, 5909.0, 54955.0, 591416.0, 355772.0, 30372.0, 3806.0, 951.0, 476.0, 341.0, 230.0, 189.0, 148.0, 123.0, 99.0, 73.0, 57.0, 42.0, 49.0, 28.0, 26.0, 19.0, 16.0, 9.0, 12.0, 12.0, 8.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2177734375, -0.21072006225585938, -0.20366668701171875, -0.19661331176757812, -0.1895599365234375, -0.18250656127929688, -0.17545318603515625, -0.16839981079101562, -0.161346435546875, -0.15429306030273438, -0.14723968505859375, -0.14018630981445312, -0.1331329345703125, -0.12607955932617188, -0.11902618408203125, -0.11197280883789062, -0.10491943359375, -0.09786605834960938, -0.09081268310546875, -0.08375930786132812, -0.0767059326171875, -0.06965255737304688, -0.06259918212890625, -0.055545806884765625, -0.048492431640625, -0.041439056396484375, -0.03438568115234375, -0.027332305908203125, -0.0202789306640625, -0.013225555419921875, -0.00617218017578125, 0.000881195068359375, 0.0079345703125, 0.014987945556640625, 0.02204132080078125, 0.029094696044921875, 0.0361480712890625, 0.043201446533203125, 0.05025482177734375, 0.057308197021484375, 0.064361572265625, 0.07141494750976562, 0.07846832275390625, 0.08552169799804688, 0.0925750732421875, 0.09962844848632812, 0.10668182373046875, 0.11373519897460938, 0.12078857421875, 0.12784194946289062, 0.13489532470703125, 0.14194869995117188, 0.1490020751953125, 0.15605545043945312, 0.16310882568359375, 0.17016220092773438, 0.177215576171875, 0.18426895141601562, 0.19132232666015625, 0.19837570190429688, 0.2054290771484375, 0.21248245239257812, 0.21953582763671875, 0.22658920288085938, 0.233642578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 11.0, 7.0, 12.0, 13.0, 16.0, 21.0, 15.0, 32.0, 17.0, 26.0, 32.0, 30.0, 41.0, 42.0, 32.0, 38.0, 39.0, 36.0, 45.0, 34.0, 41.0, 46.0, 32.0, 34.0, 33.0, 30.0, 22.0, 26.0, 24.0, 23.0, 20.0, 12.0, 14.0, 12.0, 15.0, 12.0, 9.0, 5.0, 3.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8564453125, -1.7955780029296875, -1.734710693359375, -1.6738433837890625, -1.61297607421875, -1.5521087646484375, -1.491241455078125, -1.4303741455078125, -1.3695068359375, -1.3086395263671875, -1.247772216796875, -1.1869049072265625, -1.12603759765625, -1.0651702880859375, -1.004302978515625, -0.9434356689453125, -0.882568359375, -0.8217010498046875, -0.760833740234375, -0.6999664306640625, -0.63909912109375, -0.5782318115234375, -0.517364501953125, -0.4564971923828125, -0.3956298828125, -0.3347625732421875, -0.273895263671875, -0.2130279541015625, -0.15216064453125, -0.0912933349609375, -0.030426025390625, 0.0304412841796875, 0.09130859375, 0.1521759033203125, 0.213043212890625, 0.2739105224609375, 0.33477783203125, 0.3956451416015625, 0.456512451171875, 0.5173797607421875, 0.5782470703125, 0.6391143798828125, 0.699981689453125, 0.7608489990234375, 0.82171630859375, 0.8825836181640625, 0.943450927734375, 1.0043182373046875, 1.065185546875, 1.1260528564453125, 1.186920166015625, 1.2477874755859375, 1.30865478515625, 1.3695220947265625, 1.430389404296875, 1.4912567138671875, 1.5521240234375, 1.6129913330078125, 1.673858642578125, 1.7347259521484375, 1.79559326171875, 1.8564605712890625, 1.917327880859375, 1.9781951904296875, 2.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 17.0, 27.0, 29.0, 52.0, 88.0, 145.0, 262.0, 507.0, 1117.0, 8223.0, 988035.0, 46968.0, 1688.0, 647.0, 284.0, 180.0, 97.0, 72.0, 34.0, 25.0, 19.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.03768491744995117, -0.036093711853027344, -0.034502506256103516, -0.03291130065917969, -0.03132009506225586, -0.02972888946533203, -0.028137683868408203, -0.026546478271484375, -0.024955272674560547, -0.02336406707763672, -0.02177286148071289, -0.020181655883789062, -0.018590450286865234, -0.016999244689941406, -0.015408039093017578, -0.01381683349609375, -0.012225627899169922, -0.010634422302246094, -0.009043216705322266, -0.0074520111083984375, -0.005860805511474609, -0.004269599914550781, -0.002678394317626953, -0.001087188720703125, 0.0005040168762207031, 0.0020952224731445312, 0.0036864280700683594, 0.0052776336669921875, 0.006868839263916016, 0.008460044860839844, 0.010051250457763672, 0.0116424560546875, 0.013233661651611328, 0.014824867248535156, 0.016416072845458984, 0.018007278442382812, 0.01959848403930664, 0.02118968963623047, 0.022780895233154297, 0.024372100830078125, 0.025963306427001953, 0.02755451202392578, 0.02914571762084961, 0.030736923217773438, 0.032328128814697266, 0.033919334411621094, 0.03551054000854492, 0.03710174560546875, 0.03869295120239258, 0.040284156799316406, 0.041875362396240234, 0.04346656799316406, 0.04505777359008789, 0.04664897918701172, 0.04824018478393555, 0.049831390380859375, 0.0514225959777832, 0.05301380157470703, 0.05460500717163086, 0.05619621276855469, 0.057787418365478516, 0.059378623962402344, 0.06096982955932617, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 21.0, 32.0, 24.0, 52.0, 61.0, 97.0, 95.0, 110.0, 117.0, 94.0, 67.0, 60.0, 42.0, 38.0, 12.0, 12.0, 4.0, 12.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.008676528930664e-05, -1.9341707229614258e-05, -1.8596649169921875e-05, -1.7851591110229492e-05, -1.710653305053711e-05, -1.6361474990844727e-05, -1.5616416931152344e-05, -1.4871358871459961e-05, -1.4126300811767578e-05, -1.3381242752075195e-05, -1.2636184692382812e-05, -1.189112663269043e-05, -1.1146068572998047e-05, -1.0401010513305664e-05, -9.655952453613281e-06, -8.910894393920898e-06, -8.165836334228516e-06, -7.420778274536133e-06, -6.67572021484375e-06, -5.930662155151367e-06, -5.185604095458984e-06, -4.4405460357666016e-06, -3.6954879760742188e-06, -2.950429916381836e-06, -2.205371856689453e-06, -1.4603137969970703e-06, -7.152557373046875e-07, 2.9802322387695312e-08, 7.748603820800781e-07, 1.519918441772461e-06, 2.2649765014648438e-06, 3.0100345611572266e-06, 3.7550926208496094e-06, 4.500150680541992e-06, 5.245208740234375e-06, 5.990266799926758e-06, 6.735324859619141e-06, 7.4803829193115234e-06, 8.225440979003906e-06, 8.970499038696289e-06, 9.715557098388672e-06, 1.0460615158081055e-05, 1.1205673217773438e-05, 1.195073127746582e-05, 1.2695789337158203e-05, 1.3440847396850586e-05, 1.4185905456542969e-05, 1.4930963516235352e-05, 1.5676021575927734e-05, 1.6421079635620117e-05, 1.71661376953125e-05, 1.7911195755004883e-05, 1.8656253814697266e-05, 1.940131187438965e-05, 2.014636993408203e-05, 2.0891427993774414e-05, 2.1636486053466797e-05, 2.238154411315918e-05, 2.3126602172851562e-05, 2.3871660232543945e-05, 2.4616718292236328e-05, 2.536177635192871e-05, 2.6106834411621094e-05, 2.6851892471313477e-05, 2.759695053100586e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 14.0, 17.0, 16.0, 16.0, 35.0, 66.0, 114.0, 477.0, 4234.0, 259389.0, 777929.0, 5289.0, 532.0, 117.0, 67.0, 33.0, 33.0, 25.0, 16.0, 19.0, 10.0, 4.0, 13.0, 8.0, 7.0, 2.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13435745239257812, -0.13016510009765625, -0.12597274780273438, -0.1217803955078125, -0.11758804321289062, -0.11339569091796875, -0.10920333862304688, -0.105010986328125, -0.10081863403320312, -0.09662628173828125, -0.09243392944335938, -0.0882415771484375, -0.08404922485351562, -0.07985687255859375, -0.07566452026367188, -0.07147216796875, -0.06727981567382812, -0.06308746337890625, -0.058895111083984375, -0.0547027587890625, -0.050510406494140625, -0.04631805419921875, -0.042125701904296875, -0.037933349609375, -0.033740997314453125, -0.02954864501953125, -0.025356292724609375, -0.0211639404296875, -0.016971588134765625, -0.01277923583984375, -0.008586883544921875, -0.00439453125, -0.000202178955078125, 0.00399017333984375, 0.008182525634765625, 0.0123748779296875, 0.016567230224609375, 0.02075958251953125, 0.024951934814453125, 0.029144287109375, 0.033336639404296875, 0.03752899169921875, 0.041721343994140625, 0.0459136962890625, 0.050106048583984375, 0.05429840087890625, 0.058490753173828125, 0.06268310546875, 0.06687545776367188, 0.07106781005859375, 0.07526016235351562, 0.0794525146484375, 0.08364486694335938, 0.08783721923828125, 0.09202957153320312, 0.096221923828125, 0.10041427612304688, 0.10460662841796875, 0.10879898071289062, 0.1129913330078125, 0.11718368530273438, 0.12137603759765625, 0.12556838989257812, 0.1297607421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 16.0, 35.0, 38.0, 74.0, 187.0, 264.0, 190.0, 67.0, 36.0, 13.0, 14.0, 10.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0125885009765625, -0.012222528457641602, -0.011856555938720703, -0.011490583419799805, -0.011124610900878906, -0.010758638381958008, -0.01039266586303711, -0.010026693344116211, -0.009660720825195312, -0.009294748306274414, -0.008928775787353516, -0.008562803268432617, -0.008196830749511719, -0.00783085823059082, -0.007464885711669922, -0.0070989131927490234, -0.006732940673828125, -0.0063669681549072266, -0.006000995635986328, -0.00563502311706543, -0.005269050598144531, -0.004903078079223633, -0.004537105560302734, -0.004171133041381836, -0.0038051605224609375, -0.003439188003540039, -0.0030732154846191406, -0.002707242965698242, -0.0023412704467773438, -0.0019752979278564453, -0.0016093254089355469, -0.0012433528900146484, -0.00087738037109375, -0.0005114078521728516, -0.00014543533325195312, 0.0002205371856689453, 0.0005865097045898438, 0.0009524822235107422, 0.0013184547424316406, 0.001684427261352539, 0.0020503997802734375, 0.002416372299194336, 0.0027823448181152344, 0.003148317337036133, 0.0035142898559570312, 0.0038802623748779297, 0.004246234893798828, 0.0046122074127197266, 0.004978179931640625, 0.0053441524505615234, 0.005710124969482422, 0.00607609748840332, 0.006442070007324219, 0.006808042526245117, 0.007174015045166016, 0.007539987564086914, 0.007905960083007812, 0.008271932601928711, 0.00863790512084961, 0.009003877639770508, 0.009369850158691406, 0.009735822677612305, 0.010101795196533203, 0.010467767715454102, 0.010833740234375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 12.0, 32.0, 202.0, 482.0, 208.0, 44.0, 9.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.336677551269531, -14.041184425354004, -13.745691299438477, -13.45019817352295, -13.154705047607422, -12.859211921691895, -12.563718795776367, -12.26822566986084, -11.972732543945312, -11.677239418029785, -11.381746292114258, -11.08625316619873, -10.790760040283203, -10.495266914367676, -10.199773788452148, -9.904280662536621, -9.608787536621094, -9.313294410705566, -9.017801284790039, -8.722308158874512, -8.426815032958984, -8.131321907043457, -7.83582878112793, -7.540335655212402, -7.244842529296875, -6.949349403381348, -6.65385627746582, -6.358363151550293, -6.062870025634766, -5.767376899719238, -5.471883773803711, -5.176390647888184, -4.8808979988098145, -4.585404872894287, -4.28991174697876, -3.9944186210632324, -3.698925495147705, -3.4034323692321777, -3.1079392433166504, -2.812446117401123, -2.5169529914855957, -2.2214598655700684, -1.925966739654541, -1.6304736137390137, -1.3349804878234863, -1.039487361907959, -0.7439942359924316, -0.4485011100769043, -0.15300798416137695, 0.1424851417541504, 0.43797826766967773, 0.7334713935852051, 1.0289645195007324, 1.3244576454162598, 1.619950771331787, 1.9154438972473145, 2.210937023162842, 2.506430149078369, 2.8019232749938965, 3.097416400909424, 3.392909526824951, 3.6884026527404785, 3.983895778656006, 4.279388904571533, 4.5748820304870605]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 1.0, 10.0, 6.0, 10.0, 18.0, 22.0, 15.0, 20.0, 22.0, 35.0, 36.0, 30.0, 35.0, 39.0, 44.0, 35.0, 52.0, 46.0, 47.0, 56.0, 46.0, 40.0, 34.0, 30.0, 39.0, 38.0, 26.0, 26.0, 23.0, 30.0, 15.0, 8.0, 16.0, 8.0, 10.0, 6.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3640011548995972, -1.3239569664001465, -1.2839126586914062, -1.2438684701919556, -1.2038242816925049, -1.1637799739837646, -1.123735785484314, -1.0836915969848633, -1.043647289276123, -1.0036031007766724, -0.9635588526725769, -0.9235146045684814, -0.8834704160690308, -0.8434261679649353, -0.8033819198608398, -0.7633377313613892, -0.7232935428619385, -0.683249294757843, -0.6432051062583923, -0.6031608581542969, -0.5631166696548462, -0.5230724215507507, -0.4830281734466553, -0.4429839551448822, -0.40293973684310913, -0.36289551854133606, -0.322851300239563, -0.28280705213546753, -0.24276283383369446, -0.2027186155319214, -0.16267438232898712, -0.12263014912605286, -0.08258581161499023, -0.042541585862636566, -0.002497360110282898, 0.03754686564207077, 0.07759109139442444, 0.11763530969619751, 0.15767954289913177, 0.19772377610206604, 0.2377679944038391, 0.2778122127056122, 0.31785643100738525, 0.3579006791114807, 0.3979448974132538, 0.43798911571502686, 0.4780333638191223, 0.5180776119232178, 0.5581218004226685, 0.5981660485267639, 0.6382102370262146, 0.6782544851303101, 0.7182986736297607, 0.7583429217338562, 0.7983871698379517, 0.8384313583374023, 0.8784756064414978, 0.9185198545455933, 0.958564043045044, 0.9986082911491394, 1.0386525392532349, 1.0786967277526855, 1.1187409162521362, 1.1587852239608765, 1.1988294124603271]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 12.0, 15.0, 23.0, 27.0, 44.0, 53.0, 103.0, 137.0, 225.0, 351.0, 628.0, 1101.0, 2130.0, 4295.0, 9160.0, 22758.0, 69604.0, 526633.0, 324739.0, 52382.0, 18255.0, 7986.0, 3654.0, 1921.0, 959.0, 513.0, 301.0, 185.0, 122.0, 57.0, 46.0, 30.0, 23.0, 18.0, 16.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.4921875, -1.4517364501953125, -1.411285400390625, -1.3708343505859375, -1.33038330078125, -1.2899322509765625, -1.249481201171875, -1.2090301513671875, -1.1685791015625, -1.1281280517578125, -1.087677001953125, -1.0472259521484375, -1.00677490234375, -0.9663238525390625, -0.925872802734375, -0.8854217529296875, -0.844970703125, -0.8045196533203125, -0.764068603515625, -0.7236175537109375, -0.68316650390625, -0.6427154541015625, -0.602264404296875, -0.5618133544921875, -0.5213623046875, -0.4809112548828125, -0.440460205078125, -0.4000091552734375, -0.35955810546875, -0.3191070556640625, -0.278656005859375, -0.2382049560546875, -0.19775390625, -0.1573028564453125, -0.116851806640625, -0.0764007568359375, -0.03594970703125, 0.0045013427734375, 0.044952392578125, 0.0854034423828125, 0.1258544921875, 0.1663055419921875, 0.206756591796875, 0.2472076416015625, 0.28765869140625, 0.3281097412109375, 0.368560791015625, 0.4090118408203125, 0.449462890625, 0.4899139404296875, 0.530364990234375, 0.5708160400390625, 0.61126708984375, 0.6517181396484375, 0.692169189453125, 0.7326202392578125, 0.7730712890625, 0.8135223388671875, 0.853973388671875, 0.8944244384765625, 0.93487548828125, 0.9753265380859375, 1.015777587890625, 1.0562286376953125, 1.0966796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 7.0, 14.0, 17.0, 18.0, 23.0, 27.0, 36.0, 47.0, 34.0, 35.0, 45.0, 37.0, 41.0, 53.0, 57.0, 53.0, 45.0, 45.0, 46.0, 33.0, 31.0, 28.0, 29.0, 22.0, 24.0, 24.0, 21.0, 15.0, 14.0, 7.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.81640625, -3.7147216796875, -3.613037109375, -3.5113525390625, -3.40966796875, -3.3079833984375, -3.206298828125, -3.1046142578125, -3.0029296875, -2.9012451171875, -2.799560546875, -2.6978759765625, -2.59619140625, -2.4945068359375, -2.392822265625, -2.2911376953125, -2.189453125, -2.0877685546875, -1.986083984375, -1.8843994140625, -1.78271484375, -1.6810302734375, -1.579345703125, -1.4776611328125, -1.3759765625, -1.2742919921875, -1.172607421875, -1.0709228515625, -0.96923828125, -0.8675537109375, -0.765869140625, -0.6641845703125, -0.5625, -0.4608154296875, -0.359130859375, -0.2574462890625, -0.15576171875, -0.0540771484375, 0.047607421875, 0.1492919921875, 0.2509765625, 0.3526611328125, 0.454345703125, 0.5560302734375, 0.65771484375, 0.7593994140625, 0.861083984375, 0.9627685546875, 1.064453125, 1.1661376953125, 1.267822265625, 1.3695068359375, 1.47119140625, 1.5728759765625, 1.674560546875, 1.7762451171875, 1.8779296875, 1.9796142578125, 2.081298828125, 2.1829833984375, 2.28466796875, 2.3863525390625, 2.488037109375, 2.5897216796875, 2.69140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 10.0, 8.0, 16.0, 15.0, 28.0, 29.0, 35.0, 63.0, 62.0, 113.0, 337.0, 1044557.0, 2842.0, 130.0, 63.0, 57.0, 47.0, 34.0, 19.0, 27.0, 13.0, 8.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.21875, -21.539306640625, -20.85986328125, -20.180419921875, -19.5009765625, -18.821533203125, -18.14208984375, -17.462646484375, -16.783203125, -16.103759765625, -15.42431640625, -14.744873046875, -14.0654296875, -13.385986328125, -12.70654296875, -12.027099609375, -11.34765625, -10.668212890625, -9.98876953125, -9.309326171875, -8.6298828125, -7.950439453125, -7.27099609375, -6.591552734375, -5.912109375, -5.232666015625, -4.55322265625, -3.873779296875, -3.1943359375, -2.514892578125, -1.83544921875, -1.156005859375, -0.4765625, 0.202880859375, 0.88232421875, 1.561767578125, 2.2412109375, 2.920654296875, 3.60009765625, 4.279541015625, 4.958984375, 5.638427734375, 6.31787109375, 6.997314453125, 7.6767578125, 8.356201171875, 9.03564453125, 9.715087890625, 10.39453125, 11.073974609375, 11.75341796875, 12.432861328125, 13.1123046875, 13.791748046875, 14.47119140625, 15.150634765625, 15.830078125, 16.509521484375, 17.18896484375, 17.868408203125, 18.5478515625, 19.227294921875, 19.90673828125, 20.586181640625, 21.265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 10.0, 17.0, 14.0, 25.0, 31.0, 36.0, 63.0, 61.0, 73.0, 80.0, 105.0, 82.0, 86.0, 63.0, 53.0, 47.0, 36.0, 18.0, 30.0, 13.0, 8.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.5244140625, -7.287109375, -7.0498046875, -6.8125, -6.5751953125, -6.337890625, -6.1005859375, -5.86328125, -5.6259765625, -5.388671875, -5.1513671875, -4.9140625, -4.6767578125, -4.439453125, -4.2021484375, -3.96484375, -3.7275390625, -3.490234375, -3.2529296875, -3.015625, -2.7783203125, -2.541015625, -2.3037109375, -2.06640625, -1.8291015625, -1.591796875, -1.3544921875, -1.1171875, -0.8798828125, -0.642578125, -0.4052734375, -0.16796875, 0.0693359375, 0.306640625, 0.5439453125, 0.78125, 1.0185546875, 1.255859375, 1.4931640625, 1.73046875, 1.9677734375, 2.205078125, 2.4423828125, 2.6796875, 2.9169921875, 3.154296875, 3.3916015625, 3.62890625, 3.8662109375, 4.103515625, 4.3408203125, 4.578125, 4.8154296875, 5.052734375, 5.2900390625, 5.52734375, 5.7646484375, 6.001953125, 6.2392578125, 6.4765625, 6.7138671875, 6.951171875, 7.1884765625, 7.42578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 6.0, 10.0, 15.0, 32.0, 61.0, 67.0, 156.0, 348.0, 958.0, 3239.0, 17044.0, 772024.0, 236224.0, 14087.0, 2763.0, 871.0, 305.0, 127.0, 76.0, 50.0, 29.0, 13.0, 8.0, 6.0, 8.0, 8.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.64971923828125, -0.6256103515625, -0.60150146484375, -0.577392578125, -0.55328369140625, -0.5291748046875, -0.50506591796875, -0.48095703125, -0.45684814453125, -0.4327392578125, -0.40863037109375, -0.384521484375, -0.36041259765625, -0.3363037109375, -0.31219482421875, -0.2880859375, -0.26397705078125, -0.2398681640625, -0.21575927734375, -0.191650390625, -0.16754150390625, -0.1434326171875, -0.11932373046875, -0.09521484375, -0.07110595703125, -0.0469970703125, -0.02288818359375, 0.001220703125, 0.02532958984375, 0.0494384765625, 0.07354736328125, 0.09765625, 0.12176513671875, 0.1458740234375, 0.16998291015625, 0.194091796875, 0.21820068359375, 0.2423095703125, 0.26641845703125, 0.29052734375, 0.31463623046875, 0.3387451171875, 0.36285400390625, 0.386962890625, 0.41107177734375, 0.4351806640625, 0.45928955078125, 0.4833984375, 0.50750732421875, 0.5316162109375, 0.55572509765625, 0.579833984375, 0.60394287109375, 0.6280517578125, 0.65216064453125, 0.67626953125, 0.70037841796875, 0.7244873046875, 0.74859619140625, 0.772705078125, 0.79681396484375, 0.8209228515625, 0.84503173828125, 0.869140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 3.0, 10.0, 9.0, 23.0, 37.0, 55.0, 126.0, 298.0, 187.0, 94.0, 43.0, 29.0, 16.0, 12.0, 10.0, 8.0, 6.0, 7.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.888410568237305e-05, -9.626150131225586e-05, -9.363889694213867e-05, -9.101629257202148e-05, -8.83936882019043e-05, -8.577108383178711e-05, -8.314847946166992e-05, -8.052587509155273e-05, -7.790327072143555e-05, -7.528066635131836e-05, -7.265806198120117e-05, -7.003545761108398e-05, -6.74128532409668e-05, -6.479024887084961e-05, -6.216764450073242e-05, -5.9545040130615234e-05, -5.692243576049805e-05, -5.429983139038086e-05, -5.167722702026367e-05, -4.9054622650146484e-05, -4.64320182800293e-05, -4.380941390991211e-05, -4.118680953979492e-05, -3.8564205169677734e-05, -3.594160079956055e-05, -3.331899642944336e-05, -3.069639205932617e-05, -2.8073787689208984e-05, -2.5451183319091797e-05, -2.282857894897461e-05, -2.0205974578857422e-05, -1.7583370208740234e-05, -1.4960765838623047e-05, -1.233816146850586e-05, -9.715557098388672e-06, -7.092952728271484e-06, -4.470348358154297e-06, -1.8477439880371094e-06, 7.748603820800781e-07, 3.3974647521972656e-06, 6.020069122314453e-06, 8.64267349243164e-06, 1.1265277862548828e-05, 1.3887882232666016e-05, 1.6510486602783203e-05, 1.913309097290039e-05, 2.1755695343017578e-05, 2.4378299713134766e-05, 2.7000904083251953e-05, 2.962350845336914e-05, 3.224611282348633e-05, 3.4868717193603516e-05, 3.74913215637207e-05, 4.011392593383789e-05, 4.273653030395508e-05, 4.5359134674072266e-05, 4.798173904418945e-05, 5.060434341430664e-05, 5.322694778442383e-05, 5.5849552154541016e-05, 5.84721565246582e-05, 6.109476089477539e-05, 6.371736526489258e-05, 6.633996963500977e-05, 6.896257400512695e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 4.0, 8.0, 9.0, 12.0, 24.0, 31.0, 60.0, 76.0, 114.0, 242.0, 436.0, 954.0, 2488.0, 7975.0, 42338.0, 901018.0, 75977.0, 11312.0, 3141.0, 1140.0, 559.0, 256.0, 151.0, 87.0, 55.0, 31.0, 12.0, 14.0, 6.0, 8.0, 2.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6416015625, -0.6225204467773438, -0.6034393310546875, -0.5843582153320312, -0.565277099609375, -0.5461959838867188, -0.5271148681640625, -0.5080337524414062, -0.48895263671875, -0.46987152099609375, -0.4507904052734375, -0.43170928955078125, -0.412628173828125, -0.39354705810546875, -0.3744659423828125, -0.35538482666015625, -0.3363037109375, -0.31722259521484375, -0.2981414794921875, -0.27906036376953125, -0.259979248046875, -0.24089813232421875, -0.2218170166015625, -0.20273590087890625, -0.18365478515625, -0.16457366943359375, -0.1454925537109375, -0.12641143798828125, -0.107330322265625, -0.08824920654296875, -0.0691680908203125, -0.05008697509765625, -0.031005859375, -0.01192474365234375, 0.0071563720703125, 0.02623748779296875, 0.045318603515625, 0.06439971923828125, 0.0834808349609375, 0.10256195068359375, 0.12164306640625, 0.14072418212890625, 0.1598052978515625, 0.17888641357421875, 0.197967529296875, 0.21704864501953125, 0.2361297607421875, 0.25521087646484375, 0.2742919921875, 0.29337310791015625, 0.3124542236328125, 0.33153533935546875, 0.350616455078125, 0.36969757080078125, 0.3887786865234375, 0.40785980224609375, 0.42694091796875, 0.44602203369140625, 0.4651031494140625, 0.48418426513671875, 0.503265380859375, 0.5223464965820312, 0.5414276123046875, 0.5605087280273438, 0.57958984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 8.0, 7.0, 13.0, 16.0, 18.0, 30.0, 40.0, 82.0, 141.0, 351.0, 117.0, 67.0, 35.0, 19.0, 11.0, 13.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.21435165405273438, -0.20812225341796875, -0.20189285278320312, -0.1956634521484375, -0.18943405151367188, -0.18320465087890625, -0.17697525024414062, -0.170745849609375, -0.16451644897460938, -0.15828704833984375, -0.15205764770507812, -0.1458282470703125, -0.13959884643554688, -0.13336944580078125, -0.12714004516601562, -0.12091064453125, -0.11468124389648438, -0.10845184326171875, -0.10222244262695312, -0.0959930419921875, -0.08976364135742188, -0.08353424072265625, -0.07730484008789062, -0.071075439453125, -0.06484603881835938, -0.05861663818359375, -0.052387237548828125, -0.0461578369140625, -0.039928436279296875, -0.03369903564453125, -0.027469635009765625, -0.021240234375, -0.015010833740234375, -0.00878143310546875, -0.002552032470703125, 0.0036773681640625, 0.009906768798828125, 0.01613616943359375, 0.022365570068359375, 0.028594970703125, 0.034824371337890625, 0.04105377197265625, 0.047283172607421875, 0.0535125732421875, 0.059741973876953125, 0.06597137451171875, 0.07220077514648438, 0.07843017578125, 0.08465957641601562, 0.09088897705078125, 0.09711837768554688, 0.1033477783203125, 0.10957717895507812, 0.11580657958984375, 0.12203598022460938, 0.128265380859375, 0.13449478149414062, 0.14072418212890625, 0.14695358276367188, 0.1531829833984375, 0.15941238403320312, 0.16564178466796875, 0.17187118530273438, 0.1781005859375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 13.0, 15.0, 34.0, 115.0, 243.0, 285.0, 163.0, 61.0, 36.0, 11.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.668109893798828, -12.3677339553833, -12.06735897064209, -11.766983032226562, -11.466608047485352, -11.166232109069824, -10.865856170654297, -10.565481185913086, -10.265105247497559, -9.964729309082031, -9.66435432434082, -9.363978385925293, -9.063603401184082, -8.763227462768555, -8.462852478027344, -8.162476539611816, -7.862101078033447, -7.561725616455078, -7.261350154876709, -6.96097469329834, -6.6605987548828125, -6.360223293304443, -6.059847831726074, -5.759471893310547, -5.459096908569336, -5.158721446990967, -4.858345985412598, -4.55797004699707, -4.257594585418701, -3.957219123840332, -3.656843662261963, -3.3564679622650146, -3.0560927391052246, -2.7557172775268555, -2.4553415775299072, -2.154966115951538, -1.8545905351638794, -1.5542149543762207, -1.2538394927978516, -0.9534637928009033, -0.6530883312225342, -0.3527127802371979, -0.05233722925186157, 0.24803829193115234, 0.548413872718811, 0.8487894535064697, 1.1491649150848389, 1.449540615081787, 1.7499160766601562, 2.0502915382385254, 2.3506672382354736, 2.6510426998138428, 2.951418399810791, 3.25179386138916, 3.5521693229675293, 3.8525450229644775, 4.152920722961426, 4.453296184539795, 4.753671646118164, 5.054047584533691, 5.3544230461120605, 5.65479850769043, 5.955173969268799, 6.255549430847168, 6.555924892425537]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 17.0, 10.0, 12.0, 22.0, 13.0, 27.0, 24.0, 34.0, 34.0, 32.0, 46.0, 53.0, 60.0, 47.0, 35.0, 45.0, 38.0, 56.0, 49.0, 38.0, 46.0, 45.0, 33.0, 26.0, 27.0, 21.0, 22.0, 23.0, 7.0, 11.0, 7.0, 4.0, 7.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450930118560791, -7.241085529327393, -7.031241416931152, -6.821396827697754, -6.6115522384643555, -6.401707649230957, -6.191863536834717, -5.982018947601318, -5.772174835205078, -5.56233024597168, -5.3524861335754395, -5.142641544342041, -4.932796955108643, -4.722952842712402, -4.513108253479004, -4.3032636642456055, -4.093419075012207, -3.8835747241973877, -3.6737301349639893, -3.46388578414917, -3.2540411949157715, -3.044196844100952, -2.834352493286133, -2.6245079040527344, -2.414663553237915, -2.2048192024230957, -1.9949746131896973, -1.785130262374878, -1.575285792350769, -1.3654413223266602, -1.1555969715118408, -0.9457525014877319, -0.735908031463623, -0.5260635614395142, -0.31621915102005005, -0.10637474060058594, 0.10346972942352295, 0.31331419944763184, 0.5231585502624512, 0.7330030202865601, 0.942847490310669, 1.1526919603347778, 1.3625364303588867, 1.572380781173706, 1.782225251197815, 1.9920697212219238, 2.201914072036743, 2.4117584228515625, 2.621603012084961, 2.8314473628997803, 3.0412919521331787, 3.251136302947998, 3.4609808921813965, 3.670825242996216, 3.880669593811035, 4.090514183044434, 4.300358772277832, 4.5102033615112305, 4.720047473907471, 4.929892063140869, 5.139736652374268, 5.349580764770508, 5.559425354003906, 5.769269943237305, 5.979114055633545]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 14.0, 6.0, 15.0, 20.0, 25.0, 29.0, 37.0, 73.0, 78.0, 148.0, 322.0, 777.0, 2909.0, 15151.0, 218424.0, 3837478.0, 105163.0, 10207.0, 2088.0, 630.0, 247.0, 139.0, 71.0, 61.0, 31.0, 26.0, 14.0, 11.0, 16.0, 14.0, 10.0, 6.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.09735107421875, -4.9447021484375, -4.79205322265625, -4.639404296875, -4.48675537109375, -4.3341064453125, -4.18145751953125, -4.02880859375, -3.87615966796875, -3.7235107421875, -3.57086181640625, -3.418212890625, -3.26556396484375, -3.1129150390625, -2.96026611328125, -2.8076171875, -2.65496826171875, -2.5023193359375, -2.34967041015625, -2.197021484375, -2.04437255859375, -1.8917236328125, -1.73907470703125, -1.58642578125, -1.43377685546875, -1.2811279296875, -1.12847900390625, -0.975830078125, -0.82318115234375, -0.6705322265625, -0.51788330078125, -0.365234375, -0.21258544921875, -0.0599365234375, 0.09271240234375, 0.245361328125, 0.39801025390625, 0.5506591796875, 0.70330810546875, 0.85595703125, 1.00860595703125, 1.1612548828125, 1.31390380859375, 1.466552734375, 1.61920166015625, 1.7718505859375, 1.92449951171875, 2.0771484375, 2.22979736328125, 2.3824462890625, 2.53509521484375, 2.687744140625, 2.84039306640625, 2.9930419921875, 3.14569091796875, 3.29833984375, 3.45098876953125, 3.6036376953125, 3.75628662109375, 3.908935546875, 4.06158447265625, 4.2142333984375, 4.36688232421875, 4.51953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 11.0, 5.0, 9.0, 18.0, 17.0, 25.0, 28.0, 35.0, 40.0, 47.0, 56.0, 51.0, 50.0, 68.0, 58.0, 59.0, 48.0, 52.0, 49.0, 38.0, 37.0, 26.0, 20.0, 33.0, 23.0, 19.0, 10.0, 8.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.796875, -1.7444610595703125, -1.692047119140625, -1.6396331787109375, -1.58721923828125, -1.5348052978515625, -1.482391357421875, -1.4299774169921875, -1.3775634765625, -1.3251495361328125, -1.272735595703125, -1.2203216552734375, -1.16790771484375, -1.1154937744140625, -1.063079833984375, -1.0106658935546875, -0.958251953125, -0.9058380126953125, -0.853424072265625, -0.8010101318359375, -0.74859619140625, -0.6961822509765625, -0.643768310546875, -0.5913543701171875, -0.5389404296875, -0.4865264892578125, -0.434112548828125, -0.3816986083984375, -0.32928466796875, -0.2768707275390625, -0.224456787109375, -0.1720428466796875, -0.11962890625, -0.0672149658203125, -0.014801025390625, 0.0376129150390625, 0.09002685546875, 0.1424407958984375, 0.194854736328125, 0.2472686767578125, 0.2996826171875, 0.3520965576171875, 0.404510498046875, 0.4569244384765625, 0.50933837890625, 0.5617523193359375, 0.614166259765625, 0.6665802001953125, 0.718994140625, 0.7714080810546875, 0.823822021484375, 0.8762359619140625, 0.92864990234375, 0.9810638427734375, 1.033477783203125, 1.0858917236328125, 1.1383056640625, 1.1907196044921875, 1.243133544921875, 1.2955474853515625, 1.34796142578125, 1.4003753662109375, 1.452789306640625, 1.5052032470703125, 1.5576171875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 12.0, 30.0, 158.0, 4463.0, 4187854.0, 1613.0, 108.0, 26.0, 9.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.3565673828125, -32.588134765625, -31.8197021484375, -31.05126953125, -30.2828369140625, -29.514404296875, -28.7459716796875, -27.9775390625, -27.2091064453125, -26.440673828125, -25.6722412109375, -24.90380859375, -24.1353759765625, -23.366943359375, -22.5985107421875, -21.830078125, -21.0616455078125, -20.293212890625, -19.5247802734375, -18.75634765625, -17.9879150390625, -17.219482421875, -16.4510498046875, -15.6826171875, -14.9141845703125, -14.145751953125, -13.3773193359375, -12.60888671875, -11.8404541015625, -11.072021484375, -10.3035888671875, -9.53515625, -8.7667236328125, -7.998291015625, -7.2298583984375, -6.46142578125, -5.6929931640625, -4.924560546875, -4.1561279296875, -3.3876953125, -2.6192626953125, -1.850830078125, -1.0823974609375, -0.31396484375, 0.4544677734375, 1.222900390625, 1.9913330078125, 2.759765625, 3.5281982421875, 4.296630859375, 5.0650634765625, 5.83349609375, 6.6019287109375, 7.370361328125, 8.1387939453125, 8.9072265625, 9.6756591796875, 10.444091796875, 11.2125244140625, 11.98095703125, 12.7493896484375, 13.517822265625, 14.2862548828125, 15.0546875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 15.0, 17.0, 28.0, 34.0, 71.0, 99.0, 143.0, 288.0, 687.0, 1466.0, 506.0, 245.0, 177.0, 110.0, 69.0, 39.0, 28.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.534332275390625, -0.50811767578125, -0.481903076171875, -0.4556884765625, -0.429473876953125, -0.40325927734375, -0.377044677734375, -0.350830078125, -0.324615478515625, -0.29840087890625, -0.272186279296875, -0.2459716796875, -0.219757080078125, -0.19354248046875, -0.167327880859375, -0.14111328125, -0.114898681640625, -0.08868408203125, -0.062469482421875, -0.0362548828125, -0.010040283203125, 0.01617431640625, 0.042388916015625, 0.068603515625, 0.094818115234375, 0.12103271484375, 0.147247314453125, 0.1734619140625, 0.199676513671875, 0.22589111328125, 0.252105712890625, 0.2783203125, 0.304534912109375, 0.33074951171875, 0.356964111328125, 0.3831787109375, 0.409393310546875, 0.43560791015625, 0.461822509765625, 0.488037109375, 0.514251708984375, 0.54046630859375, 0.566680908203125, 0.5928955078125, 0.619110107421875, 0.64532470703125, 0.671539306640625, 0.69775390625, 0.723968505859375, 0.75018310546875, 0.776397705078125, 0.8026123046875, 0.828826904296875, 0.85504150390625, 0.881256103515625, 0.907470703125, 0.933685302734375, 0.95989990234375, 0.986114501953125, 1.0123291015625, 1.038543701171875, 1.06475830078125, 1.090972900390625, 1.1171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 13.0, 8.0, 14.0, 28.0, 29.0, 71.0, 120.0, 156.0, 214.0, 130.0, 80.0, 48.0, 24.0, 16.0, 11.0, 12.0, 5.0, 2.0, 6.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.755366802215576, -4.611855983734131, -4.4683451652526855, -4.32483434677124, -4.181323528289795, -4.03781270980835, -3.8943018913269043, -3.750791072845459, -3.6072802543640137, -3.4637694358825684, -3.320258617401123, -3.1767477989196777, -3.0332369804382324, -2.889726161956787, -2.746215343475342, -2.6027045249938965, -2.4591939449310303, -2.315683126449585, -2.1721723079681396, -2.0286614894866943, -1.885150671005249, -1.7416398525238037, -1.598129153251648, -1.4546183347702026, -1.3111075162887573, -1.167596697807312, -1.0240858793258667, -0.8805751204490662, -0.7370643019676208, -0.5935534834861755, -0.450042724609375, -0.3065319061279297, -0.16302108764648438, -0.019510284066200256, 0.12400051951408386, 0.2675113081932068, 0.4110221266746521, 0.5545329451560974, 0.698043704032898, 0.8415545225143433, 0.9850653409957886, 1.1285761594772339, 1.2720869779586792, 1.415597677230835, 1.5591084957122803, 1.7026193141937256, 1.846130132675171, 1.9896409511566162, 2.1331517696380615, 2.276662588119507, 2.420173406600952, 2.5636842250823975, 2.7071950435638428, 2.850705862045288, 2.9942164421081543, 3.1377272605895996, 3.281238079071045, 3.4247488975524902, 3.5682597160339355, 3.711770534515381, 3.855281352996826, 3.9987921714782715, 4.142302989959717, 4.285813808441162, 4.429324626922607]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 7.0, 8.0, 3.0, 4.0, 9.0, 14.0, 18.0, 15.0, 19.0, 29.0, 40.0, 41.0, 52.0, 50.0, 52.0, 42.0, 54.0, 46.0, 55.0, 40.0, 58.0, 40.0, 32.0, 47.0, 38.0, 26.0, 22.0, 20.0, 22.0, 13.0, 12.0, 17.0, 17.0, 5.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8465375900268555, -1.7900300025939941, -1.7335222959518433, -1.6770145893096924, -1.620507001876831, -1.5639994144439697, -1.5074917078018188, -1.450984001159668, -1.3944764137268066, -1.3379688262939453, -1.2814611196517944, -1.2249534130096436, -1.1684458255767822, -1.111938238143921, -1.05543053150177, -0.9989228844642639, -0.9424152374267578, -0.8859075903892517, -0.8293999433517456, -0.7728922963142395, -0.7163846492767334, -0.6598770022392273, -0.6033693552017212, -0.5468617081642151, -0.490354061126709, -0.4338464140892029, -0.3773387670516968, -0.3208311200141907, -0.26432347297668457, -0.20781582593917847, -0.15130817890167236, -0.09480053186416626, -0.03829300403594971, 0.018214643001556396, 0.0747222900390625, 0.1312299370765686, 0.1877375841140747, 0.2442452311515808, 0.3007528781890869, 0.357260525226593, 0.4137681722640991, 0.4702758193016052, 0.5267834663391113, 0.5832911133766174, 0.6397987604141235, 0.6963064074516296, 0.7528140544891357, 0.8093217015266418, 0.865829348564148, 0.922336995601654, 0.9788446426391602, 1.0353522300720215, 1.0918599367141724, 1.1483676433563232, 1.2048752307891846, 1.261382818222046, 1.3178905248641968, 1.3743982315063477, 1.430905818939209, 1.4874134063720703, 1.5439211130142212, 1.600428819656372, 1.6569364070892334, 1.7134439945220947, 1.7699517011642456]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 8.0, 21.0, 21.0, 21.0, 22.0, 29.0, 63.0, 92.0, 148.0, 224.0, 458.0, 836.0, 1750.0, 4785.0, 26718.0, 815720.0, 181080.0, 10823.0, 2920.0, 1261.0, 632.0, 381.0, 192.0, 134.0, 75.0, 30.0, 29.0, 16.0, 18.0, 11.0, 4.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.4609375, -0.4459648132324219, -0.43099212646484375, -0.4160194396972656, -0.4010467529296875, -0.3860740661621094, -0.37110137939453125, -0.3561286926269531, -0.341156005859375, -0.3261833190917969, -0.31121063232421875, -0.2962379455566406, -0.2812652587890625, -0.2662925720214844, -0.25131988525390625, -0.23634719848632812, -0.22137451171875, -0.20640182495117188, -0.19142913818359375, -0.17645645141601562, -0.1614837646484375, -0.14651107788085938, -0.13153839111328125, -0.11656570434570312, -0.101593017578125, -0.08662033081054688, -0.07164764404296875, -0.056674957275390625, -0.0417022705078125, -0.026729583740234375, -0.01175689697265625, 0.003215789794921875, 0.0181884765625, 0.033161163330078125, 0.04813385009765625, 0.06310653686523438, 0.0780792236328125, 0.09305191040039062, 0.10802459716796875, 0.12299728393554688, 0.137969970703125, 0.15294265747070312, 0.16791534423828125, 0.18288803100585938, 0.1978607177734375, 0.21283340454101562, 0.22780609130859375, 0.24277877807617188, 0.25775146484375, 0.2727241516113281, 0.28769683837890625, 0.3026695251464844, 0.3176422119140625, 0.3326148986816406, 0.34758758544921875, 0.3625602722167969, 0.377532958984375, 0.3925056457519531, 0.40747833251953125, 0.4224510192871094, 0.4374237060546875, 0.4523963928222656, 0.46736907958984375, 0.4823417663574219, 0.497314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 12.0, 7.0, 7.0, 12.0, 14.0, 25.0, 37.0, 27.0, 41.0, 63.0, 60.0, 70.0, 51.0, 50.0, 72.0, 55.0, 47.0, 45.0, 43.0, 44.0, 33.0, 30.0, 27.0, 17.0, 13.0, 17.0, 17.0, 10.0, 15.0, 5.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.311553955078125, -1.27056884765625, -1.229583740234375, -1.1885986328125, -1.147613525390625, -1.10662841796875, -1.065643310546875, -1.024658203125, -0.983673095703125, -0.94268798828125, -0.901702880859375, -0.8607177734375, -0.819732666015625, -0.77874755859375, -0.737762451171875, -0.69677734375, -0.655792236328125, -0.61480712890625, -0.573822021484375, -0.5328369140625, -0.491851806640625, -0.45086669921875, -0.409881591796875, -0.368896484375, -0.327911376953125, -0.28692626953125, -0.245941162109375, -0.2049560546875, -0.163970947265625, -0.12298583984375, -0.082000732421875, -0.041015625, -3.0517578125e-05, 0.04095458984375, 0.081939697265625, 0.1229248046875, 0.163909912109375, 0.20489501953125, 0.245880126953125, 0.286865234375, 0.327850341796875, 0.36883544921875, 0.409820556640625, 0.4508056640625, 0.491790771484375, 0.53277587890625, 0.573760986328125, 0.61474609375, 0.655731201171875, 0.69671630859375, 0.737701416015625, 0.7786865234375, 0.819671630859375, 0.86065673828125, 0.901641845703125, 0.942626953125, 0.983612060546875, 1.02459716796875, 1.065582275390625, 1.1065673828125, 1.147552490234375, 1.18853759765625, 1.229522705078125, 1.2705078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 6.0, 5.0, 13.0, 12.0, 21.0, 18.0, 17.0, 33.0, 41.0, 55.0, 63.0, 122.0, 158.0, 282.0, 466.0, 1247.0, 5436.0, 53881.0, 738085.0, 229383.0, 14984.0, 2416.0, 746.0, 318.0, 206.0, 139.0, 113.0, 75.0, 54.0, 39.0, 30.0, 19.0, 25.0, 14.0, 6.0, 8.0, 3.0, 5.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2059326171875, -0.1994457244873047, -0.19295883178710938, -0.18647193908691406, -0.17998504638671875, -0.17349815368652344, -0.16701126098632812, -0.1605243682861328, -0.1540374755859375, -0.1475505828857422, -0.14106369018554688, -0.13457679748535156, -0.12808990478515625, -0.12160301208496094, -0.11511611938476562, -0.10862922668457031, -0.102142333984375, -0.09565544128417969, -0.08916854858398438, -0.08268165588378906, -0.07619476318359375, -0.06970787048339844, -0.06322097778320312, -0.05673408508300781, -0.0502471923828125, -0.04376029968261719, -0.037273406982421875, -0.030786514282226562, -0.02429962158203125, -0.017812728881835938, -0.011325836181640625, -0.0048389434814453125, 0.00164794921875, 0.008134841918945312, 0.014621734619140625, 0.021108627319335938, 0.02759552001953125, 0.03408241271972656, 0.040569305419921875, 0.04705619812011719, 0.0535430908203125, 0.06002998352050781, 0.06651687622070312, 0.07300376892089844, 0.07949066162109375, 0.08597755432128906, 0.09246444702148438, 0.09895133972167969, 0.105438232421875, 0.11192512512207031, 0.11841201782226562, 0.12489891052246094, 0.13138580322265625, 0.13787269592285156, 0.14435958862304688, 0.1508464813232422, 0.1573333740234375, 0.1638202667236328, 0.17030715942382812, 0.17679405212402344, 0.18328094482421875, 0.18976783752441406, 0.19625473022460938, 0.2027416229248047, 0.209228515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 16.0, 11.0, 16.0, 19.0, 18.0, 20.0, 36.0, 21.0, 32.0, 24.0, 52.0, 43.0, 44.0, 59.0, 60.0, 41.0, 52.0, 38.0, 45.0, 54.0, 42.0, 32.0, 48.0, 22.0, 27.0, 24.0, 23.0, 14.0, 13.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7871551513671875, -1.723724365234375, -1.6602935791015625, -1.59686279296875, -1.5334320068359375, -1.470001220703125, -1.4065704345703125, -1.3431396484375, -1.2797088623046875, -1.216278076171875, -1.1528472900390625, -1.08941650390625, -1.0259857177734375, -0.962554931640625, -0.8991241455078125, -0.835693359375, -0.7722625732421875, -0.708831787109375, -0.6454010009765625, -0.58197021484375, -0.5185394287109375, -0.455108642578125, -0.3916778564453125, -0.3282470703125, -0.2648162841796875, -0.201385498046875, -0.1379547119140625, -0.07452392578125, -0.0110931396484375, 0.052337646484375, 0.1157684326171875, 0.17919921875, 0.2426300048828125, 0.306060791015625, 0.3694915771484375, 0.43292236328125, 0.4963531494140625, 0.559783935546875, 0.6232147216796875, 0.6866455078125, 0.7500762939453125, 0.813507080078125, 0.8769378662109375, 0.94036865234375, 1.0037994384765625, 1.067230224609375, 1.1306610107421875, 1.194091796875, 1.2575225830078125, 1.320953369140625, 1.3843841552734375, 1.44781494140625, 1.5112457275390625, 1.574676513671875, 1.6381072998046875, 1.7015380859375, 1.7649688720703125, 1.828399658203125, 1.8918304443359375, 1.95526123046875, 2.0186920166015625, 2.082122802734375, 2.1455535888671875, 2.208984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 7.0, 10.0, 6.0, 14.0, 28.0, 57.0, 89.0, 201.0, 832.0, 14911.0, 1027949.0, 3640.0, 493.0, 130.0, 82.0, 29.0, 18.0, 15.0, 13.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2421875, -0.2360248565673828, -0.22986221313476562, -0.22369956970214844, -0.21753692626953125, -0.21137428283691406, -0.20521163940429688, -0.1990489959716797, -0.1928863525390625, -0.1867237091064453, -0.18056106567382812, -0.17439842224121094, -0.16823577880859375, -0.16207313537597656, -0.15591049194335938, -0.1497478485107422, -0.143585205078125, -0.1374225616455078, -0.13125991821289062, -0.12509727478027344, -0.11893463134765625, -0.11277198791503906, -0.10660934448242188, -0.10044670104980469, -0.0942840576171875, -0.08812141418457031, -0.08195877075195312, -0.07579612731933594, -0.06963348388671875, -0.06347084045410156, -0.057308197021484375, -0.05114555358886719, -0.04498291015625, -0.03882026672363281, -0.032657623291015625, -0.026494979858398438, -0.02033233642578125, -0.014169692993164062, -0.008007049560546875, -0.0018444061279296875, 0.0043182373046875, 0.010480880737304688, 0.016643524169921875, 0.022806167602539062, 0.02896881103515625, 0.03513145446777344, 0.041294097900390625, 0.04745674133300781, 0.053619384765625, 0.05978202819824219, 0.06594467163085938, 0.07210731506347656, 0.07826995849609375, 0.08443260192871094, 0.09059524536132812, 0.09675788879394531, 0.1029205322265625, 0.10908317565917969, 0.11524581909179688, 0.12140846252441406, 0.12757110595703125, 0.13373374938964844, 0.13989639282226562, 0.1460590362548828, 0.1522216796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 8.0, 11.0, 10.0, 27.0, 37.0, 59.0, 91.0, 148.0, 151.0, 125.0, 119.0, 70.0, 42.0, 37.0, 30.0, 13.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.825764775276184e-05, -1.738220453262329e-05, -1.650676131248474e-05, -1.563131809234619e-05, -1.4755874872207642e-05, -1.3880431652069092e-05, -1.3004988431930542e-05, -1.2129545211791992e-05, -1.1254101991653442e-05, -1.0378658771514893e-05, -9.503215551376343e-06, -8.627772331237793e-06, -7.752329111099243e-06, -6.876885890960693e-06, -6.0014426708221436e-06, -5.125999450683594e-06, -4.250556230545044e-06, -3.375113010406494e-06, -2.4996697902679443e-06, -1.6242265701293945e-06, -7.487833499908447e-07, 1.2665987014770508e-07, 1.0021030902862549e-06, 1.8775463104248047e-06, 2.7529895305633545e-06, 3.6284327507019043e-06, 4.503875970840454e-06, 5.379319190979004e-06, 6.254762411117554e-06, 7.1302056312561035e-06, 8.005648851394653e-06, 8.881092071533203e-06, 9.756535291671753e-06, 1.0631978511810303e-05, 1.1507421731948853e-05, 1.2382864952087402e-05, 1.3258308172225952e-05, 1.4133751392364502e-05, 1.5009194612503052e-05, 1.58846378326416e-05, 1.676008105278015e-05, 1.76355242729187e-05, 1.851096749305725e-05, 1.93864107131958e-05, 2.026185393333435e-05, 2.11372971534729e-05, 2.201274037361145e-05, 2.288818359375e-05, 2.376362681388855e-05, 2.46390700340271e-05, 2.551451325416565e-05, 2.63899564743042e-05, 2.726539969444275e-05, 2.81408429145813e-05, 2.901628613471985e-05, 2.98917293548584e-05, 3.076717257499695e-05, 3.16426157951355e-05, 3.251805901527405e-05, 3.33935022354126e-05, 3.426894545555115e-05, 3.51443886756897e-05, 3.601983189582825e-05, 3.68952751159668e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 8.0, 8.0, 11.0, 21.0, 22.0, 55.0, 88.0, 161.0, 282.0, 651.0, 1894.0, 7260.0, 99331.0, 918212.0, 15632.0, 2989.0, 997.0, 416.0, 201.0, 113.0, 57.0, 36.0, 33.0, 20.0, 12.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.0976724624633789, -0.09420967102050781, -0.09074687957763672, -0.08728408813476562, -0.08382129669189453, -0.08035850524902344, -0.07689571380615234, -0.07343292236328125, -0.06997013092041016, -0.06650733947753906, -0.06304454803466797, -0.059581756591796875, -0.05611896514892578, -0.05265617370605469, -0.049193382263183594, -0.0457305908203125, -0.042267799377441406, -0.03880500793457031, -0.03534221649169922, -0.031879425048828125, -0.02841663360595703, -0.024953842163085938, -0.021491050720214844, -0.01802825927734375, -0.014565467834472656, -0.011102676391601562, -0.007639884948730469, -0.004177093505859375, -0.0007143020629882812, 0.0027484893798828125, 0.006211280822753906, 0.009674072265625, 0.013136863708496094, 0.016599655151367188, 0.02006244659423828, 0.023525238037109375, 0.02698802947998047, 0.030450820922851562, 0.033913612365722656, 0.03737640380859375, 0.040839195251464844, 0.04430198669433594, 0.04776477813720703, 0.051227569580078125, 0.05469036102294922, 0.05815315246582031, 0.061615943908691406, 0.0650787353515625, 0.0685415267944336, 0.07200431823730469, 0.07546710968017578, 0.07892990112304688, 0.08239269256591797, 0.08585548400878906, 0.08931827545166016, 0.09278106689453125, 0.09624385833740234, 0.09970664978027344, 0.10316944122314453, 0.10663223266601562, 0.11009502410888672, 0.11355781555175781, 0.1170206069946289, 0.1204833984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 8.0, 7.0, 14.0, 23.0, 44.0, 77.0, 274.0, 350.0, 74.0, 41.0, 23.0, 14.0, 6.0, 10.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.011848926544189453, -0.011155128479003906, -0.01046133041381836, -0.009767532348632812, -0.009073734283447266, -0.008379936218261719, -0.007686138153076172, -0.006992340087890625, -0.006298542022705078, -0.005604743957519531, -0.004910945892333984, -0.0042171478271484375, -0.0035233497619628906, -0.0028295516967773438, -0.002135753631591797, -0.00144195556640625, -0.0007481575012207031, -5.435943603515625e-05, 0.0006394386291503906, 0.0013332366943359375, 0.0020270347595214844, 0.0027208328247070312, 0.003414630889892578, 0.004108428955078125, 0.004802227020263672, 0.005496025085449219, 0.006189823150634766, 0.0068836212158203125, 0.007577419281005859, 0.008271217346191406, 0.008965015411376953, 0.0096588134765625, 0.010352611541748047, 0.011046409606933594, 0.01174020767211914, 0.012434005737304688, 0.013127803802490234, 0.013821601867675781, 0.014515399932861328, 0.015209197998046875, 0.015902996063232422, 0.01659679412841797, 0.017290592193603516, 0.017984390258789062, 0.01867818832397461, 0.019371986389160156, 0.020065784454345703, 0.02075958251953125, 0.021453380584716797, 0.022147178649902344, 0.02284097671508789, 0.023534774780273438, 0.024228572845458984, 0.02492237091064453, 0.025616168975830078, 0.026309967041015625, 0.027003765106201172, 0.02769756317138672, 0.028391361236572266, 0.029085159301757812, 0.02977895736694336, 0.030472755432128906, 0.031166553497314453, 0.0318603515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 32.0, 46.0, 108.0, 209.0, 261.0, 137.0, 77.0, 30.0, 13.0, 19.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.129145622253418, -4.015045166015625, -3.900944709777832, -3.786844253540039, -3.672743558883667, -3.558643102645874, -3.444542646408081, -3.330442190170288, -3.216341495513916, -3.102241039276123, -2.98814058303833, -2.874040126800537, -2.759939432144165, -2.645838975906372, -2.531738519668579, -2.417638063430786, -2.303537607192993, -2.1894371509552, -2.0753366947174072, -1.9612361192703247, -1.8471355438232422, -1.7330350875854492, -1.6189346313476562, -1.5048341751098633, -1.3907335996627808, -1.2766331434249878, -1.1625325679779053, -1.0484321117401123, -0.9343315958976746, -0.8202310800552368, -0.7061306238174438, -0.5920301079750061, -0.47792959213256836, -0.3638290762901306, -0.24972859025001526, -0.1356281042098999, -0.021527588367462158, 0.09257292747497559, 0.20667338371276855, 0.3207738995552063, 0.43487441539764404, 0.5489749312400818, 0.6630754470825195, 0.7771759033203125, 0.8912764191627502, 1.005376935005188, 1.119477391242981, 1.2335779666900635, 1.3476784229278564, 1.4617788791656494, 1.575879454612732, 1.689979910850525, 1.8040804862976074, 1.9181809425354004, 2.0322813987731934, 2.1463818550109863, 2.2604823112487793, 2.3745827674865723, 2.4886832237243652, 2.602783679962158, 2.7168843746185303, 2.8309848308563232, 2.945085287094116, 3.059185743331909, 3.1732864379882812]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 9.0, 4.0, 5.0, 9.0, 11.0, 15.0, 29.0, 20.0, 45.0, 45.0, 49.0, 54.0, 53.0, 57.0, 60.0, 54.0, 58.0, 66.0, 42.0, 45.0, 47.0, 35.0, 29.0, 23.0, 10.0, 19.0, 15.0, 19.0, 21.0, 5.0, 13.0, 2.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3247147798538208, -1.2860833406448364, -1.2474520206451416, -1.2088205814361572, -1.1701891422271729, -1.1315577030181885, -1.0929263830184937, -1.0542949438095093, -1.0156636238098145, -0.9770322442054749, -0.9384008049964905, -0.8997694253921509, -0.8611379861831665, -0.8225066065788269, -0.7838752269744873, -0.7452437877655029, -0.7066123485565186, -0.667980968952179, -0.6293495297431946, -0.590718150138855, -0.5520867109298706, -0.513455331325531, -0.4748239517211914, -0.4361925423145294, -0.39756113290786743, -0.35892972350120544, -0.32029831409454346, -0.28166693449020386, -0.24303552508354187, -0.20440411567687988, -0.1657727211713791, -0.1271413266658783, -0.08851003646850586, -0.04987863451242447, -0.011247232556343079, 0.027384169399738312, 0.0660155713558197, 0.10464698076248169, 0.14327837526798248, 0.18190976977348328, 0.22054117918014526, 0.25917258858680725, 0.29780399799346924, 0.33643537759780884, 0.3750667870044708, 0.4136981964111328, 0.4523295760154724, 0.4909609854221344, 0.5295923948287964, 0.568223774433136, 0.6068552136421204, 0.64548659324646, 0.6841180324554443, 0.7227494120597839, 0.7613807916641235, 0.8000122308731079, 0.8386436104774475, 0.8772749900817871, 0.9159064292907715, 0.9545378088951111, 0.9931691884994507, 1.031800627708435, 1.0704320669174194, 1.1090633869171143, 1.1476948261260986]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 14.0, 18.0, 30.0, 37.0, 50.0, 95.0, 148.0, 256.0, 429.0, 794.0, 1563.0, 3264.0, 7900.0, 21247.0, 71944.0, 354205.0, 458317.0, 86806.0, 24890.0, 8904.0, 3762.0, 1779.0, 894.0, 477.0, 267.0, 139.0, 95.0, 72.0, 37.0, 31.0, 15.0, 11.0, 14.0, 7.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.361328125, -1.322509765625, -1.28369140625, -1.244873046875, -1.2060546875, -1.167236328125, -1.12841796875, -1.089599609375, -1.05078125, -1.011962890625, -0.97314453125, -0.934326171875, -0.8955078125, -0.856689453125, -0.81787109375, -0.779052734375, -0.740234375, -0.701416015625, -0.66259765625, -0.623779296875, -0.5849609375, -0.546142578125, -0.50732421875, -0.468505859375, -0.4296875, -0.390869140625, -0.35205078125, -0.313232421875, -0.2744140625, -0.235595703125, -0.19677734375, -0.157958984375, -0.119140625, -0.080322265625, -0.04150390625, -0.002685546875, 0.0361328125, 0.074951171875, 0.11376953125, 0.152587890625, 0.19140625, 0.230224609375, 0.26904296875, 0.307861328125, 0.3466796875, 0.385498046875, 0.42431640625, 0.463134765625, 0.501953125, 0.540771484375, 0.57958984375, 0.618408203125, 0.6572265625, 0.696044921875, 0.73486328125, 0.773681640625, 0.8125, 0.851318359375, 0.89013671875, 0.928955078125, 0.9677734375, 1.006591796875, 1.04541015625, 1.084228515625, 1.123046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 18.0, 12.0, 16.0, 10.0, 15.0, 19.0, 27.0, 32.0, 44.0, 41.0, 52.0, 61.0, 57.0, 60.0, 73.0, 58.0, 43.0, 43.0, 57.0, 35.0, 43.0, 30.0, 32.0, 16.0, 22.0, 10.0, 8.0, 14.0, 11.0, 5.0, 2.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.419921875, -3.330657958984375, -3.24139404296875, -3.152130126953125, -3.0628662109375, -2.973602294921875, -2.88433837890625, -2.795074462890625, -2.705810546875, -2.616546630859375, -2.52728271484375, -2.438018798828125, -2.3487548828125, -2.259490966796875, -2.17022705078125, -2.080963134765625, -1.99169921875, -1.902435302734375, -1.81317138671875, -1.723907470703125, -1.6346435546875, -1.545379638671875, -1.45611572265625, -1.366851806640625, -1.277587890625, -1.188323974609375, -1.09906005859375, -1.009796142578125, -0.9205322265625, -0.831268310546875, -0.74200439453125, -0.652740478515625, -0.5634765625, -0.474212646484375, -0.38494873046875, -0.295684814453125, -0.2064208984375, -0.117156982421875, -0.02789306640625, 0.061370849609375, 0.150634765625, 0.239898681640625, 0.32916259765625, 0.418426513671875, 0.5076904296875, 0.596954345703125, 0.68621826171875, 0.775482177734375, 0.86474609375, 0.954010009765625, 1.04327392578125, 1.132537841796875, 1.2218017578125, 1.311065673828125, 1.40032958984375, 1.489593505859375, 1.578857421875, 1.668121337890625, 1.75738525390625, 1.846649169921875, 1.9359130859375, 2.025177001953125, 2.11444091796875, 2.203704833984375, 2.29296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 6.0, 3.0, 11.0, 13.0, 8.0, 11.0, 14.0, 16.0, 30.0, 37.0, 35.0, 31.0, 35.0, 34.0, 35.0, 42.0, 80.0, 677.0, 854934.0, 191594.0, 453.0, 81.0, 35.0, 49.0, 44.0, 32.0, 23.0, 29.0, 37.0, 16.0, 21.0, 24.0, 16.0, 13.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.21875, -8.95489501953125, -8.6910400390625, -8.42718505859375, -8.163330078125, -7.89947509765625, -7.6356201171875, -7.37176513671875, -7.10791015625, -6.84405517578125, -6.5802001953125, -6.31634521484375, -6.052490234375, -5.78863525390625, -5.5247802734375, -5.26092529296875, -4.9970703125, -4.73321533203125, -4.4693603515625, -4.20550537109375, -3.941650390625, -3.67779541015625, -3.4139404296875, -3.15008544921875, -2.88623046875, -2.62237548828125, -2.3585205078125, -2.09466552734375, -1.830810546875, -1.56695556640625, -1.3031005859375, -1.03924560546875, -0.775390625, -0.51153564453125, -0.2476806640625, 0.01617431640625, 0.280029296875, 0.54388427734375, 0.8077392578125, 1.07159423828125, 1.33544921875, 1.59930419921875, 1.8631591796875, 2.12701416015625, 2.390869140625, 2.65472412109375, 2.9185791015625, 3.18243408203125, 3.4462890625, 3.71014404296875, 3.9739990234375, 4.23785400390625, 4.501708984375, 4.76556396484375, 5.0294189453125, 5.29327392578125, 5.55712890625, 5.82098388671875, 6.0848388671875, 6.34869384765625, 6.612548828125, 6.87640380859375, 7.1402587890625, 7.40411376953125, 7.66796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 7.0, 5.0, 8.0, 11.0, 8.0, 12.0, 14.0, 19.0, 35.0, 32.0, 42.0, 30.0, 32.0, 31.0, 38.0, 46.0, 45.0, 44.0, 60.0, 39.0, 38.0, 37.0, 38.0, 33.0, 37.0, 37.0, 33.0, 36.0, 22.0, 25.0, 20.0, 15.0, 22.0, 15.0, 3.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.891021728515625, -2.80548095703125, -2.719940185546875, -2.6343994140625, -2.548858642578125, -2.46331787109375, -2.377777099609375, -2.292236328125, -2.206695556640625, -2.12115478515625, -2.035614013671875, -1.9500732421875, -1.864532470703125, -1.77899169921875, -1.693450927734375, -1.60791015625, -1.522369384765625, -1.43682861328125, -1.351287841796875, -1.2657470703125, -1.180206298828125, -1.09466552734375, -1.009124755859375, -0.923583984375, -0.838043212890625, -0.75250244140625, -0.666961669921875, -0.5814208984375, -0.495880126953125, -0.41033935546875, -0.324798583984375, -0.2392578125, -0.153717041015625, -0.06817626953125, 0.017364501953125, 0.1029052734375, 0.188446044921875, 0.27398681640625, 0.359527587890625, 0.445068359375, 0.530609130859375, 0.61614990234375, 0.701690673828125, 0.7872314453125, 0.872772216796875, 0.95831298828125, 1.043853759765625, 1.12939453125, 1.214935302734375, 1.30047607421875, 1.386016845703125, 1.4715576171875, 1.557098388671875, 1.64263916015625, 1.728179931640625, 1.813720703125, 1.899261474609375, 1.98480224609375, 2.070343017578125, 2.1558837890625, 2.241424560546875, 2.32696533203125, 2.412506103515625, 2.498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 18.0, 23.0, 37.0, 54.0, 82.0, 126.0, 232.0, 449.0, 832.0, 2053.0, 5649.0, 25278.0, 307525.0, 655078.0, 38707.0, 7563.0, 2500.0, 1101.0, 519.0, 293.0, 160.0, 80.0, 44.0, 44.0, 34.0, 11.0, 13.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.7095108032226562, -0.6851348876953125, -0.6607589721679688, -0.636383056640625, -0.6120071411132812, -0.5876312255859375, -0.5632553100585938, -0.53887939453125, -0.5145034790039062, -0.4901275634765625, -0.46575164794921875, -0.441375732421875, -0.41699981689453125, -0.3926239013671875, -0.36824798583984375, -0.3438720703125, -0.31949615478515625, -0.2951202392578125, -0.27074432373046875, -0.246368408203125, -0.22199249267578125, -0.1976165771484375, -0.17324066162109375, -0.14886474609375, -0.12448883056640625, -0.1001129150390625, -0.07573699951171875, -0.051361083984375, -0.02698516845703125, -0.0026092529296875, 0.02176666259765625, 0.046142578125, 0.07051849365234375, 0.0948944091796875, 0.11927032470703125, 0.143646240234375, 0.16802215576171875, 0.1923980712890625, 0.21677398681640625, 0.24114990234375, 0.26552581787109375, 0.2899017333984375, 0.31427764892578125, 0.338653564453125, 0.36302947998046875, 0.3874053955078125, 0.41178131103515625, 0.4361572265625, 0.46053314208984375, 0.4849090576171875, 0.5092849731445312, 0.533660888671875, 0.5580368041992188, 0.5824127197265625, 0.6067886352539062, 0.63116455078125, 0.6555404663085938, 0.6799163818359375, 0.7042922973632812, 0.728668212890625, 0.7530441284179688, 0.7774200439453125, 0.8017959594726562, 0.826171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 8.0, 15.0, 16.0, 38.0, 43.0, 72.0, 141.0, 199.0, 145.0, 109.0, 61.0, 33.0, 38.0, 14.0, 19.0, 8.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001399517059326172, -0.00013592466711997986, -0.00013189762830734253, -0.0001278705894947052, -0.00012384355068206787, -0.00011981651186943054, -0.00011578947305679321, -0.00011176243424415588, -0.00010773539543151855, -0.00010370835661888123, -9.96813178062439e-05, -9.565427899360657e-05, -9.162724018096924e-05, -8.760020136833191e-05, -8.357316255569458e-05, -7.954612374305725e-05, -7.551908493041992e-05, -7.149204611778259e-05, -6.746500730514526e-05, -6.343796849250793e-05, -5.9410929679870605e-05, -5.5383890867233276e-05, -5.135685205459595e-05, -4.732981324195862e-05, -4.330277442932129e-05, -3.927573561668396e-05, -3.524869680404663e-05, -3.12216579914093e-05, -2.7194619178771973e-05, -2.3167580366134644e-05, -1.9140541553497314e-05, -1.5113502740859985e-05, -1.1086463928222656e-05, -7.059425115585327e-06, -3.032386302947998e-06, 9.94652509689331e-07, 5.02169132232666e-06, 9.04873013496399e-06, 1.3075768947601318e-05, 1.7102807760238647e-05, 2.1129846572875977e-05, 2.5156885385513306e-05, 2.9183924198150635e-05, 3.3210963010787964e-05, 3.723800182342529e-05, 4.126504063606262e-05, 4.529207944869995e-05, 4.931911826133728e-05, 5.334615707397461e-05, 5.737319588661194e-05, 6.140023469924927e-05, 6.54272735118866e-05, 6.945431232452393e-05, 7.348135113716125e-05, 7.750838994979858e-05, 8.153542876243591e-05, 8.556246757507324e-05, 8.958950638771057e-05, 9.36165452003479e-05, 9.764358401298523e-05, 0.00010167062282562256, 0.00010569766163825989, 0.00010972470045089722, 0.00011375173926353455, 0.00011777877807617188]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 9.0, 6.0, 12.0, 8.0, 16.0, 29.0, 35.0, 45.0, 82.0, 107.0, 226.0, 338.0, 727.0, 1469.0, 3319.0, 9574.0, 39787.0, 297847.0, 609315.0, 63743.0, 13805.0, 4344.0, 1761.0, 875.0, 425.0, 233.0, 151.0, 82.0, 43.0, 32.0, 32.0, 17.0, 15.0, 15.0, 13.0, 6.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.56024169921875, -0.5433349609375, -0.52642822265625, -0.509521484375, -0.49261474609375, -0.4757080078125, -0.45880126953125, -0.44189453125, -0.42498779296875, -0.4080810546875, -0.39117431640625, -0.374267578125, -0.35736083984375, -0.3404541015625, -0.32354736328125, -0.306640625, -0.28973388671875, -0.2728271484375, -0.25592041015625, -0.239013671875, -0.22210693359375, -0.2052001953125, -0.18829345703125, -0.17138671875, -0.15447998046875, -0.1375732421875, -0.12066650390625, -0.103759765625, -0.08685302734375, -0.0699462890625, -0.05303955078125, -0.0361328125, -0.01922607421875, -0.0023193359375, 0.01458740234375, 0.031494140625, 0.04840087890625, 0.0653076171875, 0.08221435546875, 0.09912109375, 0.11602783203125, 0.1329345703125, 0.14984130859375, 0.166748046875, 0.18365478515625, 0.2005615234375, 0.21746826171875, 0.234375, 0.25128173828125, 0.2681884765625, 0.28509521484375, 0.302001953125, 0.31890869140625, 0.3358154296875, 0.35272216796875, 0.36962890625, 0.38653564453125, 0.4034423828125, 0.42034912109375, 0.437255859375, 0.45416259765625, 0.4710693359375, 0.48797607421875, 0.5048828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 1.0, 11.0, 13.0, 20.0, 22.0, 29.0, 27.0, 38.0, 54.0, 71.0, 105.0, 129.0, 116.0, 84.0, 64.0, 45.0, 41.0, 26.0, 20.0, 13.0, 10.0, 16.0, 11.0, 11.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22705078125, -0.2201061248779297, -0.21316146850585938, -0.20621681213378906, -0.19927215576171875, -0.19232749938964844, -0.18538284301757812, -0.1784381866455078, -0.1714935302734375, -0.1645488739013672, -0.15760421752929688, -0.15065956115722656, -0.14371490478515625, -0.13677024841308594, -0.12982559204101562, -0.12288093566894531, -0.115936279296875, -0.10899162292480469, -0.10204696655273438, -0.09510231018066406, -0.08815765380859375, -0.08121299743652344, -0.07426834106445312, -0.06732368469238281, -0.0603790283203125, -0.05343437194824219, -0.046489715576171875, -0.03954505920410156, -0.03260040283203125, -0.025655746459960938, -0.018711090087890625, -0.011766433715820312, -0.00482177734375, 0.0021228790283203125, 0.009067535400390625, 0.016012191772460938, 0.02295684814453125, 0.029901504516601562, 0.036846160888671875, 0.04379081726074219, 0.0507354736328125, 0.05768013000488281, 0.06462478637695312, 0.07156944274902344, 0.07851409912109375, 0.08545875549316406, 0.09240341186523438, 0.09934806823730469, 0.106292724609375, 0.11323738098144531, 0.12018203735351562, 0.12712669372558594, 0.13407135009765625, 0.14101600646972656, 0.14796066284179688, 0.1549053192138672, 0.1618499755859375, 0.1687946319580078, 0.17573928833007812, 0.18268394470214844, 0.18962860107421875, 0.19657325744628906, 0.20351791381835938, 0.2104625701904297, 0.2174072265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 14.0, 27.0, 58.0, 239.0, 429.0, 153.0, 47.0, 19.0, 11.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8340229988098145, -4.407226085662842, -3.980429172515869, -3.5536322593688965, -3.126835346221924, -2.7000386714935303, -2.2732417583465576, -1.846444845199585, -1.4196479320526123, -0.9928510189056396, -0.5660541653633118, -0.1392573118209839, 0.28753960132598877, 0.7143363952636719, 1.1411333084106445, 1.5679302215576172, 1.9947271347045898, 2.4215240478515625, 2.848320960998535, 3.275117874145508, 3.7019147872924805, 4.128711700439453, 4.555508613586426, 4.982305526733398, 5.409102439880371, 5.835899353027344, 6.262696266174316, 6.689493179321289, 7.116290092468262, 7.543087005615234, 7.969883918762207, 8.39668083190918, 8.823477745056152, 9.250274658203125, 9.677071571350098, 10.10386848449707, 10.530665397644043, 10.957462310791016, 11.384259223937988, 11.811056137084961, 12.237853050231934, 12.664649963378906, 13.091446876525879, 13.518243789672852, 13.945040702819824, 14.371837615966797, 14.79863452911377, 15.225431442260742, 15.652227401733398, 16.079023361206055, 16.505821228027344, 16.9326171875, 17.35941505432129, 17.786211013793945, 18.213008880615234, 18.63980484008789, 19.06660270690918, 19.493398666381836, 19.920196533203125, 20.34699249267578, 20.77379035949707, 21.200586318969727, 21.627384185791016, 22.054180145263672, 22.48097801208496]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 14.0, 9.0, 9.0, 30.0, 15.0, 23.0, 39.0, 48.0, 45.0, 46.0, 37.0, 59.0, 56.0, 69.0, 66.0, 56.0, 55.0, 57.0, 53.0, 46.0, 34.0, 40.0, 21.0, 15.0, 14.0, 7.0, 14.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.458180904388428, -6.271032810211182, -6.0838847160339355, -5.8967366218566895, -5.709588050842285, -5.522439956665039, -5.335291862487793, -5.148143768310547, -4.960995674133301, -4.773847579956055, -4.586699485778809, -4.3995513916015625, -4.212403297424316, -4.025254726409912, -3.838106632232666, -3.65095853805542, -3.463810443878174, -3.2766623497009277, -3.0895142555236816, -2.9023659229278564, -2.7152178287506104, -2.5280697345733643, -2.340921401977539, -2.153773307800293, -1.9666252136230469, -1.7794771194458008, -1.5923289060592651, -1.4051806926727295, -1.2180325984954834, -1.0308845043182373, -0.8437362909317017, -0.656588077545166, -0.4694399833679199, -0.28229182958602905, -0.09514367580413818, 0.09200447797775269, 0.27915263175964355, 0.4663007855415344, 0.6534489393234253, 0.8405971527099609, 1.027745246887207, 1.2148933410644531, 1.4020415544509888, 1.5891897678375244, 1.7763378620147705, 1.9634859561920166, 2.150634288787842, 2.337782382965088, 2.524930477142334, 2.71207857131958, 2.899226665496826, 3.0863749980926514, 3.2735230922698975, 3.4606711864471436, 3.6478195190429688, 3.834967613220215, 4.022115707397461, 4.209263801574707, 4.396411895751953, 4.583559989929199, 4.770708084106445, 4.95785665512085, 5.145004749298096, 5.332152843475342, 5.519300937652588]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 4.0, 7.0, 9.0, 12.0, 18.0, 39.0, 58.0, 95.0, 198.0, 448.0, 1126.0, 3983.0, 22101.0, 374345.0, 3678009.0, 99011.0, 11015.0, 2406.0, 756.0, 324.0, 145.0, 74.0, 38.0, 22.0, 11.0, 8.0, 3.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.960357666015625, -4.83087158203125, -4.701385498046875, -4.5718994140625, -4.442413330078125, -4.31292724609375, -4.183441162109375, -4.053955078125, -3.924468994140625, -3.79498291015625, -3.665496826171875, -3.5360107421875, -3.406524658203125, -3.27703857421875, -3.147552490234375, -3.01806640625, -2.888580322265625, -2.75909423828125, -2.629608154296875, -2.5001220703125, -2.370635986328125, -2.24114990234375, -2.111663818359375, -1.982177734375, -1.852691650390625, -1.72320556640625, -1.593719482421875, -1.4642333984375, -1.334747314453125, -1.20526123046875, -1.075775146484375, -0.9462890625, -0.816802978515625, -0.68731689453125, -0.557830810546875, -0.4283447265625, -0.298858642578125, -0.16937255859375, -0.039886474609375, 0.089599609375, 0.219085693359375, 0.34857177734375, 0.478057861328125, 0.6075439453125, 0.737030029296875, 0.86651611328125, 0.996002197265625, 1.12548828125, 1.254974365234375, 1.38446044921875, 1.513946533203125, 1.6434326171875, 1.772918701171875, 1.90240478515625, 2.031890869140625, 2.161376953125, 2.290863037109375, 2.42034912109375, 2.549835205078125, 2.6793212890625, 2.808807373046875, 2.93829345703125, 3.067779541015625, 3.197265625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 7.0, 3.0, 4.0, 4.0, 9.0, 9.0, 21.0, 14.0, 18.0, 18.0, 31.0, 33.0, 46.0, 49.0, 60.0, 61.0, 51.0, 72.0, 52.0, 53.0, 58.0, 50.0, 39.0, 36.0, 27.0, 24.0, 16.0, 15.0, 19.0, 13.0, 17.0, 17.0, 12.0, 8.0, 2.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4296875, -1.3863525390625, -1.343017578125, -1.2996826171875, -1.25634765625, -1.2130126953125, -1.169677734375, -1.1263427734375, -1.0830078125, -1.0396728515625, -0.996337890625, -0.9530029296875, -0.90966796875, -0.8663330078125, -0.822998046875, -0.7796630859375, -0.736328125, -0.6929931640625, -0.649658203125, -0.6063232421875, -0.56298828125, -0.5196533203125, -0.476318359375, -0.4329833984375, -0.3896484375, -0.3463134765625, -0.302978515625, -0.2596435546875, -0.21630859375, -0.1729736328125, -0.129638671875, -0.0863037109375, -0.04296875, 0.0003662109375, 0.043701171875, 0.0870361328125, 0.13037109375, 0.1737060546875, 0.217041015625, 0.2603759765625, 0.3037109375, 0.3470458984375, 0.390380859375, 0.4337158203125, 0.47705078125, 0.5203857421875, 0.563720703125, 0.6070556640625, 0.650390625, 0.6937255859375, 0.737060546875, 0.7803955078125, 0.82373046875, 0.8670654296875, 0.910400390625, 0.9537353515625, 0.9970703125, 1.0404052734375, 1.083740234375, 1.1270751953125, 1.17041015625, 1.2137451171875, 1.257080078125, 1.3004150390625, 1.34375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 23.0, 39.0, 74.0, 162.0, 318.0, 1010.0, 4896.0, 77196.0, 4029152.0, 74834.0, 4925.0, 958.0, 322.0, 137.0, 66.0, 44.0, 27.0, 15.0, 11.0, 7.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3671875, -7.17578125, -6.984375, -6.79296875, -6.6015625, -6.41015625, -6.21875, -6.02734375, -5.8359375, -5.64453125, -5.453125, -5.26171875, -5.0703125, -4.87890625, -4.6875, -4.49609375, -4.3046875, -4.11328125, -3.921875, -3.73046875, -3.5390625, -3.34765625, -3.15625, -2.96484375, -2.7734375, -2.58203125, -2.390625, -2.19921875, -2.0078125, -1.81640625, -1.625, -1.43359375, -1.2421875, -1.05078125, -0.859375, -0.66796875, -0.4765625, -0.28515625, -0.09375, 0.09765625, 0.2890625, 0.48046875, 0.671875, 0.86328125, 1.0546875, 1.24609375, 1.4375, 1.62890625, 1.8203125, 2.01171875, 2.203125, 2.39453125, 2.5859375, 2.77734375, 2.96875, 3.16015625, 3.3515625, 3.54296875, 3.734375, 3.92578125, 4.1171875, 4.30859375, 4.5, 4.69140625, 4.8828125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 5.0, 12.0, 13.0, 21.0, 21.0, 26.0, 27.0, 39.0, 37.0, 64.0, 96.0, 99.0, 136.0, 170.0, 263.0, 475.0, 875.0, 537.0, 321.0, 212.0, 142.0, 110.0, 70.0, 75.0, 49.0, 37.0, 18.0, 20.0, 18.0, 12.0, 10.0, 10.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55712890625, -0.5418930053710938, -0.5266571044921875, -0.5114212036132812, -0.496185302734375, -0.48094940185546875, -0.4657135009765625, -0.45047760009765625, -0.43524169921875, -0.42000579833984375, -0.4047698974609375, -0.38953399658203125, -0.374298095703125, -0.35906219482421875, -0.3438262939453125, -0.32859039306640625, -0.3133544921875, -0.29811859130859375, -0.2828826904296875, -0.26764678955078125, -0.252410888671875, -0.23717498779296875, -0.2219390869140625, -0.20670318603515625, -0.19146728515625, -0.17623138427734375, -0.1609954833984375, -0.14575958251953125, -0.130523681640625, -0.11528778076171875, -0.1000518798828125, -0.08481597900390625, -0.069580078125, -0.05434417724609375, -0.0391082763671875, -0.02387237548828125, -0.008636474609375, 0.00659942626953125, 0.0218353271484375, 0.03707122802734375, 0.05230712890625, 0.06754302978515625, 0.0827789306640625, 0.09801483154296875, 0.113250732421875, 0.12848663330078125, 0.1437225341796875, 0.15895843505859375, 0.1741943359375, 0.18943023681640625, 0.2046661376953125, 0.21990203857421875, 0.235137939453125, 0.25037384033203125, 0.2656097412109375, 0.28084564208984375, 0.29608154296875, 0.31131744384765625, 0.3265533447265625, 0.34178924560546875, 0.357025146484375, 0.37226104736328125, 0.3874969482421875, 0.40273284912109375, 0.41796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 10.0, 5.0, 11.0, 10.0, 17.0, 21.0, 38.0, 72.0, 108.0, 140.0, 172.0, 142.0, 101.0, 54.0, 31.0, 17.0, 13.0, 9.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.207167625427246, -3.095102310180664, -2.983036756515503, -2.870971202850342, -2.7589058876037598, -2.6468405723571777, -2.5347750186920166, -2.4227094650268555, -2.3106441497802734, -2.1985788345336914, -2.0865132808685303, -1.9744478464126587, -1.862382411956787, -1.7503169775009155, -1.638251543045044, -1.5261861085891724, -1.4141206741333008, -1.3020552396774292, -1.1899898052215576, -1.077924370765686, -0.9658589363098145, -0.8537935018539429, -0.7417280673980713, -0.6296626329421997, -0.5175971984863281, -0.40553176403045654, -0.29346632957458496, -0.18140089511871338, -0.0693354606628418, 0.042729973793029785, 0.15479540824890137, 0.26686084270477295, 0.37892627716064453, 0.4909917116165161, 0.6030571460723877, 0.7151225805282593, 0.8271880149841309, 0.9392534494400024, 1.051318883895874, 1.1633843183517456, 1.2754497528076172, 1.3875151872634888, 1.4995806217193604, 1.611646056175232, 1.7237114906311035, 1.835776925086975, 1.9478423595428467, 2.059907913208008, 2.17197322845459, 2.284038543701172, 2.396104097366333, 2.508169651031494, 2.620234966278076, 2.732300281524658, 2.8443658351898193, 2.9564313888549805, 3.0684967041015625, 3.1805620193481445, 3.2926275730133057, 3.404693126678467, 3.516758441925049, 3.628823757171631, 3.740889310836792, 3.852954864501953, 3.965020179748535]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 9.0, 10.0, 13.0, 16.0, 24.0, 22.0, 25.0, 37.0, 28.0, 38.0, 35.0, 54.0, 49.0, 46.0, 45.0, 59.0, 49.0, 40.0, 43.0, 43.0, 45.0, 39.0, 32.0, 29.0, 18.0, 20.0, 23.0, 19.0, 19.0, 10.0, 6.0, 10.0, 8.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6754878759384155, -1.627683401107788, -1.5798790454864502, -1.5320745706558228, -1.4842700958251953, -1.4364656209945679, -1.3886611461639404, -1.3408567905426025, -1.293052315711975, -1.2452478408813477, -1.1974434852600098, -1.1496390104293823, -1.1018345355987549, -1.0540300607681274, -1.0062255859375, -0.9584212303161621, -0.9106167554855347, -0.8628122806549072, -0.8150078654289246, -0.7672034502029419, -0.7193989753723145, -0.671594500541687, -0.6237900853157043, -0.5759856700897217, -0.5281811952590942, -0.4803767502307892, -0.43257230520248413, -0.3847678601741791, -0.336963415145874, -0.28915897011756897, -0.24135452508926392, -0.19355008006095886, -0.14574551582336426, -0.0979410707950592, -0.05013662576675415, -0.0023321807384490967, 0.04547226428985596, 0.09327670931816101, 0.14108115434646606, 0.18888559937477112, 0.23669004440307617, 0.2844944894313812, 0.3322989344596863, 0.38010337948799133, 0.4279078245162964, 0.47571226954460144, 0.5235167145729065, 0.5713211297988892, 0.6191256046295166, 0.666930079460144, 0.7147344946861267, 0.7625389099121094, 0.8103433847427368, 0.8581478595733643, 0.9059522747993469, 0.9537566900253296, 1.001561164855957, 1.0493656396865845, 1.097170114517212, 1.1449744701385498, 1.1927789449691772, 1.2405834197998047, 1.2883877754211426, 1.33619225025177, 1.3839967250823975]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 12.0, 13.0, 23.0, 33.0, 46.0, 58.0, 94.0, 130.0, 256.0, 376.0, 799.0, 1954.0, 6571.0, 44193.0, 749175.0, 222094.0, 16462.0, 3549.0, 1246.0, 533.0, 327.0, 172.0, 134.0, 70.0, 53.0, 32.0, 30.0, 19.0, 21.0, 16.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3271484375, -0.3168525695800781, -0.30655670166015625, -0.2962608337402344, -0.2859649658203125, -0.2756690979003906, -0.26537322998046875, -0.2550773620605469, -0.244781494140625, -0.23448562622070312, -0.22418975830078125, -0.21389389038085938, -0.2035980224609375, -0.19330215454101562, -0.18300628662109375, -0.17271041870117188, -0.16241455078125, -0.15211868286132812, -0.14182281494140625, -0.13152694702148438, -0.1212310791015625, -0.11093521118164062, -0.10063934326171875, -0.09034347534179688, -0.080047607421875, -0.06975173950195312, -0.05945587158203125, -0.049160003662109375, -0.0388641357421875, -0.028568267822265625, -0.01827239990234375, -0.007976531982421875, 0.0023193359375, 0.012615203857421875, 0.02291107177734375, 0.033206939697265625, 0.0435028076171875, 0.053798675537109375, 0.06409454345703125, 0.07439041137695312, 0.084686279296875, 0.09498214721679688, 0.10527801513671875, 0.11557388305664062, 0.1258697509765625, 0.13616561889648438, 0.14646148681640625, 0.15675735473632812, 0.16705322265625, 0.17734909057617188, 0.18764495849609375, 0.19794082641601562, 0.2082366943359375, 0.21853256225585938, 0.22882843017578125, 0.23912429809570312, 0.249420166015625, 0.2597160339355469, 0.27001190185546875, 0.2803077697753906, 0.2906036376953125, 0.3008995056152344, 0.31119537353515625, 0.3214912414550781, 0.331787109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 9.0, 7.0, 10.0, 17.0, 24.0, 14.0, 21.0, 29.0, 32.0, 40.0, 54.0, 57.0, 42.0, 57.0, 57.0, 52.0, 56.0, 46.0, 49.0, 39.0, 43.0, 37.0, 32.0, 28.0, 17.0, 25.0, 15.0, 10.0, 12.0, 10.0, 11.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.0732421875, -1.0401611328125, -1.007080078125, -0.9739990234375, -0.94091796875, -0.9078369140625, -0.874755859375, -0.8416748046875, -0.80859375, -0.7755126953125, -0.742431640625, -0.7093505859375, -0.67626953125, -0.6431884765625, -0.610107421875, -0.5770263671875, -0.5439453125, -0.5108642578125, -0.477783203125, -0.4447021484375, -0.41162109375, -0.3785400390625, -0.345458984375, -0.3123779296875, -0.279296875, -0.2462158203125, -0.213134765625, -0.1800537109375, -0.14697265625, -0.1138916015625, -0.080810546875, -0.0477294921875, -0.0146484375, 0.0184326171875, 0.051513671875, 0.0845947265625, 0.11767578125, 0.1507568359375, 0.183837890625, 0.2169189453125, 0.25, 0.2830810546875, 0.316162109375, 0.3492431640625, 0.38232421875, 0.4154052734375, 0.448486328125, 0.4815673828125, 0.5146484375, 0.5477294921875, 0.580810546875, 0.6138916015625, 0.64697265625, 0.6800537109375, 0.713134765625, 0.7462158203125, 0.779296875, 0.8123779296875, 0.845458984375, 0.8785400390625, 0.91162109375, 0.9447021484375, 0.977783203125, 1.0108642578125, 1.0439453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 8.0, 11.0, 13.0, 26.0, 32.0, 39.0, 58.0, 75.0, 96.0, 144.0, 202.0, 320.0, 589.0, 1656.0, 7219.0, 77036.0, 803060.0, 142335.0, 11705.0, 2032.0, 707.0, 381.0, 206.0, 180.0, 104.0, 86.0, 56.0, 45.0, 31.0, 26.0, 17.0, 5.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1795654296875, -0.17305946350097656, -0.16655349731445312, -0.1600475311279297, -0.15354156494140625, -0.1470355987548828, -0.14052963256835938, -0.13402366638183594, -0.1275177001953125, -0.12101173400878906, -0.11450576782226562, -0.10799980163574219, -0.10149383544921875, -0.09498786926269531, -0.08848190307617188, -0.08197593688964844, -0.075469970703125, -0.06896400451660156, -0.062458038330078125, -0.05595207214355469, -0.04944610595703125, -0.04294013977050781, -0.036434173583984375, -0.029928207397460938, -0.0234222412109375, -0.016916275024414062, -0.010410308837890625, -0.0039043426513671875, 0.00260162353515625, 0.009107589721679688, 0.015613555908203125, 0.022119522094726562, 0.02862548828125, 0.03513145446777344, 0.041637420654296875, 0.04814338684082031, 0.05464935302734375, 0.06115531921386719, 0.06766128540039062, 0.07416725158691406, 0.0806732177734375, 0.08717918395996094, 0.09368515014648438, 0.10019111633300781, 0.10669708251953125, 0.11320304870605469, 0.11970901489257812, 0.12621498107910156, 0.132720947265625, 0.13922691345214844, 0.14573287963867188, 0.1522388458251953, 0.15874481201171875, 0.1652507781982422, 0.17175674438476562, 0.17826271057128906, 0.1847686767578125, 0.19127464294433594, 0.19778060913085938, 0.2042865753173828, 0.21079254150390625, 0.2172985076904297, 0.22380447387695312, 0.23031044006347656, 0.23681640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 9.0, 7.0, 4.0, 16.0, 10.0, 15.0, 10.0, 22.0, 23.0, 25.0, 28.0, 32.0, 44.0, 44.0, 43.0, 53.0, 51.0, 45.0, 55.0, 44.0, 41.0, 45.0, 40.0, 47.0, 38.0, 31.0, 29.0, 27.0, 24.0, 14.0, 15.0, 14.0, 8.0, 11.0, 9.0, 4.0, 10.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6826171875, -1.63177490234375, -1.5809326171875, -1.53009033203125, -1.479248046875, -1.42840576171875, -1.3775634765625, -1.32672119140625, -1.27587890625, -1.22503662109375, -1.1741943359375, -1.12335205078125, -1.072509765625, -1.02166748046875, -0.9708251953125, -0.91998291015625, -0.869140625, -0.81829833984375, -0.7674560546875, -0.71661376953125, -0.665771484375, -0.61492919921875, -0.5640869140625, -0.51324462890625, -0.46240234375, -0.41156005859375, -0.3607177734375, -0.30987548828125, -0.259033203125, -0.20819091796875, -0.1573486328125, -0.10650634765625, -0.0556640625, -0.00482177734375, 0.0460205078125, 0.09686279296875, 0.147705078125, 0.19854736328125, 0.2493896484375, 0.30023193359375, 0.35107421875, 0.40191650390625, 0.4527587890625, 0.50360107421875, 0.554443359375, 0.60528564453125, 0.6561279296875, 0.70697021484375, 0.7578125, 0.80865478515625, 0.8594970703125, 0.91033935546875, 0.961181640625, 1.01202392578125, 1.0628662109375, 1.11370849609375, 1.16455078125, 1.21539306640625, 1.2662353515625, 1.31707763671875, 1.367919921875, 1.41876220703125, 1.4696044921875, 1.52044677734375, 1.5712890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 16.0, 16.0, 15.0, 31.0, 34.0, 24.0, 30.0, 48.0, 63.0, 80.0, 97.0, 125.0, 230.0, 347.0, 788.0, 2422.0, 13505.0, 720317.0, 297149.0, 9728.0, 1790.0, 606.0, 293.0, 194.0, 125.0, 85.0, 93.0, 62.0, 49.0, 37.0, 28.0, 31.0, 20.0, 11.0, 9.0, 10.0, 8.0, 8.0, 3.0, 8.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05755615234375, -0.05556678771972656, -0.053577423095703125, -0.05158805847167969, -0.04959869384765625, -0.04760932922363281, -0.045619964599609375, -0.04363059997558594, -0.0416412353515625, -0.03965187072753906, -0.037662506103515625, -0.03567314147949219, -0.03368377685546875, -0.03169441223144531, -0.029705047607421875, -0.027715682983398438, -0.025726318359375, -0.023736953735351562, -0.021747589111328125, -0.019758224487304688, -0.01776885986328125, -0.015779495239257812, -0.013790130615234375, -0.011800765991210938, -0.0098114013671875, -0.007822036743164062, -0.005832672119140625, -0.0038433074951171875, -0.00185394287109375, 0.0001354217529296875, 0.002124786376953125, 0.0041141510009765625, 0.006103515625, 0.008092880249023438, 0.010082244873046875, 0.012071609497070312, 0.01406097412109375, 0.016050338745117188, 0.018039703369140625, 0.020029067993164062, 0.0220184326171875, 0.024007797241210938, 0.025997161865234375, 0.027986526489257812, 0.02997589111328125, 0.03196525573730469, 0.033954620361328125, 0.03594398498535156, 0.037933349609375, 0.03992271423339844, 0.041912078857421875, 0.04390144348144531, 0.04589080810546875, 0.04788017272949219, 0.049869537353515625, 0.05185890197753906, 0.0538482666015625, 0.05583763122558594, 0.057826995849609375, 0.05981636047363281, 0.06180572509765625, 0.06379508972167969, 0.06578445434570312, 0.06777381896972656, 0.06976318359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 15.0, 20.0, 28.0, 42.0, 65.0, 89.0, 102.0, 114.0, 110.0, 88.0, 77.0, 51.0, 45.0, 29.0, 22.0, 17.0, 13.0, 10.0, 10.0, 8.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-3.039836883544922e-05, -2.9678456485271454e-05, -2.895854413509369e-05, -2.8238631784915924e-05, -2.751871943473816e-05, -2.6798807084560394e-05, -2.607889473438263e-05, -2.5358982384204865e-05, -2.46390700340271e-05, -2.3919157683849335e-05, -2.319924533367157e-05, -2.2479332983493805e-05, -2.175942063331604e-05, -2.1039508283138275e-05, -2.031959593296051e-05, -1.9599683582782745e-05, -1.887977123260498e-05, -1.8159858882427216e-05, -1.743994653224945e-05, -1.6720034182071686e-05, -1.600012183189392e-05, -1.5280209481716156e-05, -1.4560297131538391e-05, -1.3840384781360626e-05, -1.3120472431182861e-05, -1.2400560081005096e-05, -1.1680647730827332e-05, -1.0960735380649567e-05, -1.0240823030471802e-05, -9.520910680294037e-06, -8.800998330116272e-06, -8.081085979938507e-06, -7.361173629760742e-06, -6.641261279582977e-06, -5.921348929405212e-06, -5.2014365792274475e-06, -4.481524229049683e-06, -3.7616118788719177e-06, -3.041699528694153e-06, -2.321787178516388e-06, -1.601874828338623e-06, -8.819624781608582e-07, -1.6205012798309326e-07, 5.578622221946716e-07, 1.2777745723724365e-06, 1.9976869225502014e-06, 2.7175992727279663e-06, 3.437511622905731e-06, 4.157423973083496e-06, 4.877336323261261e-06, 5.597248673439026e-06, 6.317161023616791e-06, 7.037073373794556e-06, 7.75698572397232e-06, 8.476898074150085e-06, 9.19681042432785e-06, 9.916722774505615e-06, 1.063663512468338e-05, 1.1356547474861145e-05, 1.207645982503891e-05, 1.2796372175216675e-05, 1.351628452539444e-05, 1.4236196875572205e-05, 1.495610922574997e-05, 1.5676021575927734e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 16.0, 12.0, 26.0, 40.0, 62.0, 89.0, 177.0, 338.0, 654.0, 1383.0, 3830.0, 14017.0, 119796.0, 860012.0, 36514.0, 7164.0, 2417.0, 895.0, 480.0, 236.0, 137.0, 73.0, 55.0, 27.0, 22.0, 17.0, 10.0, 13.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08740234375, -0.08485221862792969, -0.08230209350585938, -0.07975196838378906, -0.07720184326171875, -0.07465171813964844, -0.07210159301757812, -0.06955146789550781, -0.0670013427734375, -0.06445121765136719, -0.061901092529296875, -0.05935096740722656, -0.05680084228515625, -0.05425071716308594, -0.051700592041015625, -0.04915046691894531, -0.046600341796875, -0.04405021667480469, -0.041500091552734375, -0.03894996643066406, -0.03639984130859375, -0.03384971618652344, -0.031299591064453125, -0.028749465942382812, -0.0261993408203125, -0.023649215698242188, -0.021099090576171875, -0.018548965454101562, -0.01599884033203125, -0.013448715209960938, -0.010898590087890625, -0.008348464965820312, -0.00579833984375, -0.0032482147216796875, -0.000698089599609375, 0.0018520355224609375, 0.00440216064453125, 0.0069522857666015625, 0.009502410888671875, 0.012052536010742188, 0.0146026611328125, 0.017152786254882812, 0.019702911376953125, 0.022253036499023438, 0.02480316162109375, 0.027353286743164062, 0.029903411865234375, 0.03245353698730469, 0.035003662109375, 0.03755378723144531, 0.040103912353515625, 0.04265403747558594, 0.04520416259765625, 0.04775428771972656, 0.050304412841796875, 0.05285453796386719, 0.0554046630859375, 0.05795478820800781, 0.060504913330078125, 0.06305503845214844, 0.06560516357421875, 0.06815528869628906, 0.07070541381835938, 0.07325553894042969, 0.0758056640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 3.0, 14.0, 10.0, 14.0, 22.0, 39.0, 66.0, 98.0, 161.0, 210.0, 125.0, 67.0, 26.0, 24.0, 24.0, 13.0, 13.0, 7.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01253509521484375, -0.012157917022705078, -0.011780738830566406, -0.011403560638427734, -0.011026382446289062, -0.01064920425415039, -0.010272026062011719, -0.009894847869873047, -0.009517669677734375, -0.009140491485595703, -0.008763313293457031, -0.00838613510131836, -0.008008956909179688, -0.007631778717041016, -0.007254600524902344, -0.006877422332763672, -0.006500244140625, -0.006123065948486328, -0.005745887756347656, -0.005368709564208984, -0.0049915313720703125, -0.004614353179931641, -0.004237174987792969, -0.003859996795654297, -0.003482818603515625, -0.003105640411376953, -0.0027284622192382812, -0.0023512840270996094, -0.0019741058349609375, -0.0015969276428222656, -0.0012197494506835938, -0.0008425712585449219, -0.00046539306640625, -8.821487426757812e-05, 0.00028896331787109375, 0.0006661415100097656, 0.0010433197021484375, 0.0014204978942871094, 0.0017976760864257812, 0.002174854278564453, 0.002552032470703125, 0.002929210662841797, 0.0033063888549804688, 0.0036835670471191406, 0.0040607452392578125, 0.004437923431396484, 0.004815101623535156, 0.005192279815673828, 0.0055694580078125, 0.005946636199951172, 0.006323814392089844, 0.006700992584228516, 0.0070781707763671875, 0.007455348968505859, 0.007832527160644531, 0.008209705352783203, 0.008586883544921875, 0.008964061737060547, 0.009341239929199219, 0.00971841812133789, 0.010095596313476562, 0.010472774505615234, 0.010849952697753906, 0.011227130889892578, 0.01160430908203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 13.0, 16.0, 22.0, 33.0, 76.0, 161.0, 208.0, 197.0, 104.0, 67.0, 21.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3700778484344482, -2.281541585922241, -2.1930055618286133, -2.1044692993164062, -2.015933036804199, -1.9273970127105713, -1.8388607501983643, -1.7503246068954468, -1.6617884635925293, -1.5732523202896118, -1.4847161769866943, -1.3961799144744873, -1.3076437711715698, -1.2191076278686523, -1.1305713653564453, -1.0420352220535278, -0.9534990787506104, -0.8649629354476929, -0.7764267325401306, -0.6878905296325684, -0.5993543863296509, -0.5108182430267334, -0.42228204011917114, -0.3337458372116089, -0.2452096939086914, -0.15667352080345154, -0.06813734769821167, 0.020398825407028198, 0.10893499851226807, 0.19747117161750793, 0.2860073447227478, 0.37454354763031006, 0.46307945251464844, 0.5516155958175659, 0.6401517987251282, 0.7286880016326904, 0.8172241449356079, 0.9057602882385254, 0.9942964911460876, 1.08283269405365, 1.1713688373565674, 1.2599049806594849, 1.3484411239624023, 1.4369773864746094, 1.5255135297775269, 1.6140496730804443, 1.7025859355926514, 1.7911220788955688, 1.8796582221984863, 1.9681943655014038, 2.0567305088043213, 2.1452667713165283, 2.2338027954101562, 2.3223390579223633, 2.4108753204345703, 2.4994115829467773, 2.5879476070404053, 2.6764838695526123, 2.7650198936462402, 2.8535561561584473, 2.9420924186706543, 3.0306284427642822, 3.1191647052764893, 3.207700729370117, 3.296236991882324]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 10.0, 6.0, 11.0, 12.0, 16.0, 28.0, 18.0, 29.0, 32.0, 32.0, 44.0, 43.0, 57.0, 61.0, 56.0, 58.0, 63.0, 45.0, 45.0, 53.0, 49.0, 43.0, 19.0, 32.0, 23.0, 21.0, 14.0, 22.0, 8.0, 7.0, 7.0, 9.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0773781538009644, -1.0444740056991577, -1.011569857597351, -0.9786656498908997, -0.945761501789093, -0.9128572940826416, -0.879953145980835, -0.8470489978790283, -0.8141448497772217, -0.781240701675415, -0.7483364939689636, -0.715432345867157, -0.6825281977653503, -0.6496239900588989, -0.6167198419570923, -0.5838156938552856, -0.5509114861488342, -0.5180073380470276, -0.48510316014289856, -0.45219898223876953, -0.4192948341369629, -0.38639065623283386, -0.35348647832870483, -0.3205823302268982, -0.28767815232276917, -0.25477397441864014, -0.2218698263168335, -0.18896564841270447, -0.15606148540973663, -0.1231573224067688, -0.09025314450263977, -0.057348981499671936, -0.0244448184967041, 0.008459348231554031, 0.041363514959812164, 0.0742676854133606, 0.10717184841632843, 0.14007601141929626, 0.1729801893234253, 0.20588435232639313, 0.23878851532936096, 0.27169269323349, 0.30459684133529663, 0.33750101923942566, 0.3704051971435547, 0.40330934524536133, 0.43621352314949036, 0.4691177010536194, 0.502021849155426, 0.5349259972572327, 0.5678302049636841, 0.6007343530654907, 0.6336385011672974, 0.666542649269104, 0.6994468569755554, 0.7323510050773621, 0.7652552127838135, 0.7981593608856201, 0.8310635685920715, 0.8639677166938782, 0.8968718647956848, 0.9297760725021362, 0.9626802206039429, 0.9955843687057495, 1.0284885168075562]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 5.0, 12.0, 17.0, 25.0, 49.0, 66.0, 125.0, 167.0, 229.0, 390.0, 628.0, 1075.0, 1792.0, 3420.0, 6792.0, 14847.0, 37620.0, 121127.0, 489600.0, 261634.0, 65030.0, 23188.0, 9951.0, 4726.0, 2459.0, 1455.0, 764.0, 481.0, 298.0, 209.0, 115.0, 76.0, 62.0, 39.0, 24.0, 20.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.525390625, -1.48272705078125, -1.4400634765625, -1.39739990234375, -1.354736328125, -1.31207275390625, -1.2694091796875, -1.22674560546875, -1.18408203125, -1.14141845703125, -1.0987548828125, -1.05609130859375, -1.013427734375, -0.97076416015625, -0.9281005859375, -0.88543701171875, -0.8427734375, -0.80010986328125, -0.7574462890625, -0.71478271484375, -0.672119140625, -0.62945556640625, -0.5867919921875, -0.54412841796875, -0.50146484375, -0.45880126953125, -0.4161376953125, -0.37347412109375, -0.330810546875, -0.28814697265625, -0.2454833984375, -0.20281982421875, -0.16015625, -0.11749267578125, -0.0748291015625, -0.03216552734375, 0.010498046875, 0.05316162109375, 0.0958251953125, 0.13848876953125, 0.18115234375, 0.22381591796875, 0.2664794921875, 0.30914306640625, 0.351806640625, 0.39447021484375, 0.4371337890625, 0.47979736328125, 0.5224609375, 0.56512451171875, 0.6077880859375, 0.65045166015625, 0.693115234375, 0.73577880859375, 0.7784423828125, 0.82110595703125, 0.86376953125, 0.90643310546875, 0.9490966796875, 0.99176025390625, 1.034423828125, 1.07708740234375, 1.1197509765625, 1.16241455078125, 1.205078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 16.0, 12.0, 20.0, 20.0, 27.0, 43.0, 42.0, 58.0, 62.0, 72.0, 66.0, 65.0, 81.0, 61.0, 74.0, 57.0, 38.0, 40.0, 27.0, 19.0, 14.0, 18.0, 14.0, 10.0, 4.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.840545654296875, -2.75335693359375, -2.666168212890625, -2.5789794921875, -2.491790771484375, -2.40460205078125, -2.317413330078125, -2.230224609375, -2.143035888671875, -2.05584716796875, -1.968658447265625, -1.8814697265625, -1.794281005859375, -1.70709228515625, -1.619903564453125, -1.53271484375, -1.445526123046875, -1.35833740234375, -1.271148681640625, -1.1839599609375, -1.096771240234375, -1.00958251953125, -0.922393798828125, -0.835205078125, -0.748016357421875, -0.66082763671875, -0.573638916015625, -0.4864501953125, -0.399261474609375, -0.31207275390625, -0.224884033203125, -0.1376953125, -0.050506591796875, 0.03668212890625, 0.123870849609375, 0.2110595703125, 0.298248291015625, 0.38543701171875, 0.472625732421875, 0.559814453125, 0.647003173828125, 0.73419189453125, 0.821380615234375, 0.9085693359375, 0.995758056640625, 1.08294677734375, 1.170135498046875, 1.25732421875, 1.344512939453125, 1.43170166015625, 1.518890380859375, 1.6060791015625, 1.693267822265625, 1.78045654296875, 1.867645263671875, 1.954833984375, 2.042022705078125, 2.12921142578125, 2.216400146484375, 2.3035888671875, 2.390777587890625, 2.47796630859375, 2.565155029296875, 2.65234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 5.0, 5.0, 14.0, 12.0, 9.0, 21.0, 22.0, 22.0, 23.0, 39.0, 25.0, 44.0, 44.0, 74.0, 93.0, 311.0, 1883.0, 51684.0, 979498.0, 13177.0, 924.0, 188.0, 94.0, 72.0, 30.0, 33.0, 27.0, 22.0, 21.0, 16.0, 21.0, 13.0, 18.0, 12.0, 8.0, 4.0, 10.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.703125, -6.495849609375, -6.28857421875, -6.081298828125, -5.8740234375, -5.666748046875, -5.45947265625, -5.252197265625, -5.044921875, -4.837646484375, -4.63037109375, -4.423095703125, -4.2158203125, -4.008544921875, -3.80126953125, -3.593994140625, -3.38671875, -3.179443359375, -2.97216796875, -2.764892578125, -2.5576171875, -2.350341796875, -2.14306640625, -1.935791015625, -1.728515625, -1.521240234375, -1.31396484375, -1.106689453125, -0.8994140625, -0.692138671875, -0.48486328125, -0.277587890625, -0.0703125, 0.136962890625, 0.34423828125, 0.551513671875, 0.7587890625, 0.966064453125, 1.17333984375, 1.380615234375, 1.587890625, 1.795166015625, 2.00244140625, 2.209716796875, 2.4169921875, 2.624267578125, 2.83154296875, 3.038818359375, 3.24609375, 3.453369140625, 3.66064453125, 3.867919921875, 4.0751953125, 4.282470703125, 4.48974609375, 4.697021484375, 4.904296875, 5.111572265625, 5.31884765625, 5.526123046875, 5.7333984375, 5.940673828125, 6.14794921875, 6.355224609375, 6.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 15.0, 11.0, 13.0, 14.0, 27.0, 27.0, 29.0, 33.0, 36.0, 38.0, 30.0, 44.0, 39.0, 51.0, 46.0, 52.0, 42.0, 46.0, 44.0, 42.0, 45.0, 31.0, 28.0, 32.0, 19.0, 25.0, 23.0, 16.0, 19.0, 15.0, 9.0, 10.0, 6.0, 9.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9159088134765625, -1.844512939453125, -1.7731170654296875, -1.70172119140625, -1.6303253173828125, -1.558929443359375, -1.4875335693359375, -1.4161376953125, -1.3447418212890625, -1.273345947265625, -1.2019500732421875, -1.13055419921875, -1.0591583251953125, -0.987762451171875, -0.9163665771484375, -0.844970703125, -0.7735748291015625, -0.702178955078125, -0.6307830810546875, -0.55938720703125, -0.4879913330078125, -0.416595458984375, -0.3451995849609375, -0.2738037109375, -0.2024078369140625, -0.131011962890625, -0.0596160888671875, 0.01177978515625, 0.0831756591796875, 0.154571533203125, 0.2259674072265625, 0.29736328125, 0.3687591552734375, 0.440155029296875, 0.5115509033203125, 0.58294677734375, 0.6543426513671875, 0.725738525390625, 0.7971343994140625, 0.8685302734375, 0.9399261474609375, 1.011322021484375, 1.0827178955078125, 1.15411376953125, 1.2255096435546875, 1.296905517578125, 1.3683013916015625, 1.439697265625, 1.5110931396484375, 1.582489013671875, 1.6538848876953125, 1.72528076171875, 1.7966766357421875, 1.868072509765625, 1.9394683837890625, 2.0108642578125, 2.0822601318359375, 2.153656005859375, 2.2250518798828125, 2.29644775390625, 2.3678436279296875, 2.439239501953125, 2.5106353759765625, 2.58203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 12.0, 6.0, 13.0, 15.0, 17.0, 19.0, 42.0, 42.0, 68.0, 93.0, 188.0, 279.0, 425.0, 901.0, 1808.0, 4125.0, 11360.0, 41583.0, 231141.0, 605608.0, 112937.0, 24311.0, 7634.0, 2841.0, 1334.0, 692.0, 386.0, 215.0, 129.0, 90.0, 68.0, 44.0, 26.0, 28.0, 14.0, 12.0, 10.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5128631591796875, -0.495941162109375, -0.4790191650390625, -0.46209716796875, -0.4451751708984375, -0.428253173828125, -0.4113311767578125, -0.3944091796875, -0.3774871826171875, -0.360565185546875, -0.3436431884765625, -0.32672119140625, -0.3097991943359375, -0.292877197265625, -0.2759552001953125, -0.259033203125, -0.2421112060546875, -0.225189208984375, -0.2082672119140625, -0.19134521484375, -0.1744232177734375, -0.157501220703125, -0.1405792236328125, -0.1236572265625, -0.1067352294921875, -0.089813232421875, -0.0728912353515625, -0.05596923828125, -0.0390472412109375, -0.022125244140625, -0.0052032470703125, 0.01171875, 0.0286407470703125, 0.045562744140625, 0.0624847412109375, 0.07940673828125, 0.0963287353515625, 0.113250732421875, 0.1301727294921875, 0.1470947265625, 0.1640167236328125, 0.180938720703125, 0.1978607177734375, 0.21478271484375, 0.2317047119140625, 0.248626708984375, 0.2655487060546875, 0.282470703125, 0.2993927001953125, 0.316314697265625, 0.3332366943359375, 0.35015869140625, 0.3670806884765625, 0.384002685546875, 0.4009246826171875, 0.4178466796875, 0.4347686767578125, 0.451690673828125, 0.4686126708984375, 0.48553466796875, 0.5024566650390625, 0.519378662109375, 0.5363006591796875, 0.55322265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 10.0, 7.0, 15.0, 16.0, 23.0, 19.0, 23.0, 31.0, 36.0, 70.0, 80.0, 95.0, 114.0, 86.0, 78.0, 54.0, 51.0, 39.0, 33.0, 23.0, 13.0, 19.0, 11.0, 10.0, 6.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375810623168945e-05, -9.087100625038147e-05, -8.798390626907349e-05, -8.50968062877655e-05, -8.220970630645752e-05, -7.932260632514954e-05, -7.643550634384155e-05, -7.354840636253357e-05, -7.066130638122559e-05, -6.77742063999176e-05, -6.488710641860962e-05, -6.200000643730164e-05, -5.911290645599365e-05, -5.622580647468567e-05, -5.3338706493377686e-05, -5.04516065120697e-05, -4.756450653076172e-05, -4.4677406549453735e-05, -4.179030656814575e-05, -3.890320658683777e-05, -3.6016106605529785e-05, -3.31290066242218e-05, -3.024190664291382e-05, -2.7354806661605835e-05, -2.446770668029785e-05, -2.1580606698989868e-05, -1.8693506717681885e-05, -1.58064067363739e-05, -1.2919306755065918e-05, -1.0032206773757935e-05, -7.145106792449951e-06, -4.258006811141968e-06, -1.3709068298339844e-06, 1.516193151473999e-06, 4.403293132781982e-06, 7.290393114089966e-06, 1.017749309539795e-05, 1.3064593076705933e-05, 1.5951693058013916e-05, 1.88387930393219e-05, 2.1725893020629883e-05, 2.4612993001937866e-05, 2.750009298324585e-05, 3.0387192964553833e-05, 3.3274292945861816e-05, 3.61613929271698e-05, 3.904849290847778e-05, 4.1935592889785767e-05, 4.482269287109375e-05, 4.7709792852401733e-05, 5.059689283370972e-05, 5.34839928150177e-05, 5.6371092796325684e-05, 5.925819277763367e-05, 6.214529275894165e-05, 6.503239274024963e-05, 6.791949272155762e-05, 7.08065927028656e-05, 7.369369268417358e-05, 7.658079266548157e-05, 7.946789264678955e-05, 8.235499262809753e-05, 8.524209260940552e-05, 8.81291925907135e-05, 9.101629257202148e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 13.0, 11.0, 10.0, 14.0, 30.0, 40.0, 39.0, 61.0, 102.0, 146.0, 279.0, 391.0, 650.0, 1261.0, 2191.0, 4395.0, 9379.0, 23871.0, 77056.0, 341617.0, 438687.0, 97748.0, 28697.0, 11291.0, 4881.0, 2427.0, 1320.0, 709.0, 405.0, 260.0, 181.0, 120.0, 75.0, 58.0, 49.0, 28.0, 20.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3670654296875, -0.353515625, -0.3399658203125, -0.326416015625, -0.3128662109375, -0.29931640625, -0.2857666015625, -0.272216796875, -0.2586669921875, -0.2451171875, -0.2315673828125, -0.218017578125, -0.2044677734375, -0.19091796875, -0.1773681640625, -0.163818359375, -0.1502685546875, -0.13671875, -0.1231689453125, -0.109619140625, -0.0960693359375, -0.08251953125, -0.0689697265625, -0.055419921875, -0.0418701171875, -0.0283203125, -0.0147705078125, -0.001220703125, 0.0123291015625, 0.02587890625, 0.0394287109375, 0.052978515625, 0.0665283203125, 0.080078125, 0.0936279296875, 0.107177734375, 0.1207275390625, 0.13427734375, 0.1478271484375, 0.161376953125, 0.1749267578125, 0.1884765625, 0.2020263671875, 0.215576171875, 0.2291259765625, 0.24267578125, 0.2562255859375, 0.269775390625, 0.2833251953125, 0.296875, 0.3104248046875, 0.323974609375, 0.3375244140625, 0.35107421875, 0.3646240234375, 0.378173828125, 0.3917236328125, 0.4052734375, 0.4188232421875, 0.432373046875, 0.4459228515625, 0.45947265625, 0.4730224609375, 0.486572265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 11.0, 5.0, 13.0, 11.0, 15.0, 12.0, 19.0, 35.0, 26.0, 46.0, 42.0, 57.0, 63.0, 89.0, 88.0, 73.0, 77.0, 61.0, 60.0, 42.0, 27.0, 37.0, 14.0, 13.0, 17.0, 8.0, 7.0, 10.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21265602111816406, -0.20595169067382812, -0.1992473602294922, -0.19254302978515625, -0.1858386993408203, -0.17913436889648438, -0.17243003845214844, -0.1657257080078125, -0.15902137756347656, -0.15231704711914062, -0.1456127166748047, -0.13890838623046875, -0.1322040557861328, -0.12549972534179688, -0.11879539489746094, -0.112091064453125, -0.10538673400878906, -0.09868240356445312, -0.09197807312011719, -0.08527374267578125, -0.07856941223144531, -0.07186508178710938, -0.06516075134277344, -0.0584564208984375, -0.05175209045410156, -0.045047760009765625, -0.03834342956542969, -0.03163909912109375, -0.024934768676757812, -0.018230438232421875, -0.011526107788085938, -0.00482177734375, 0.0018825531005859375, 0.008586883544921875, 0.015291213989257812, 0.02199554443359375, 0.028699874877929688, 0.035404205322265625, 0.04210853576660156, 0.0488128662109375, 0.05551719665527344, 0.062221527099609375, 0.06892585754394531, 0.07563018798828125, 0.08233451843261719, 0.08903884887695312, 0.09574317932128906, 0.102447509765625, 0.10915184020996094, 0.11585617065429688, 0.12256050109863281, 0.12926483154296875, 0.1359691619873047, 0.14267349243164062, 0.14937782287597656, 0.1560821533203125, 0.16278648376464844, 0.16949081420898438, 0.1761951446533203, 0.18289947509765625, 0.1896038055419922, 0.19630813598632812, 0.20301246643066406, 0.209716796875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 19.0, 29.0, 120.0, 272.0, 344.0, 122.0, 38.0, 21.0, 17.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.135523319244385, -4.795766353607178, -4.4560089111328125, -4.1162519454956055, -3.7764949798583984, -3.4367377758026123, -3.096980571746826, -2.757223606109619, -2.417466402053833, -2.077709197998047, -1.7379522323608398, -1.3981950283050537, -1.0584379434585571, -0.7186808586120605, -0.3789236545562744, -0.03916668891906738, 0.30059051513671875, 0.6403475999832153, 0.9801047444343567, 1.319861888885498, 1.6596189737319946, 1.9993760585784912, 2.3391332626342773, 2.6788902282714844, 3.0186474323272705, 3.3584046363830566, 3.6981616020202637, 4.037919044494629, 4.377676010131836, 4.717432975769043, 5.05718994140625, 5.396946907043457, 5.7367048263549805, 6.0764617919921875, 6.416219234466553, 6.75597620010376, 7.095733165740967, 7.435490608215332, 7.775247573852539, 8.115004539489746, 8.454761505126953, 8.79451847076416, 9.134275436401367, 9.47403335571289, 9.813790321350098, 10.153547286987305, 10.493304252624512, 10.833061218261719, 11.172819137573242, 11.51257610321045, 11.852333068847656, 12.19209098815918, 12.531847953796387, 12.871604919433594, 13.2113618850708, 13.551118850708008, 13.890875816345215, 14.230632781982422, 14.570389747619629, 14.910146713256836, 15.24990463256836, 15.589661598205566, 15.929418563842773, 16.269176483154297, 16.608932495117188]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 9.0, 12.0, 10.0, 20.0, 14.0, 20.0, 19.0, 27.0, 32.0, 25.0, 27.0, 40.0, 51.0, 50.0, 45.0, 38.0, 41.0, 50.0, 51.0, 36.0, 39.0, 30.0, 30.0, 35.0, 37.0, 32.0, 23.0, 27.0, 19.0, 23.0, 13.0, 10.0, 13.0, 5.0, 10.0, 4.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.8744328022003174, -3.752547264099121, -3.630661964416504, -3.5087764263153076, -3.3868908882141113, -3.265005588531494, -3.143120050430298, -3.0212345123291016, -2.8993492126464844, -2.777463674545288, -2.655578374862671, -2.5336928367614746, -2.4118072986602783, -2.289921760559082, -2.168036460876465, -2.0461509227752686, -1.9242653846740723, -1.8023799657821655, -1.6804944276809692, -1.5586090087890625, -1.4367234706878662, -1.3148380517959595, -1.1929526329040527, -1.0710670948028564, -0.9491816759109497, -0.8272961974143982, -0.7054107189178467, -0.5835253000259399, -0.4616398215293884, -0.3397543430328369, -0.21786892414093018, -0.09598344564437866, 0.02590203285217285, 0.14778749644756317, 0.2696729600429535, 0.3915584087371826, 0.5134438872337341, 0.6353293657302856, 0.7572147846221924, 0.8791002631187439, 1.0009857416152954, 1.1228711605072021, 1.2447566986083984, 1.3666421175003052, 1.488527536392212, 1.6104130744934082, 1.732298493385315, 1.8541839122772217, 1.976069450378418, 2.0979549884796143, 2.2198402881622314, 2.3417258262634277, 2.463611364364624, 2.5854969024658203, 2.7073822021484375, 2.829267740249634, 2.95115327835083, 3.0730388164520264, 3.1949241161346436, 3.31680965423584, 3.438695192337036, 3.5605807304382324, 3.6824660301208496, 3.804351568222046, 3.926236867904663]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 15.0, 12.0, 22.0, 32.0, 34.0, 65.0, 75.0, 154.0, 208.0, 367.0, 685.0, 1336.0, 2770.0, 7011.0, 21827.0, 102292.0, 1752568.0, 2156839.0, 110894.0, 23587.0, 7548.0, 2921.0, 1367.0, 711.0, 359.0, 202.0, 128.0, 83.0, 68.0, 30.0, 18.0, 16.0, 9.0, 6.0, 12.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.91015625, -1.84197998046875, -1.7738037109375, -1.70562744140625, -1.637451171875, -1.56927490234375, -1.5010986328125, -1.43292236328125, -1.36474609375, -1.29656982421875, -1.2283935546875, -1.16021728515625, -1.092041015625, -1.02386474609375, -0.9556884765625, -0.88751220703125, -0.8193359375, -0.75115966796875, -0.6829833984375, -0.61480712890625, -0.546630859375, -0.47845458984375, -0.4102783203125, -0.34210205078125, -0.27392578125, -0.20574951171875, -0.1375732421875, -0.06939697265625, -0.001220703125, 0.06695556640625, 0.1351318359375, 0.20330810546875, 0.271484375, 0.33966064453125, 0.4078369140625, 0.47601318359375, 0.544189453125, 0.61236572265625, 0.6805419921875, 0.74871826171875, 0.81689453125, 0.88507080078125, 0.9532470703125, 1.02142333984375, 1.089599609375, 1.15777587890625, 1.2259521484375, 1.29412841796875, 1.3623046875, 1.43048095703125, 1.4986572265625, 1.56683349609375, 1.635009765625, 1.70318603515625, 1.7713623046875, 1.83953857421875, 1.90771484375, 1.97589111328125, 2.0440673828125, 2.11224365234375, 2.180419921875, 2.24859619140625, 2.3167724609375, 2.38494873046875, 2.453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 11.0, 21.0, 22.0, 33.0, 45.0, 40.0, 58.0, 53.0, 60.0, 63.0, 66.0, 55.0, 66.0, 56.0, 54.0, 52.0, 40.0, 32.0, 29.0, 15.0, 22.0, 15.0, 10.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6416015625, -1.5928955078125, -1.544189453125, -1.4954833984375, -1.44677734375, -1.3980712890625, -1.349365234375, -1.3006591796875, -1.251953125, -1.2032470703125, -1.154541015625, -1.1058349609375, -1.05712890625, -1.0084228515625, -0.959716796875, -0.9110107421875, -0.8623046875, -0.8135986328125, -0.764892578125, -0.7161865234375, -0.66748046875, -0.6187744140625, -0.570068359375, -0.5213623046875, -0.47265625, -0.4239501953125, -0.375244140625, -0.3265380859375, -0.27783203125, -0.2291259765625, -0.180419921875, -0.1317138671875, -0.0830078125, -0.0343017578125, 0.014404296875, 0.0631103515625, 0.11181640625, 0.1605224609375, 0.209228515625, 0.2579345703125, 0.306640625, 0.3553466796875, 0.404052734375, 0.4527587890625, 0.50146484375, 0.5501708984375, 0.598876953125, 0.6475830078125, 0.6962890625, 0.7449951171875, 0.793701171875, 0.8424072265625, 0.89111328125, 0.9398193359375, 0.988525390625, 1.0372314453125, 1.0859375, 1.1346435546875, 1.183349609375, 1.2320556640625, 1.28076171875, 1.3294677734375, 1.378173828125, 1.4268798828125, 1.4755859375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 11.0, 14.0, 34.0, 51.0, 117.0, 247.0, 1038.0, 20761.0, 4145054.0, 25223.0, 1211.0, 271.0, 109.0, 57.0, 30.0, 13.0, 9.0, 5.0, 2.0, 2.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.03759765625, -8.7314453125, -8.42529296875, -8.119140625, -7.81298828125, -7.5068359375, -7.20068359375, -6.89453125, -6.58837890625, -6.2822265625, -5.97607421875, -5.669921875, -5.36376953125, -5.0576171875, -4.75146484375, -4.4453125, -4.13916015625, -3.8330078125, -3.52685546875, -3.220703125, -2.91455078125, -2.6083984375, -2.30224609375, -1.99609375, -1.68994140625, -1.3837890625, -1.07763671875, -0.771484375, -0.46533203125, -0.1591796875, 0.14697265625, 0.453125, 0.75927734375, 1.0654296875, 1.37158203125, 1.677734375, 1.98388671875, 2.2900390625, 2.59619140625, 2.90234375, 3.20849609375, 3.5146484375, 3.82080078125, 4.126953125, 4.43310546875, 4.7392578125, 5.04541015625, 5.3515625, 5.65771484375, 5.9638671875, 6.27001953125, 6.576171875, 6.88232421875, 7.1884765625, 7.49462890625, 7.80078125, 8.10693359375, 8.4130859375, 8.71923828125, 9.025390625, 9.33154296875, 9.6376953125, 9.94384765625, 10.25]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 6.0, 7.0, 5.0, 12.0, 13.0, 15.0, 22.0, 25.0, 34.0, 55.0, 62.0, 68.0, 125.0, 213.0, 368.0, 817.0, 982.0, 448.0, 233.0, 140.0, 101.0, 77.0, 53.0, 47.0, 28.0, 26.0, 25.0, 15.0, 8.0, 10.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.525390625, -0.5090408325195312, -0.4926910400390625, -0.47634124755859375, -0.459991455078125, -0.44364166259765625, -0.4272918701171875, -0.41094207763671875, -0.39459228515625, -0.37824249267578125, -0.3618927001953125, -0.34554290771484375, -0.329193115234375, -0.31284332275390625, -0.2964935302734375, -0.28014373779296875, -0.2637939453125, -0.24744415283203125, -0.2310943603515625, -0.21474456787109375, -0.198394775390625, -0.18204498291015625, -0.1656951904296875, -0.14934539794921875, -0.13299560546875, -0.11664581298828125, -0.1002960205078125, -0.08394622802734375, -0.067596435546875, -0.05124664306640625, -0.0348968505859375, -0.01854705810546875, -0.002197265625, 0.01415252685546875, 0.0305023193359375, 0.04685211181640625, 0.063201904296875, 0.07955169677734375, 0.0959014892578125, 0.11225128173828125, 0.12860107421875, 0.14495086669921875, 0.1613006591796875, 0.17765045166015625, 0.194000244140625, 0.21035003662109375, 0.2266998291015625, 0.24304962158203125, 0.2593994140625, 0.27574920654296875, 0.2920989990234375, 0.30844879150390625, 0.324798583984375, 0.34114837646484375, 0.3574981689453125, 0.37384796142578125, 0.39019775390625, 0.40654754638671875, 0.4228973388671875, 0.43924713134765625, 0.455596923828125, 0.47194671630859375, 0.4882965087890625, 0.5046463012695312, 0.52099609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 12.0, 13.0, 27.0, 47.0, 81.0, 168.0, 191.0, 166.0, 119.0, 64.0, 37.0, 21.0, 13.0, 5.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.697857856750488, -4.566412448883057, -4.434967041015625, -4.303522109985352, -4.17207670211792, -4.040631294250488, -3.9091858863830566, -3.777740478515625, -3.6462950706481934, -3.5148496627807617, -3.383404493331909, -3.2519590854644775, -3.120513677597046, -2.9890685081481934, -2.8576231002807617, -2.72617769241333, -2.5947325229644775, -2.463287115097046, -2.3318419456481934, -2.2003965377807617, -2.06895112991333, -1.937505841255188, -1.806060552597046, -1.6746151447296143, -1.5431698560714722, -1.41172456741333, -1.2802791595458984, -1.1488338708877563, -1.0173885822296143, -0.8859431743621826, -0.7544978857040405, -0.6230525374412537, -0.4916071891784668, -0.36016184091567993, -0.22871652245521545, -0.09727120399475098, 0.03417414426803589, 0.16561949253082275, 0.29706478118896484, 0.4285101294517517, 0.5599554777145386, 0.6914008259773254, 0.8228461742401123, 0.9542914628982544, 1.0857367515563965, 1.2171821594238281, 1.3486274480819702, 1.4800727367401123, 1.611518144607544, 1.742963433265686, 1.8744088411331177, 2.0058541297912598, 2.1372995376586914, 2.268744945526123, 2.4001901149749756, 2.5316355228424072, 2.6630806922912598, 2.7945261001586914, 2.925971269607544, 3.0574166774749756, 3.1888620853424072, 3.3203072547912598, 3.4517526626586914, 3.583198070526123, 3.7146434783935547]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 8.0, 12.0, 10.0, 11.0, 13.0, 20.0, 14.0, 24.0, 31.0, 38.0, 50.0, 51.0, 57.0, 63.0, 52.0, 69.0, 56.0, 48.0, 60.0, 46.0, 51.0, 34.0, 35.0, 29.0, 31.0, 16.0, 17.0, 12.0, 9.0, 8.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5557526350021362, -1.5006544589996338, -1.4455562829971313, -1.390458106994629, -1.3353599309921265, -1.280261754989624, -1.225163459777832, -1.1700654029846191, -1.1149671077728271, -1.0598689317703247, -1.0047707557678223, -0.9496725797653198, -0.8945744037628174, -0.8394762277603149, -0.7843779921531677, -0.7292798161506653, -0.6741816997528076, -0.6190835237503052, -0.5639853477478027, -0.5088871717453003, -0.45378896594047546, -0.398690789937973, -0.3435925841331482, -0.28849440813064575, -0.2333962321281433, -0.17829805612564087, -0.12319986522197723, -0.0681016743183136, -0.013003498315811157, 0.042094677686691284, 0.09719288349151611, 0.15229105949401855, 0.207389235496521, 0.26248741149902344, 0.3175855875015259, 0.3726837933063507, 0.42778196930885315, 0.4828801453113556, 0.5379783511161804, 0.5930765271186829, 0.6481747031211853, 0.7032728791236877, 0.7583710551261902, 0.8134692907333374, 0.8685674667358398, 0.9236656427383423, 0.9787638187408447, 1.0338619947433472, 1.0889601707458496, 1.144058346748352, 1.1991565227508545, 1.254254698753357, 1.3093528747558594, 1.3644510507583618, 1.4195492267608643, 1.4746475219726562, 1.5297455787658691, 1.5848437547683716, 1.639941930770874, 1.6950401067733765, 1.750138282775879, 1.8052364587783813, 1.8603346347808838, 1.9154329299926758, 1.9705311059951782]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 13.0, 6.0, 19.0, 17.0, 36.0, 51.0, 64.0, 103.0, 148.0, 253.0, 476.0, 924.0, 2024.0, 5350.0, 17526.0, 85339.0, 616640.0, 265823.0, 37735.0, 9576.0, 3405.0, 1433.0, 690.0, 363.0, 189.0, 109.0, 62.0, 44.0, 33.0, 24.0, 18.0, 25.0, 10.0, 3.0, 4.0, 2.0, 6.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1854248046875, -0.1797657012939453, -0.17410659790039062, -0.16844749450683594, -0.16278839111328125, -0.15712928771972656, -0.15147018432617188, -0.1458110809326172, -0.1401519775390625, -0.1344928741455078, -0.12883377075195312, -0.12317466735839844, -0.11751556396484375, -0.11185646057128906, -0.10619735717773438, -0.10053825378417969, -0.094879150390625, -0.08922004699707031, -0.08356094360351562, -0.07790184020996094, -0.07224273681640625, -0.06658363342285156, -0.060924530029296875, -0.05526542663574219, -0.0496063232421875, -0.04394721984863281, -0.038288116455078125, -0.03262901306152344, -0.02696990966796875, -0.021310806274414062, -0.015651702880859375, -0.009992599487304688, -0.00433349609375, 0.0013256072998046875, 0.006984710693359375, 0.012643814086914062, 0.01830291748046875, 0.023962020874023438, 0.029621124267578125, 0.03528022766113281, 0.0409393310546875, 0.04659843444824219, 0.052257537841796875, 0.05791664123535156, 0.06357574462890625, 0.06923484802246094, 0.07489395141601562, 0.08055305480957031, 0.086212158203125, 0.09187126159667969, 0.09753036499023438, 0.10318946838378906, 0.10884857177734375, 0.11450767517089844, 0.12016677856445312, 0.1258258819580078, 0.1314849853515625, 0.1371440887451172, 0.14280319213867188, 0.14846229553222656, 0.15412139892578125, 0.15978050231933594, 0.16543960571289062, 0.1710987091064453, 0.1767578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 8.0, 12.0, 14.0, 22.0, 29.0, 49.0, 62.0, 50.0, 72.0, 68.0, 75.0, 68.0, 68.0, 70.0, 59.0, 53.0, 31.0, 41.0, 23.0, 20.0, 17.0, 11.0, 15.0, 9.0, 3.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.336395263671875, -1.29193115234375, -1.247467041015625, -1.2030029296875, -1.158538818359375, -1.11407470703125, -1.069610595703125, -1.025146484375, -0.980682373046875, -0.93621826171875, -0.891754150390625, -0.8472900390625, -0.802825927734375, -0.75836181640625, -0.713897705078125, -0.66943359375, -0.624969482421875, -0.58050537109375, -0.536041259765625, -0.4915771484375, -0.447113037109375, -0.40264892578125, -0.358184814453125, -0.313720703125, -0.269256591796875, -0.22479248046875, -0.180328369140625, -0.1358642578125, -0.091400146484375, -0.04693603515625, -0.002471923828125, 0.0419921875, 0.086456298828125, 0.13092041015625, 0.175384521484375, 0.2198486328125, 0.264312744140625, 0.30877685546875, 0.353240966796875, 0.397705078125, 0.442169189453125, 0.48663330078125, 0.531097412109375, 0.5755615234375, 0.620025634765625, 0.66448974609375, 0.708953857421875, 0.75341796875, 0.797882080078125, 0.84234619140625, 0.886810302734375, 0.9312744140625, 0.975738525390625, 1.02020263671875, 1.064666748046875, 1.109130859375, 1.153594970703125, 1.19805908203125, 1.242523193359375, 1.2869873046875, 1.331451416015625, 1.37591552734375, 1.420379638671875, 1.46484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 10.0, 14.0, 14.0, 18.0, 32.0, 33.0, 47.0, 50.0, 80.0, 99.0, 158.0, 202.0, 304.0, 567.0, 1477.0, 9798.0, 138877.0, 789412.0, 96860.0, 7628.0, 1386.0, 462.0, 293.0, 167.0, 150.0, 117.0, 68.0, 59.0, 43.0, 30.0, 18.0, 20.0, 12.0, 8.0, 7.0, 14.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2099609375, -0.20403671264648438, -0.19811248779296875, -0.19218826293945312, -0.1862640380859375, -0.18033981323242188, -0.17441558837890625, -0.16849136352539062, -0.162567138671875, -0.15664291381835938, -0.15071868896484375, -0.14479446411132812, -0.1388702392578125, -0.13294601440429688, -0.12702178955078125, -0.12109756469726562, -0.11517333984375, -0.10924911499023438, -0.10332489013671875, -0.09740066528320312, -0.0914764404296875, -0.08555221557617188, -0.07962799072265625, -0.07370376586914062, -0.067779541015625, -0.061855316162109375, -0.05593109130859375, -0.050006866455078125, -0.0440826416015625, -0.038158416748046875, -0.03223419189453125, -0.026309967041015625, -0.0203857421875, -0.014461517333984375, -0.00853729248046875, -0.002613067626953125, 0.0033111572265625, 0.009235382080078125, 0.01515960693359375, 0.021083831787109375, 0.027008056640625, 0.032932281494140625, 0.03885650634765625, 0.044780731201171875, 0.0507049560546875, 0.056629180908203125, 0.06255340576171875, 0.06847763061523438, 0.07440185546875, 0.08032608032226562, 0.08625030517578125, 0.09217453002929688, 0.0980987548828125, 0.10402297973632812, 0.10994720458984375, 0.11587142944335938, 0.121795654296875, 0.12771987915039062, 0.13364410400390625, 0.13956832885742188, 0.1454925537109375, 0.15141677856445312, 0.15734100341796875, 0.16326522827148438, 0.169189453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 6.0, 6.0, 10.0, 12.0, 12.0, 24.0, 18.0, 25.0, 25.0, 39.0, 40.0, 53.0, 38.0, 50.0, 56.0, 42.0, 56.0, 64.0, 54.0, 44.0, 51.0, 33.0, 35.0, 34.0, 23.0, 33.0, 22.0, 20.0, 14.0, 7.0, 15.0, 7.0, 6.0, 3.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.2265625, -2.164337158203125, -2.10211181640625, -2.039886474609375, -1.9776611328125, -1.915435791015625, -1.85321044921875, -1.790985107421875, -1.728759765625, -1.666534423828125, -1.60430908203125, -1.542083740234375, -1.4798583984375, -1.417633056640625, -1.35540771484375, -1.293182373046875, -1.23095703125, -1.168731689453125, -1.10650634765625, -1.044281005859375, -0.9820556640625, -0.919830322265625, -0.85760498046875, -0.795379638671875, -0.733154296875, -0.670928955078125, -0.60870361328125, -0.546478271484375, -0.4842529296875, -0.422027587890625, -0.35980224609375, -0.297576904296875, -0.2353515625, -0.173126220703125, -0.11090087890625, -0.048675537109375, 0.0135498046875, 0.075775146484375, 0.13800048828125, 0.200225830078125, 0.262451171875, 0.324676513671875, 0.38690185546875, 0.449127197265625, 0.5113525390625, 0.573577880859375, 0.63580322265625, 0.698028564453125, 0.76025390625, 0.822479248046875, 0.88470458984375, 0.946929931640625, 1.0091552734375, 1.071380615234375, 1.13360595703125, 1.195831298828125, 1.258056640625, 1.320281982421875, 1.38250732421875, 1.444732666015625, 1.5069580078125, 1.569183349609375, 1.63140869140625, 1.693634033203125, 1.755859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 7.0, 9.0, 16.0, 17.0, 20.0, 32.0, 28.0, 51.0, 39.0, 92.0, 134.0, 248.0, 776.0, 5497.0, 973658.0, 64704.0, 2154.0, 438.0, 206.0, 104.0, 85.0, 63.0, 44.0, 34.0, 28.0, 17.0, 18.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12042236328125, -0.11715030670166016, -0.11387825012207031, -0.11060619354248047, -0.10733413696289062, -0.10406208038330078, -0.10079002380371094, -0.0975179672241211, -0.09424591064453125, -0.0909738540649414, -0.08770179748535156, -0.08442974090576172, -0.08115768432617188, -0.07788562774658203, -0.07461357116699219, -0.07134151458740234, -0.0680694580078125, -0.06479740142822266, -0.06152534484863281, -0.05825328826904297, -0.054981231689453125, -0.05170917510986328, -0.04843711853027344, -0.045165061950683594, -0.04189300537109375, -0.038620948791503906, -0.03534889221191406, -0.03207683563232422, -0.028804779052734375, -0.02553272247314453, -0.022260665893554688, -0.018988609313964844, -0.015716552734375, -0.012444496154785156, -0.009172439575195312, -0.005900382995605469, -0.002628326416015625, 0.0006437301635742188, 0.0039157867431640625, 0.007187843322753906, 0.01045989990234375, 0.013731956481933594, 0.017004013061523438, 0.02027606964111328, 0.023548126220703125, 0.02682018280029297, 0.030092239379882812, 0.033364295959472656, 0.0366363525390625, 0.039908409118652344, 0.04318046569824219, 0.04645252227783203, 0.049724578857421875, 0.05299663543701172, 0.05626869201660156, 0.059540748596191406, 0.06281280517578125, 0.0660848617553711, 0.06935691833496094, 0.07262897491455078, 0.07590103149414062, 0.07917308807373047, 0.08244514465332031, 0.08571720123291016, 0.0889892578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 13.0, 35.0, 77.0, 203.0, 344.0, 194.0, 75.0, 30.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -2.908799797296524e-05, -2.6943162083625793e-05, -2.4798326194286346e-05, -2.26534903049469e-05, -2.0508654415607452e-05, -1.8363818526268005e-05, -1.621898263692856e-05, -1.4074146747589111e-05, -1.1929310858249664e-05, -9.784474968910217e-06, -7.63963907957077e-06, -5.494803190231323e-06, -3.3499673008918762e-06, -1.2051314115524292e-06, 9.397044777870178e-07, 3.084540367126465e-06, 5.229376256465912e-06, 7.374212145805359e-06, 9.519048035144806e-06, 1.1663883924484253e-05, 1.38087198138237e-05, 1.5953555703163147e-05, 1.8098391592502594e-05, 2.024322748184204e-05, 2.2388063371181488e-05, 2.4532899260520935e-05, 2.6677735149860382e-05, 2.882257103919983e-05, 3.0967406928539276e-05, 3.311224281787872e-05, 3.525707870721817e-05, 3.740191459655762e-05, 3.9546750485897064e-05, 4.169158637523651e-05, 4.383642226457596e-05, 4.5981258153915405e-05, 4.812609404325485e-05, 5.02709299325943e-05, 5.2415765821933746e-05, 5.456060171127319e-05, 5.670543760061264e-05, 5.885027348995209e-05, 6.0995109379291534e-05, 6.313994526863098e-05, 6.528478115797043e-05, 6.742961704730988e-05, 6.957445293664932e-05, 7.171928882598877e-05, 7.386412471532822e-05, 7.600896060466766e-05, 7.815379649400711e-05, 8.029863238334656e-05, 8.2443468272686e-05, 8.458830416202545e-05, 8.67331400513649e-05, 8.887797594070435e-05, 9.102281183004379e-05, 9.316764771938324e-05, 9.531248360872269e-05, 9.745731949806213e-05, 9.960215538740158e-05, 0.00010174699127674103, 0.00010389182716608047, 0.00010603666305541992]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 6.0, 7.0, 8.0, 3.0, 10.0, 17.0, 10.0, 28.0, 35.0, 44.0, 68.0, 100.0, 175.0, 272.0, 546.0, 1065.0, 2635.0, 7985.0, 63648.0, 924861.0, 36584.0, 6410.0, 1990.0, 875.0, 437.0, 218.0, 177.0, 106.0, 60.0, 57.0, 33.0, 23.0, 21.0, 9.0, 10.0, 5.0, 2.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07647037506103516, -0.07377815246582031, -0.07108592987060547, -0.06839370727539062, -0.06570148468017578, -0.06300926208496094, -0.060317039489746094, -0.05762481689453125, -0.054932594299316406, -0.05224037170410156, -0.04954814910888672, -0.046855926513671875, -0.04416370391845703, -0.04147148132324219, -0.038779258728027344, -0.0360870361328125, -0.033394813537597656, -0.030702590942382812, -0.02801036834716797, -0.025318145751953125, -0.02262592315673828, -0.019933700561523438, -0.017241477966308594, -0.01454925537109375, -0.011857032775878906, -0.009164810180664062, -0.006472587585449219, -0.003780364990234375, -0.0010881423950195312, 0.0016040802001953125, 0.004296302795410156, 0.006988525390625, 0.009680747985839844, 0.012372970581054688, 0.015065193176269531, 0.017757415771484375, 0.02044963836669922, 0.023141860961914062, 0.025834083557128906, 0.02852630615234375, 0.031218528747558594, 0.03391075134277344, 0.03660297393798828, 0.039295196533203125, 0.04198741912841797, 0.04467964172363281, 0.047371864318847656, 0.0500640869140625, 0.052756309509277344, 0.05544853210449219, 0.05814075469970703, 0.060832977294921875, 0.06352519989013672, 0.06621742248535156, 0.0689096450805664, 0.07160186767578125, 0.0742940902709961, 0.07698631286621094, 0.07967853546142578, 0.08237075805664062, 0.08506298065185547, 0.08775520324707031, 0.09044742584228516, 0.0931396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 14.0, 21.0, 22.0, 33.0, 70.0, 173.0, 324.0, 132.0, 59.0, 44.0, 26.0, 18.0, 13.0, 5.0, 5.0, 8.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0171661376953125, -0.016760945320129395, -0.01635575294494629, -0.015950560569763184, -0.015545368194580078, -0.015140175819396973, -0.014734983444213867, -0.014329791069030762, -0.013924598693847656, -0.01351940631866455, -0.013114213943481445, -0.01270902156829834, -0.012303829193115234, -0.011898636817932129, -0.011493444442749023, -0.011088252067565918, -0.010683059692382812, -0.010277867317199707, -0.009872674942016602, -0.009467482566833496, -0.00906229019165039, -0.008657097816467285, -0.00825190544128418, -0.007846713066101074, -0.007441520690917969, -0.007036328315734863, -0.006631135940551758, -0.006225943565368652, -0.005820751190185547, -0.005415558815002441, -0.005010366439819336, -0.0046051740646362305, -0.004199981689453125, -0.0037947893142700195, -0.003389596939086914, -0.0029844045639038086, -0.002579212188720703, -0.0021740198135375977, -0.0017688274383544922, -0.0013636350631713867, -0.0009584426879882812, -0.0005532503128051758, -0.0001480579376220703, 0.00025713443756103516, 0.0006623268127441406, 0.001067519187927246, 0.0014727115631103516, 0.001877903938293457, 0.0022830963134765625, 0.002688288688659668, 0.0030934810638427734, 0.003498673439025879, 0.0039038658142089844, 0.00430905818939209, 0.004714250564575195, 0.005119442939758301, 0.005524635314941406, 0.005929827690124512, 0.006335020065307617, 0.006740212440490723, 0.007145404815673828, 0.007550597190856934, 0.007955789566040039, 0.008360981941223145, 0.00876617431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 16.0, 29.0, 54.0, 123.0, 244.0, 226.0, 151.0, 55.0, 36.0, 15.0, 12.0, 5.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8232192993164062, -3.71435284614563, -3.6054863929748535, -3.496619939804077, -3.387753486633301, -3.2788872718811035, -3.170020818710327, -3.061154365539551, -2.9522879123687744, -2.843421459197998, -2.7345550060272217, -2.6256885528564453, -2.516822338104248, -2.4079556465148926, -2.2990894317626953, -2.190222978591919, -2.0813565254211426, -1.9724900722503662, -1.8636236190795898, -1.754757285118103, -1.6458908319473267, -1.5370243787765503, -1.4281580448150635, -1.319291591644287, -1.2104251384735107, -1.1015586853027344, -0.9926922917366028, -0.8838258981704712, -0.7749594449996948, -0.6660929918289185, -0.5572265982627869, -0.4483602046966553, -0.3394935131072998, -0.23062708973884583, -0.12176066637039185, -0.012894243001937866, 0.09597218036651611, 0.20483863353729248, 0.3137050271034241, 0.42257142066955566, 0.531437873840332, 0.6403043270111084, 0.74917072057724, 0.8580371141433716, 0.966903567314148, 1.0757700204849243, 1.1846363544464111, 1.2935028076171875, 1.4023692607879639, 1.5112357139587402, 1.6201021671295166, 1.7289685010910034, 1.8378349542617798, 1.9467014074325562, 2.055567741394043, 2.1644341945648193, 2.2733006477355957, 2.382167100906372, 2.4910335540771484, 2.599900007247925, 2.708766460418701, 2.8176326751708984, 2.926499128341675, 3.035365581512451, 3.1442320346832275]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 12.0, 8.0, 11.0, 12.0, 18.0, 23.0, 30.0, 48.0, 58.0, 64.0, 79.0, 85.0, 80.0, 64.0, 83.0, 61.0, 51.0, 45.0, 41.0, 35.0, 14.0, 21.0, 16.0, 7.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2564345598220825, -1.2110927104949951, -1.1657508611679077, -1.1204090118408203, -1.075067162513733, -1.0297253131866455, -0.9843835234642029, -0.9390417337417603, -0.8936998844146729, -0.8483580350875854, -0.803016185760498, -0.7576743364334106, -0.712332546710968, -0.6669906973838806, -0.6216488480567932, -0.5763070583343506, -0.5309651494026184, -0.485623300075531, -0.440281480550766, -0.3949396312236786, -0.3495978116989136, -0.30425596237182617, -0.25891411304473877, -0.21357229351997375, -0.16823044419288635, -0.12288860976696014, -0.07754676789045334, -0.03220492601394653, 0.013136908411979675, 0.058478742837905884, 0.10382059216499329, 0.1491624116897583, 0.1945042610168457, 0.2398460954427719, 0.2851879298686981, 0.3305297791957855, 0.37587159872055054, 0.42121344804763794, 0.46655529737472534, 0.511897087097168, 0.5572389364242554, 0.6025807857513428, 0.6479226350784302, 0.6932644844055176, 0.7386062741279602, 0.7839481234550476, 0.829289972782135, 0.8746317625045776, 0.9199736714363098, 0.9653155207633972, 1.0106573104858398, 1.0559991598129272, 1.1013410091400146, 1.146682858467102, 1.1920247077941895, 1.2373665571212769, 1.2827084064483643, 1.3280502557754517, 1.373392105102539, 1.4187339544296265, 1.4640758037567139, 1.5094175338745117, 1.5547595024108887, 1.6001012325286865, 1.645443081855774]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 5.0, 4.0, 4.0, 8.0, 18.0, 36.0, 88.0, 287.0, 2050.0, 52535.0, 966615.0, 25169.0, 1320.0, 233.0, 78.0, 31.0, 16.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.51171875, -4.326904296875, -4.14208984375, -3.957275390625, -3.7724609375, -3.587646484375, -3.40283203125, -3.218017578125, -3.033203125, -2.848388671875, -2.66357421875, -2.478759765625, -2.2939453125, -2.109130859375, -1.92431640625, -1.739501953125, -1.5546875, -1.369873046875, -1.18505859375, -1.000244140625, -0.8154296875, -0.630615234375, -0.44580078125, -0.260986328125, -0.076171875, 0.108642578125, 0.29345703125, 0.478271484375, 0.6630859375, 0.847900390625, 1.03271484375, 1.217529296875, 1.40234375, 1.587158203125, 1.77197265625, 1.956787109375, 2.1416015625, 2.326416015625, 2.51123046875, 2.696044921875, 2.880859375, 3.065673828125, 3.25048828125, 3.435302734375, 3.6201171875, 3.804931640625, 3.98974609375, 4.174560546875, 4.359375, 4.544189453125, 4.72900390625, 4.913818359375, 5.0986328125, 5.283447265625, 5.46826171875, 5.653076171875, 5.837890625, 6.022705078125, 6.20751953125, 6.392333984375, 6.5771484375, 6.761962890625, 6.94677734375, 7.131591796875, 7.31640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 9.0, 7.0, 15.0, 16.0, 18.0, 33.0, 46.0, 37.0, 60.0, 65.0, 66.0, 69.0, 91.0, 75.0, 64.0, 58.0, 57.0, 39.0, 31.0, 23.0, 23.0, 20.0, 12.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.064453125, -2.969573974609375, -2.87469482421875, -2.779815673828125, -2.6849365234375, -2.590057373046875, -2.49517822265625, -2.400299072265625, -2.305419921875, -2.210540771484375, -2.11566162109375, -2.020782470703125, -1.9259033203125, -1.831024169921875, -1.73614501953125, -1.641265869140625, -1.54638671875, -1.451507568359375, -1.35662841796875, -1.261749267578125, -1.1668701171875, -1.071990966796875, -0.97711181640625, -0.882232666015625, -0.787353515625, -0.692474365234375, -0.59759521484375, -0.502716064453125, -0.4078369140625, -0.312957763671875, -0.21807861328125, -0.123199462890625, -0.0283203125, 0.066558837890625, 0.16143798828125, 0.256317138671875, 0.3511962890625, 0.446075439453125, 0.54095458984375, 0.635833740234375, 0.730712890625, 0.825592041015625, 0.92047119140625, 1.015350341796875, 1.1102294921875, 1.205108642578125, 1.29998779296875, 1.394866943359375, 1.48974609375, 1.584625244140625, 1.67950439453125, 1.774383544921875, 1.8692626953125, 1.964141845703125, 2.05902099609375, 2.153900146484375, 2.248779296875, 2.343658447265625, 2.43853759765625, 2.533416748046875, 2.6282958984375, 2.723175048828125, 2.81805419921875, 2.912933349609375, 3.0078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 12.0, 14.0, 18.0, 24.0, 11.0, 20.0, 32.0, 31.0, 33.0, 45.0, 61.0, 83.0, 100.0, 143.0, 265.0, 865.0, 4561.0, 55435.0, 868115.0, 109736.0, 6794.0, 1137.0, 321.0, 154.0, 105.0, 78.0, 47.0, 59.0, 33.0, 49.0, 28.0, 17.0, 19.0, 17.0, 13.0, 9.0, 7.0, 7.0, 5.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.064453125, -2.970458984375, -2.87646484375, -2.782470703125, -2.6884765625, -2.594482421875, -2.50048828125, -2.406494140625, -2.3125, -2.218505859375, -2.12451171875, -2.030517578125, -1.9365234375, -1.842529296875, -1.74853515625, -1.654541015625, -1.560546875, -1.466552734375, -1.37255859375, -1.278564453125, -1.1845703125, -1.090576171875, -0.99658203125, -0.902587890625, -0.80859375, -0.714599609375, -0.62060546875, -0.526611328125, -0.4326171875, -0.338623046875, -0.24462890625, -0.150634765625, -0.056640625, 0.037353515625, 0.13134765625, 0.225341796875, 0.3193359375, 0.413330078125, 0.50732421875, 0.601318359375, 0.6953125, 0.789306640625, 0.88330078125, 0.977294921875, 1.0712890625, 1.165283203125, 1.25927734375, 1.353271484375, 1.447265625, 1.541259765625, 1.63525390625, 1.729248046875, 1.8232421875, 1.917236328125, 2.01123046875, 2.105224609375, 2.19921875, 2.293212890625, 2.38720703125, 2.481201171875, 2.5751953125, 2.669189453125, 2.76318359375, 2.857177734375, 2.951171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 10.0, 12.0, 11.0, 13.0, 14.0, 16.0, 19.0, 26.0, 29.0, 30.0, 27.0, 27.0, 33.0, 45.0, 32.0, 42.0, 34.0, 48.0, 34.0, 39.0, 45.0, 32.0, 40.0, 30.0, 35.0, 32.0, 24.0, 32.0, 25.0, 24.0, 15.0, 21.0, 13.0, 10.0, 8.0, 10.0, 4.0, 5.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.3671875, -2.294708251953125, -2.22222900390625, -2.149749755859375, -2.0772705078125, -2.004791259765625, -1.93231201171875, -1.859832763671875, -1.787353515625, -1.714874267578125, -1.64239501953125, -1.569915771484375, -1.4974365234375, -1.424957275390625, -1.35247802734375, -1.279998779296875, -1.20751953125, -1.135040283203125, -1.06256103515625, -0.990081787109375, -0.9176025390625, -0.845123291015625, -0.77264404296875, -0.700164794921875, -0.627685546875, -0.555206298828125, -0.48272705078125, -0.410247802734375, -0.3377685546875, -0.265289306640625, -0.19281005859375, -0.120330810546875, -0.0478515625, 0.024627685546875, 0.09710693359375, 0.169586181640625, 0.2420654296875, 0.314544677734375, 0.38702392578125, 0.459503173828125, 0.531982421875, 0.604461669921875, 0.67694091796875, 0.749420166015625, 0.8218994140625, 0.894378662109375, 0.96685791015625, 1.039337158203125, 1.11181640625, 1.184295654296875, 1.25677490234375, 1.329254150390625, 1.4017333984375, 1.474212646484375, 1.54669189453125, 1.619171142578125, 1.691650390625, 1.764129638671875, 1.83660888671875, 1.909088134765625, 1.9815673828125, 2.054046630859375, 2.12652587890625, 2.199005126953125, 2.271484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 14.0, 17.0, 18.0, 44.0, 53.0, 90.0, 142.0, 212.0, 346.0, 617.0, 975.0, 2081.0, 4205.0, 10050.0, 28631.0, 110217.0, 504842.0, 292142.0, 61922.0, 18179.0, 6972.0, 3179.0, 1487.0, 811.0, 515.0, 267.0, 164.0, 130.0, 65.0, 43.0, 31.0, 19.0, 18.0, 8.0, 8.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3742332458496094, -0.36077117919921875, -0.3473091125488281, -0.3338470458984375, -0.3203849792480469, -0.30692291259765625, -0.2934608459472656, -0.279998779296875, -0.2665367126464844, -0.25307464599609375, -0.23961257934570312, -0.2261505126953125, -0.21268844604492188, -0.19922637939453125, -0.18576431274414062, -0.17230224609375, -0.15884017944335938, -0.14537811279296875, -0.13191604614257812, -0.1184539794921875, -0.10499191284179688, -0.09152984619140625, -0.07806777954101562, -0.064605712890625, -0.051143646240234375, -0.03768157958984375, -0.024219512939453125, -0.0107574462890625, 0.002704620361328125, 0.01616668701171875, 0.029628753662109375, 0.0430908203125, 0.056552886962890625, 0.07001495361328125, 0.08347702026367188, 0.0969390869140625, 0.11040115356445312, 0.12386322021484375, 0.13732528686523438, 0.150787353515625, 0.16424942016601562, 0.17771148681640625, 0.19117355346679688, 0.2046356201171875, 0.21809768676757812, 0.23155975341796875, 0.24502182006835938, 0.25848388671875, 0.2719459533691406, 0.28540802001953125, 0.2988700866699219, 0.3123321533203125, 0.3257942199707031, 0.33925628662109375, 0.3527183532714844, 0.366180419921875, 0.3796424865722656, 0.39310455322265625, 0.4065666198730469, 0.4200286865234375, 0.4334907531738281, 0.44695281982421875, 0.4604148864746094, 0.473876953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 14.0, 20.0, 33.0, 44.0, 54.0, 82.0, 96.0, 107.0, 116.0, 110.0, 105.0, 57.0, 41.0, 31.0, 24.0, 17.0, 8.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.775161743164062e-05, -9.451806545257568e-05, -9.128451347351074e-05, -8.80509614944458e-05, -8.481740951538086e-05, -8.158385753631592e-05, -7.835030555725098e-05, -7.511675357818604e-05, -7.18832015991211e-05, -6.864964962005615e-05, -6.541609764099121e-05, -6.218254566192627e-05, -5.894899368286133e-05, -5.571544170379639e-05, -5.2481889724731445e-05, -4.9248337745666504e-05, -4.601478576660156e-05, -4.278123378753662e-05, -3.954768180847168e-05, -3.631412982940674e-05, -3.30805778503418e-05, -2.9847025871276855e-05, -2.6613473892211914e-05, -2.3379921913146973e-05, -2.014636993408203e-05, -1.691281795501709e-05, -1.3679265975952148e-05, -1.0445713996887207e-05, -7.212162017822266e-06, -3.978610038757324e-06, -7.450580596923828e-07, 2.4884939193725586e-06, 5.7220458984375e-06, 8.955597877502441e-06, 1.2189149856567383e-05, 1.5422701835632324e-05, 1.8656253814697266e-05, 2.1889805793762207e-05, 2.512335777282715e-05, 2.835690975189209e-05, 3.159046173095703e-05, 3.482401371002197e-05, 3.8057565689086914e-05, 4.1291117668151855e-05, 4.45246696472168e-05, 4.775822162628174e-05, 5.099177360534668e-05, 5.422532558441162e-05, 5.745887756347656e-05, 6.0692429542541504e-05, 6.392598152160645e-05, 6.715953350067139e-05, 7.039308547973633e-05, 7.362663745880127e-05, 7.686018943786621e-05, 8.009374141693115e-05, 8.33272933959961e-05, 8.656084537506104e-05, 8.979439735412598e-05, 9.302794933319092e-05, 9.626150131225586e-05, 9.94950532913208e-05, 0.00010272860527038574, 0.00010596215724945068, 0.00010919570922851562]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 12.0, 14.0, 7.0, 19.0, 36.0, 36.0, 61.0, 75.0, 110.0, 186.0, 246.0, 474.0, 890.0, 1872.0, 4191.0, 11225.0, 39824.0, 224842.0, 606728.0, 118754.0, 24890.0, 7713.0, 3061.0, 1433.0, 751.0, 402.0, 236.0, 150.0, 91.0, 56.0, 34.0, 24.0, 24.0, 12.0, 11.0, 18.0, 10.0, 7.0, 7.0, 2.0, 1.0, 7.0, 1.0, 1.0, 0.0, 4.0], "bins": [-0.60302734375, -0.5864295959472656, -0.5698318481445312, -0.5532341003417969, -0.5366363525390625, -0.5200386047363281, -0.5034408569335938, -0.4868431091308594, -0.470245361328125, -0.4536476135253906, -0.43704986572265625, -0.4204521179199219, -0.4038543701171875, -0.3872566223144531, -0.37065887451171875, -0.3540611267089844, -0.33746337890625, -0.3208656311035156, -0.30426788330078125, -0.2876701354980469, -0.2710723876953125, -0.2544746398925781, -0.23787689208984375, -0.22127914428710938, -0.204681396484375, -0.18808364868164062, -0.17148590087890625, -0.15488815307617188, -0.1382904052734375, -0.12169265747070312, -0.10509490966796875, -0.08849716186523438, -0.0718994140625, -0.055301666259765625, -0.03870391845703125, -0.022106170654296875, -0.0055084228515625, 0.011089324951171875, 0.02768707275390625, 0.044284820556640625, 0.060882568359375, 0.07748031616210938, 0.09407806396484375, 0.11067581176757812, 0.1272735595703125, 0.14387130737304688, 0.16046905517578125, 0.17706680297851562, 0.19366455078125, 0.21026229858398438, 0.22686004638671875, 0.24345779418945312, 0.2600555419921875, 0.2766532897949219, 0.29325103759765625, 0.3098487854003906, 0.326446533203125, 0.3430442810058594, 0.35964202880859375, 0.3762397766113281, 0.3928375244140625, 0.4094352722167969, 0.42603302001953125, 0.4426307678222656, 0.459228515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 8.0, 0.0, 6.0, 9.0, 8.0, 7.0, 10.0, 10.0, 17.0, 17.0, 47.0, 46.0, 43.0, 74.0, 73.0, 99.0, 105.0, 88.0, 84.0, 56.0, 49.0, 34.0, 25.0, 15.0, 12.0, 10.0, 11.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2507362365722656, -0.24317169189453125, -0.23560714721679688, -0.2280426025390625, -0.22047805786132812, -0.21291351318359375, -0.20534896850585938, -0.197784423828125, -0.19021987915039062, -0.18265533447265625, -0.17509078979492188, -0.1675262451171875, -0.15996170043945312, -0.15239715576171875, -0.14483261108398438, -0.13726806640625, -0.12970352172851562, -0.12213897705078125, -0.11457443237304688, -0.1070098876953125, -0.09944534301757812, -0.09188079833984375, -0.08431625366210938, -0.076751708984375, -0.06918716430664062, -0.06162261962890625, -0.054058074951171875, -0.0464935302734375, -0.038928985595703125, -0.03136444091796875, -0.023799896240234375, -0.0162353515625, -0.008670806884765625, -0.00110626220703125, 0.006458282470703125, 0.0140228271484375, 0.021587371826171875, 0.02915191650390625, 0.036716461181640625, 0.044281005859375, 0.051845550537109375, 0.05941009521484375, 0.06697463989257812, 0.0745391845703125, 0.08210372924804688, 0.08966827392578125, 0.09723281860351562, 0.10479736328125, 0.11236190795898438, 0.11992645263671875, 0.12749099731445312, 0.1350555419921875, 0.14262008666992188, 0.15018463134765625, 0.15774917602539062, 0.165313720703125, 0.17287826538085938, 0.18044281005859375, 0.18800735473632812, 0.1955718994140625, 0.20313644409179688, 0.21070098876953125, 0.21826553344726562, 0.225830078125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 16.0, 49.0, 130.0, 338.0, 280.0, 112.0, 31.0, 15.0, 8.0, 10.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.274903297424316, -13.925827026367188, -13.576750755310059, -13.22767448425293, -12.8785982131958, -12.529521942138672, -12.180445671081543, -11.831369400024414, -11.482293128967285, -11.133216857910156, -10.784140586853027, -10.435064315795898, -10.08598804473877, -9.73691177368164, -9.387835502624512, -9.038759231567383, -8.689682960510254, -8.340606689453125, -7.991530418395996, -7.642454147338867, -7.293377876281738, -6.944301605224609, -6.5952253341674805, -6.246149063110352, -5.897072792053223, -5.547996520996094, -5.198920249938965, -4.849843978881836, -4.500767707824707, -4.151691436767578, -3.802615165710449, -3.4535388946533203, -3.1044626235961914, -2.7553863525390625, -2.4063100814819336, -2.0572338104248047, -1.7081575393676758, -1.3590812683105469, -1.010004997253418, -0.6609287261962891, -0.31185245513916016, 0.03722381591796875, 0.38630008697509766, 0.7353763580322266, 1.0844526290893555, 1.4335289001464844, 1.7826051712036133, 2.131681442260742, 2.480757713317871, 2.829833984375, 3.178910255432129, 3.527986526489258, 3.8770627975463867, 4.226139068603516, 4.5752153396606445, 4.924291610717773, 5.273367881774902, 5.622444152832031, 5.97152042388916, 6.320596694946289, 6.669672966003418, 7.018749237060547, 7.367825508117676, 7.716901779174805, 8.065978050231934]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 10.0, 13.0, 12.0, 14.0, 13.0, 17.0, 23.0, 16.0, 28.0, 32.0, 42.0, 30.0, 27.0, 45.0, 43.0, 54.0, 49.0, 63.0, 43.0, 41.0, 49.0, 39.0, 36.0, 37.0, 29.0, 30.0, 30.0, 14.0, 18.0, 15.0, 15.0, 12.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.055614471435547, -3.9046711921691895, -3.753728151321411, -3.602785110473633, -3.4518418312072754, -3.300898551940918, -3.1499555110931396, -2.9990124702453613, -2.848069190979004, -2.6971259117126465, -2.546182870864868, -2.39523983001709, -2.2442965507507324, -2.093353271484375, -1.9424102306365967, -1.7914670705795288, -1.640523910522461, -1.489580750465393, -1.3386375904083252, -1.1876944303512573, -1.0367512702941895, -0.8858081102371216, -0.7348649501800537, -0.5839217901229858, -0.43297863006591797, -0.2820354700088501, -0.13109230995178223, 0.019850850105285645, 0.17079401016235352, 0.3217371702194214, 0.47268033027648926, 0.6236234903335571, 0.7745671272277832, 0.9255102872848511, 1.076453447341919, 1.2273966073989868, 1.3783397674560547, 1.5292829275131226, 1.6802260875701904, 1.8311692476272583, 1.9821124076843262, 2.1330556869506836, 2.283998727798462, 2.4349417686462402, 2.5858850479125977, 2.736828327178955, 2.8877713680267334, 3.0387144088745117, 3.189657688140869, 3.3406009674072266, 3.491544008255005, 3.642487049102783, 3.7934303283691406, 3.944373607635498, 4.0953168869018555, 4.246259689331055, 4.397202968597412, 4.5481462478637695, 4.699089050292969, 4.850032329559326, 5.000975608825684, 5.151918888092041, 5.302862167358398, 5.453804969787598, 5.604748249053955]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 14.0, 16.0, 14.0, 15.0, 25.0, 35.0, 62.0, 75.0, 144.0, 205.0, 382.0, 610.0, 1152.0, 2208.0, 5146.0, 14479.0, 54614.0, 517049.0, 3410533.0, 144409.0, 27326.0, 8693.0, 3461.0, 1569.0, 819.0, 475.0, 254.0, 147.0, 112.0, 67.0, 59.0, 22.0, 25.0, 20.0, 16.0, 11.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.12109375, -2.048614501953125, -1.97613525390625, -1.903656005859375, -1.8311767578125, -1.758697509765625, -1.68621826171875, -1.613739013671875, -1.541259765625, -1.468780517578125, -1.39630126953125, -1.323822021484375, -1.2513427734375, -1.178863525390625, -1.10638427734375, -1.033905029296875, -0.96142578125, -0.888946533203125, -0.81646728515625, -0.743988037109375, -0.6715087890625, -0.599029541015625, -0.52655029296875, -0.454071044921875, -0.381591796875, -0.309112548828125, -0.23663330078125, -0.164154052734375, -0.0916748046875, -0.019195556640625, 0.05328369140625, 0.125762939453125, 0.1982421875, 0.270721435546875, 0.34320068359375, 0.415679931640625, 0.4881591796875, 0.560638427734375, 0.63311767578125, 0.705596923828125, 0.778076171875, 0.850555419921875, 0.92303466796875, 0.995513916015625, 1.0679931640625, 1.140472412109375, 1.21295166015625, 1.285430908203125, 1.35791015625, 1.430389404296875, 1.50286865234375, 1.575347900390625, 1.6478271484375, 1.720306396484375, 1.79278564453125, 1.865264892578125, 1.937744140625, 2.010223388671875, 2.08270263671875, 2.155181884765625, 2.2276611328125, 2.300140380859375, 2.37261962890625, 2.445098876953125, 2.517578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 11.0, 9.0, 16.0, 16.0, 25.0, 21.0, 34.0, 52.0, 46.0, 56.0, 73.0, 71.0, 77.0, 70.0, 71.0, 62.0, 56.0, 55.0, 35.0, 29.0, 24.0, 11.0, 14.0, 14.0, 15.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8134765625, -1.7582244873046875, -1.702972412109375, -1.6477203369140625, -1.59246826171875, -1.5372161865234375, -1.481964111328125, -1.4267120361328125, -1.3714599609375, -1.3162078857421875, -1.260955810546875, -1.2057037353515625, -1.15045166015625, -1.0951995849609375, -1.039947509765625, -0.9846954345703125, -0.929443359375, -0.8741912841796875, -0.818939208984375, -0.7636871337890625, -0.70843505859375, -0.6531829833984375, -0.597930908203125, -0.5426788330078125, -0.4874267578125, -0.4321746826171875, -0.376922607421875, -0.3216705322265625, -0.26641845703125, -0.2111663818359375, -0.155914306640625, -0.1006622314453125, -0.04541015625, 0.0098419189453125, 0.065093994140625, 0.1203460693359375, 0.17559814453125, 0.2308502197265625, 0.286102294921875, 0.3413543701171875, 0.3966064453125, 0.4518585205078125, 0.507110595703125, 0.5623626708984375, 0.61761474609375, 0.6728668212890625, 0.728118896484375, 0.7833709716796875, 0.838623046875, 0.8938751220703125, 0.949127197265625, 1.0043792724609375, 1.05963134765625, 1.1148834228515625, 1.170135498046875, 1.2253875732421875, 1.2806396484375, 1.3358917236328125, 1.391143798828125, 1.4463958740234375, 1.50164794921875, 1.5569000244140625, 1.612152099609375, 1.6674041748046875, 1.72265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 5.0, 9.0, 14.0, 22.0, 18.0, 29.0, 34.0, 95.0, 208.0, 496.0, 2104.0, 25208.0, 4067669.0, 93143.0, 3978.0, 717.0, 231.0, 109.0, 64.0, 38.0, 32.0, 15.0, 8.0, 9.0, 4.0, 4.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.455322265625, -5.24267578125, -5.030029296875, -4.8173828125, -4.604736328125, -4.39208984375, -4.179443359375, -3.966796875, -3.754150390625, -3.54150390625, -3.328857421875, -3.1162109375, -2.903564453125, -2.69091796875, -2.478271484375, -2.265625, -2.052978515625, -1.84033203125, -1.627685546875, -1.4150390625, -1.202392578125, -0.98974609375, -0.777099609375, -0.564453125, -0.351806640625, -0.13916015625, 0.073486328125, 0.2861328125, 0.498779296875, 0.71142578125, 0.924072265625, 1.13671875, 1.349365234375, 1.56201171875, 1.774658203125, 1.9873046875, 2.199951171875, 2.41259765625, 2.625244140625, 2.837890625, 3.050537109375, 3.26318359375, 3.475830078125, 3.6884765625, 3.901123046875, 4.11376953125, 4.326416015625, 4.5390625, 4.751708984375, 4.96435546875, 5.177001953125, 5.3896484375, 5.602294921875, 5.81494140625, 6.027587890625, 6.240234375, 6.452880859375, 6.66552734375, 6.878173828125, 7.0908203125, 7.303466796875, 7.51611328125, 7.728759765625, 7.94140625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 11.0, 9.0, 20.0, 23.0, 44.0, 52.0, 93.0, 104.0, 205.0, 442.0, 1618.0, 760.0, 236.0, 157.0, 94.0, 55.0, 39.0, 29.0, 24.0, 15.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82861328125, -0.8054351806640625, -0.782257080078125, -0.7590789794921875, -0.73590087890625, -0.7127227783203125, -0.689544677734375, -0.6663665771484375, -0.6431884765625, -0.6200103759765625, -0.596832275390625, -0.5736541748046875, -0.55047607421875, -0.5272979736328125, -0.504119873046875, -0.4809417724609375, -0.457763671875, -0.4345855712890625, -0.411407470703125, -0.3882293701171875, -0.36505126953125, -0.3418731689453125, -0.318695068359375, -0.2955169677734375, -0.2723388671875, -0.2491607666015625, -0.225982666015625, -0.2028045654296875, -0.17962646484375, -0.1564483642578125, -0.133270263671875, -0.1100921630859375, -0.0869140625, -0.0637359619140625, -0.040557861328125, -0.0173797607421875, 0.00579833984375, 0.0289764404296875, 0.052154541015625, 0.0753326416015625, 0.0985107421875, 0.1216888427734375, 0.144866943359375, 0.1680450439453125, 0.19122314453125, 0.2144012451171875, 0.237579345703125, 0.2607574462890625, 0.283935546875, 0.3071136474609375, 0.330291748046875, 0.3534698486328125, 0.37664794921875, 0.3998260498046875, 0.423004150390625, 0.4461822509765625, 0.4693603515625, 0.4925384521484375, 0.515716552734375, 0.5388946533203125, 0.56207275390625, 0.5852508544921875, 0.608428955078125, 0.6316070556640625, 0.65478515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 13.0, 15.0, 21.0, 50.0, 88.0, 190.0, 235.0, 188.0, 81.0, 43.0, 22.0, 13.0, 8.0, 9.0, 11.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.692881107330322, -6.5391998291015625, -6.385518550872803, -6.231837749481201, -6.078156471252441, -5.924475193023682, -5.770793914794922, -5.617112636566162, -5.463431358337402, -5.309750080108643, -5.156068801879883, -5.002388000488281, -4.8487067222595215, -4.695025444030762, -4.541344165802002, -4.387662887573242, -4.233982086181641, -4.080300807952881, -3.9266197681427, -3.7729384899139404, -3.6192574501037598, -3.465576171875, -3.3118948936462402, -3.1582136154174805, -3.0045325756073, -2.85085129737854, -2.6971702575683594, -2.5434889793395996, -2.38980770111084, -2.236126661300659, -2.0824453830718994, -1.9287642240524292, -1.775083303451538, -1.6214021444320679, -1.4677209854125977, -1.314039707183838, -1.1603585481643677, -1.0066773891448975, -0.8529961705207825, -0.6993149518966675, -0.5456337928771973, -0.39195260405540466, -0.23827141523361206, -0.08459022641181946, 0.06909096240997314, 0.22277212142944336, 0.37645334005355835, 0.5301345586776733, 0.6838157176971436, 0.8374968767166138, 0.9911780953407288, 1.1448593139648438, 1.298540472984314, 1.4522216320037842, 1.605902910232544, 1.7595840692520142, 1.9132652282714844, 2.066946506500244, 2.220627546310425, 2.3743088245391846, 2.5279898643493652, 2.681671142578125, 2.8353524208068848, 2.9890336990356445, 3.142714738845825]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 13.0, 16.0, 18.0, 18.0, 23.0, 32.0, 40.0, 56.0, 51.0, 57.0, 73.0, 49.0, 63.0, 78.0, 63.0, 65.0, 46.0, 50.0, 25.0, 30.0, 24.0, 16.0, 17.0, 13.0, 11.0, 11.0, 4.0, 7.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7186754941940308, -1.656463861465454, -1.594252347946167, -1.5320407152175903, -1.4698290824890137, -1.407617449760437, -1.3454058170318604, -1.2831943035125732, -1.2209826707839966, -1.15877103805542, -1.0965595245361328, -1.0343478918075562, -0.9721362590789795, -0.9099246263504028, -0.847713053226471, -0.7855014801025391, -0.7232898473739624, -0.6610782146453857, -0.5988666415214539, -0.536655068397522, -0.4744434356689453, -0.41223183274269104, -0.35002022981643677, -0.2878086268901825, -0.22559702396392822, -0.16338542103767395, -0.10117381811141968, -0.038962215185165405, 0.023249387741088867, 0.08546099066734314, 0.1476725935935974, 0.20988419651985168, 0.2720959186553955, 0.3343075215816498, 0.39651912450790405, 0.4587307274341583, 0.5209423303604126, 0.5831539630889893, 0.6453655362129211, 0.707577109336853, 0.7697887420654297, 0.8320003747940063, 0.8942119479179382, 0.9564235210418701, 1.0186351537704468, 1.0808467864990234, 1.1430583000183105, 1.2052699327468872, 1.2674815654754639, 1.3296931982040405, 1.3919048309326172, 1.4541163444519043, 1.516327977180481, 1.5785396099090576, 1.6407511234283447, 1.7029627561569214, 1.765174388885498, 1.8273860216140747, 1.8895976543426514, 1.9518091678619385, 2.0140209197998047, 2.076232433319092, 2.138443946838379, 2.200655698776245, 2.2628672122955322]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 3.0, 4.0, 9.0, 9.0, 18.0, 20.0, 15.0, 33.0, 53.0, 83.0, 126.0, 176.0, 257.0, 424.0, 702.0, 1174.0, 2101.0, 4217.0, 8470.0, 19796.0, 56936.0, 212582.0, 502344.0, 161046.0, 45767.0, 16658.0, 7196.0, 3625.0, 1841.0, 1084.0, 643.0, 385.0, 274.0, 162.0, 97.0, 69.0, 38.0, 33.0, 25.0, 21.0, 14.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09918212890625, -0.0958089828491211, -0.09243583679199219, -0.08906269073486328, -0.08568954467773438, -0.08231639862060547, -0.07894325256347656, -0.07557010650634766, -0.07219696044921875, -0.06882381439208984, -0.06545066833496094, -0.06207752227783203, -0.058704376220703125, -0.05533123016357422, -0.05195808410644531, -0.048584938049316406, -0.0452117919921875, -0.041838645935058594, -0.03846549987792969, -0.03509235382080078, -0.031719207763671875, -0.02834606170654297, -0.024972915649414062, -0.021599769592285156, -0.01822662353515625, -0.014853477478027344, -0.011480331420898438, -0.008107185363769531, -0.004734039306640625, -0.0013608932495117188, 0.0020122528076171875, 0.005385398864746094, 0.008758544921875, 0.012131690979003906, 0.015504837036132812, 0.01887798309326172, 0.022251129150390625, 0.02562427520751953, 0.028997421264648438, 0.032370567321777344, 0.03574371337890625, 0.039116859436035156, 0.04249000549316406, 0.04586315155029297, 0.049236297607421875, 0.05260944366455078, 0.05598258972167969, 0.059355735778808594, 0.0627288818359375, 0.0661020278930664, 0.06947517395019531, 0.07284832000732422, 0.07622146606445312, 0.07959461212158203, 0.08296775817871094, 0.08634090423583984, 0.08971405029296875, 0.09308719635009766, 0.09646034240722656, 0.09983348846435547, 0.10320663452148438, 0.10657978057861328, 0.10995292663574219, 0.1133260726928711, 0.11669921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 17.0, 22.0, 21.0, 29.0, 48.0, 54.0, 62.0, 78.0, 82.0, 100.0, 88.0, 77.0, 72.0, 54.0, 49.0, 32.0, 21.0, 24.0, 13.0, 9.0, 14.0, 3.0, 7.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5361328125, -1.4805755615234375, -1.425018310546875, -1.3694610595703125, -1.31390380859375, -1.2583465576171875, -1.202789306640625, -1.1472320556640625, -1.0916748046875, -1.0361175537109375, -0.980560302734375, -0.9250030517578125, -0.86944580078125, -0.8138885498046875, -0.758331298828125, -0.7027740478515625, -0.647216796875, -0.5916595458984375, -0.536102294921875, -0.4805450439453125, -0.42498779296875, -0.3694305419921875, -0.313873291015625, -0.2583160400390625, -0.2027587890625, -0.1472015380859375, -0.091644287109375, -0.0360870361328125, 0.01947021484375, 0.0750274658203125, 0.130584716796875, 0.1861419677734375, 0.24169921875, 0.2972564697265625, 0.352813720703125, 0.4083709716796875, 0.46392822265625, 0.5194854736328125, 0.575042724609375, 0.6305999755859375, 0.6861572265625, 0.7417144775390625, 0.797271728515625, 0.8528289794921875, 0.90838623046875, 0.9639434814453125, 1.019500732421875, 1.0750579833984375, 1.130615234375, 1.1861724853515625, 1.241729736328125, 1.2972869873046875, 1.35284423828125, 1.4084014892578125, 1.463958740234375, 1.5195159912109375, 1.5750732421875, 1.6306304931640625, 1.686187744140625, 1.7417449951171875, 1.79730224609375, 1.8528594970703125, 1.908416748046875, 1.9639739990234375, 2.01953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 10.0, 11.0, 12.0, 17.0, 29.0, 36.0, 42.0, 58.0, 95.0, 178.0, 207.0, 444.0, 1316.0, 7356.0, 104749.0, 825492.0, 98049.0, 7884.0, 1339.0, 462.0, 282.0, 149.0, 93.0, 54.0, 48.0, 36.0, 24.0, 19.0, 15.0, 12.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2117919921875, -0.2040882110595703, -0.19638442993164062, -0.18868064880371094, -0.18097686767578125, -0.17327308654785156, -0.16556930541992188, -0.1578655242919922, -0.1501617431640625, -0.1424579620361328, -0.13475418090820312, -0.12705039978027344, -0.11934661865234375, -0.11164283752441406, -0.10393905639648438, -0.09623527526855469, -0.088531494140625, -0.08082771301269531, -0.07312393188476562, -0.06542015075683594, -0.05771636962890625, -0.05001258850097656, -0.042308807373046875, -0.03460502624511719, -0.0269012451171875, -0.019197463989257812, -0.011493682861328125, -0.0037899017333984375, 0.00391387939453125, 0.011617660522460938, 0.019321441650390625, 0.027025222778320312, 0.03472900390625, 0.04243278503417969, 0.050136566162109375, 0.05784034729003906, 0.06554412841796875, 0.07324790954589844, 0.08095169067382812, 0.08865547180175781, 0.0963592529296875, 0.10406303405761719, 0.11176681518554688, 0.11947059631347656, 0.12717437744140625, 0.13487815856933594, 0.14258193969726562, 0.1502857208251953, 0.157989501953125, 0.1656932830810547, 0.17339706420898438, 0.18110084533691406, 0.18880462646484375, 0.19650840759277344, 0.20421218872070312, 0.2119159698486328, 0.2196197509765625, 0.2273235321044922, 0.23502731323242188, 0.24273109436035156, 0.25043487548828125, 0.25813865661621094, 0.2658424377441406, 0.2735462188720703, 0.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 4.0, 0.0, 5.0, 8.0, 9.0, 11.0, 25.0, 17.0, 25.0, 36.0, 34.0, 35.0, 46.0, 50.0, 42.0, 50.0, 41.0, 47.0, 65.0, 70.0, 55.0, 51.0, 44.0, 42.0, 31.0, 26.0, 24.0, 18.0, 20.0, 8.0, 14.0, 11.0, 9.0, 5.0, 3.0, 4.0, 5.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.173828125, -2.0953369140625, -2.016845703125, -1.9383544921875, -1.85986328125, -1.7813720703125, -1.702880859375, -1.6243896484375, -1.5458984375, -1.4674072265625, -1.388916015625, -1.3104248046875, -1.23193359375, -1.1534423828125, -1.074951171875, -0.9964599609375, -0.91796875, -0.8394775390625, -0.760986328125, -0.6824951171875, -0.60400390625, -0.5255126953125, -0.447021484375, -0.3685302734375, -0.2900390625, -0.2115478515625, -0.133056640625, -0.0545654296875, 0.02392578125, 0.1024169921875, 0.180908203125, 0.2593994140625, 0.337890625, 0.4163818359375, 0.494873046875, 0.5733642578125, 0.65185546875, 0.7303466796875, 0.808837890625, 0.8873291015625, 0.9658203125, 1.0443115234375, 1.122802734375, 1.2012939453125, 1.27978515625, 1.3582763671875, 1.436767578125, 1.5152587890625, 1.59375, 1.6722412109375, 1.750732421875, 1.8292236328125, 1.90771484375, 1.9862060546875, 2.064697265625, 2.1431884765625, 2.2216796875, 2.3001708984375, 2.378662109375, 2.4571533203125, 2.53564453125, 2.6141357421875, 2.692626953125, 2.7711181640625, 2.849609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 26.0, 32.0, 50.0, 87.0, 160.0, 316.0, 745.0, 2656.0, 569554.0, 470945.0, 2631.0, 586.0, 305.0, 155.0, 89.0, 51.0, 29.0, 26.0, 14.0, 13.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07598876953125, -0.07294845581054688, -0.06990814208984375, -0.06686782836914062, -0.0638275146484375, -0.060787200927734375, -0.05774688720703125, -0.054706573486328125, -0.051666259765625, -0.048625946044921875, -0.04558563232421875, -0.042545318603515625, -0.0395050048828125, -0.036464691162109375, -0.03342437744140625, -0.030384063720703125, -0.02734375, -0.024303436279296875, -0.02126312255859375, -0.018222808837890625, -0.0151824951171875, -0.012142181396484375, -0.00910186767578125, -0.006061553955078125, -0.003021240234375, 1.9073486328125e-05, 0.00305938720703125, 0.006099700927734375, 0.0091400146484375, 0.012180328369140625, 0.01522064208984375, 0.018260955810546875, 0.02130126953125, 0.024341583251953125, 0.02738189697265625, 0.030422210693359375, 0.0334625244140625, 0.036502838134765625, 0.03954315185546875, 0.042583465576171875, 0.045623779296875, 0.048664093017578125, 0.05170440673828125, 0.054744720458984375, 0.0577850341796875, 0.060825347900390625, 0.06386566162109375, 0.06690597534179688, 0.0699462890625, 0.07298660278320312, 0.07602691650390625, 0.07906723022460938, 0.0821075439453125, 0.08514785766601562, 0.08818817138671875, 0.09122848510742188, 0.094268798828125, 0.09730911254882812, 0.10034942626953125, 0.10338973999023438, 0.1064300537109375, 0.10947036743164062, 0.11251068115234375, 0.11555099487304688, 0.11859130859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 11.0, 7.0, 8.0, 14.0, 21.0, 22.0, 28.0, 43.0, 61.0, 70.0, 77.0, 87.0, 73.0, 81.0, 96.0, 76.0, 53.0, 41.0, 26.0, 30.0, 14.0, 16.0, 13.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.9739381968975067e-05, -1.915358006954193e-05, -1.8567778170108795e-05, -1.798197627067566e-05, -1.7396174371242523e-05, -1.6810372471809387e-05, -1.622457057237625e-05, -1.5638768672943115e-05, -1.505296677350998e-05, -1.4467164874076843e-05, -1.3881362974643707e-05, -1.3295561075210571e-05, -1.2709759175777435e-05, -1.21239572763443e-05, -1.1538155376911163e-05, -1.0952353477478027e-05, -1.0366551578044891e-05, -9.780749678611755e-06, -9.19494777917862e-06, -8.609145879745483e-06, -8.023343980312347e-06, -7.4375420808792114e-06, -6.8517401814460754e-06, -6.2659382820129395e-06, -5.6801363825798035e-06, -5.0943344831466675e-06, -4.5085325837135315e-06, -3.9227306842803955e-06, -3.3369287848472595e-06, -2.7511268854141235e-06, -2.1653249859809875e-06, -1.5795230865478516e-06, -9.937211871147156e-07, -4.079192876815796e-07, 1.778826117515564e-07, 7.636845111846924e-07, 1.3494864106178284e-06, 1.9352883100509644e-06, 2.5210902094841003e-06, 3.1068921089172363e-06, 3.6926940083503723e-06, 4.278495907783508e-06, 4.864297807216644e-06, 5.45009970664978e-06, 6.035901606082916e-06, 6.621703505516052e-06, 7.207505404949188e-06, 7.793307304382324e-06, 8.37910920381546e-06, 8.964911103248596e-06, 9.550713002681732e-06, 1.0136514902114868e-05, 1.0722316801548004e-05, 1.130811870098114e-05, 1.1893920600414276e-05, 1.2479722499847412e-05, 1.3065524399280548e-05, 1.3651326298713684e-05, 1.423712819814682e-05, 1.4822930097579956e-05, 1.5408731997013092e-05, 1.5994533896446228e-05, 1.6580335795879364e-05, 1.71661376953125e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 9.0, 25.0, 29.0, 39.0, 74.0, 141.0, 254.0, 670.0, 2006.0, 10616.0, 491193.0, 529911.0, 10491.0, 1933.0, 622.0, 254.0, 106.0, 64.0, 38.0, 21.0, 14.0, 10.0, 4.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0787353515625, -0.07570743560791016, -0.07267951965332031, -0.06965160369873047, -0.06662368774414062, -0.06359577178955078, -0.06056785583496094, -0.057539939880371094, -0.05451202392578125, -0.051484107971191406, -0.04845619201660156, -0.04542827606201172, -0.042400360107421875, -0.03937244415283203, -0.03634452819824219, -0.033316612243652344, -0.0302886962890625, -0.027260780334472656, -0.024232864379882812, -0.02120494842529297, -0.018177032470703125, -0.015149116516113281, -0.012121200561523438, -0.009093284606933594, -0.00606536865234375, -0.0030374526977539062, -9.5367431640625e-06, 0.0030183792114257812, 0.006046295166015625, 0.009074211120605469, 0.012102127075195312, 0.015130043029785156, 0.018157958984375, 0.021185874938964844, 0.024213790893554688, 0.02724170684814453, 0.030269622802734375, 0.03329753875732422, 0.03632545471191406, 0.039353370666503906, 0.04238128662109375, 0.045409202575683594, 0.04843711853027344, 0.05146503448486328, 0.054492950439453125, 0.05752086639404297, 0.06054878234863281, 0.06357669830322266, 0.0666046142578125, 0.06963253021240234, 0.07266044616699219, 0.07568836212158203, 0.07871627807617188, 0.08174419403076172, 0.08477210998535156, 0.0878000259399414, 0.09082794189453125, 0.0938558578491211, 0.09688377380371094, 0.09991168975830078, 0.10293960571289062, 0.10596752166748047, 0.10899543762207031, 0.11202335357666016, 0.11505126953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 12.0, 20.0, 29.0, 66.0, 168.0, 363.0, 135.0, 64.0, 22.0, 18.0, 17.0, 14.0, 10.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0205078125, -0.019943594932556152, -0.019379377365112305, -0.018815159797668457, -0.01825094223022461, -0.01768672466278076, -0.017122507095336914, -0.016558289527893066, -0.01599407196044922, -0.015429854393005371, -0.014865636825561523, -0.014301419258117676, -0.013737201690673828, -0.01317298412322998, -0.012608766555786133, -0.012044548988342285, -0.011480331420898438, -0.01091611385345459, -0.010351896286010742, -0.009787678718566895, -0.009223461151123047, -0.0086592435836792, -0.008095026016235352, -0.007530808448791504, -0.006966590881347656, -0.006402373313903809, -0.005838155746459961, -0.005273938179016113, -0.004709720611572266, -0.004145503044128418, -0.0035812854766845703, -0.0030170679092407227, -0.002452850341796875, -0.0018886327743530273, -0.0013244152069091797, -0.000760197639465332, -0.00019598007202148438, 0.0003682374954223633, 0.0009324550628662109, 0.0014966726303100586, 0.0020608901977539062, 0.002625107765197754, 0.0031893253326416016, 0.0037535429000854492, 0.004317760467529297, 0.0048819780349731445, 0.005446195602416992, 0.00601041316986084, 0.0065746307373046875, 0.007138848304748535, 0.007703065872192383, 0.00826728343963623, 0.008831501007080078, 0.009395718574523926, 0.009959936141967773, 0.010524153709411621, 0.011088371276855469, 0.011652588844299316, 0.012216806411743164, 0.012781023979187012, 0.01334524154663086, 0.013909459114074707, 0.014473676681518555, 0.015037894248962402, 0.01560211181640625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 16.0, 10.0, 25.0, 53.0, 97.0, 237.0, 299.0, 138.0, 56.0, 21.0, 14.0, 11.0, 16.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.168915271759033, -5.043398857116699, -4.917882442474365, -4.7923665046691895, -4.6668500900268555, -4.5413336753845215, -4.4158172607421875, -4.290301322937012, -4.164784908294678, -4.039268493652344, -3.913752317428589, -3.788235902786255, -3.6627197265625, -3.537203311920166, -3.411686897277832, -3.286170721054077, -3.160654306411743, -3.035137891769409, -2.9096217155456543, -2.7841053009033203, -2.6585891246795654, -2.5330727100372314, -2.4075565338134766, -2.2820401191711426, -2.1565237045288086, -2.0310072898864746, -1.9054911136627197, -1.7799746990203857, -1.6544585227966309, -1.5289421081542969, -1.4034258127212524, -1.277909517288208, -1.1523935794830322, -1.0268772840499878, -0.9013609886169434, -0.7758446335792542, -0.6503283381462097, -0.5248120427131653, -0.3992956876754761, -0.27377939224243164, -0.1482630968093872, -0.02274678647518158, 0.10276952385902405, 0.22828584909439087, 0.3538021445274353, 0.47931843996047974, 0.604834794998169, 0.7303510904312134, 0.8558673858642578, 0.9813836812973022, 1.1068999767303467, 1.2324163913726807, 1.3579325675964355, 1.4834489822387695, 1.608965277671814, 1.7344815731048584, 1.8599978685379028, 1.9855141639709473, 2.1110305786132812, 2.236546754837036, 2.36206316947937, 2.487579345703125, 2.613095760345459, 2.738612174987793, 2.864128351211548]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 16.0, 18.0, 18.0, 24.0, 27.0, 31.0, 55.0, 67.0, 71.0, 95.0, 70.0, 84.0, 87.0, 72.0, 56.0, 46.0, 35.0, 27.0, 22.0, 18.0, 14.0, 9.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3749933242797852, -1.3238755464553833, -1.272757887840271, -1.2216401100158691, -1.1705224514007568, -1.119404673576355, -1.0682870149612427, -1.0171692371368408, -0.9660515785217285, -0.9149338603019714, -0.8638161420822144, -0.8126984238624573, -0.7615807056427002, -0.7104629278182983, -0.659345269203186, -0.6082274913787842, -0.5571097731590271, -0.50599205493927, -0.45487433671951294, -0.40375661849975586, -0.3526389002799988, -0.3015211522579193, -0.25040343403816223, -0.19928571581840515, -0.14816799759864807, -0.09705027937889099, -0.045932553708553314, 0.005185171961784363, 0.05630289018154144, 0.10742062330245972, 0.1585383415222168, 0.20965605974197388, 0.26077377796173096, 0.31189149618148804, 0.3630092144012451, 0.4141269326210022, 0.4652446508407593, 0.5163624286651611, 0.5674800872802734, 0.6185978651046753, 0.6697155237197876, 0.7208332419395447, 0.7719509601593018, 0.8230686783790588, 0.8741863965988159, 0.9253041744232178, 0.9764218330383301, 1.027539610862732, 1.0786573886871338, 1.1297751665115356, 1.180892825126648, 1.2320106029510498, 1.283128261566162, 1.334246039390564, 1.3853636980056763, 1.4364814758300781, 1.4875991344451904, 1.5387169122695923, 1.5898345708847046, 1.6409523487091064, 1.6920700073242188, 1.7431877851486206, 1.794305443763733, 1.8454232215881348, 1.896540880203247]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 8.0, 18.0, 34.0, 94.0, 324.0, 1047.0, 6274.0, 180208.0, 841444.0, 16532.0, 1851.0, 446.0, 151.0, 57.0, 18.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.986328125, -3.854278564453125, -3.72222900390625, -3.590179443359375, -3.4581298828125, -3.326080322265625, -3.19403076171875, -3.061981201171875, -2.929931640625, -2.797882080078125, -2.66583251953125, -2.533782958984375, -2.4017333984375, -2.269683837890625, -2.13763427734375, -2.005584716796875, -1.87353515625, -1.741485595703125, -1.60943603515625, -1.477386474609375, -1.3453369140625, -1.213287353515625, -1.08123779296875, -0.949188232421875, -0.817138671875, -0.685089111328125, -0.55303955078125, -0.420989990234375, -0.2889404296875, -0.156890869140625, -0.02484130859375, 0.107208251953125, 0.2392578125, 0.371307373046875, 0.50335693359375, 0.635406494140625, 0.7674560546875, 0.899505615234375, 1.03155517578125, 1.163604736328125, 1.295654296875, 1.427703857421875, 1.55975341796875, 1.691802978515625, 1.8238525390625, 1.955902099609375, 2.08795166015625, 2.220001220703125, 2.35205078125, 2.484100341796875, 2.61614990234375, 2.748199462890625, 2.8802490234375, 3.012298583984375, 3.14434814453125, 3.276397705078125, 3.408447265625, 3.540496826171875, 3.67254638671875, 3.804595947265625, 3.9366455078125, 4.068695068359375, 4.20074462890625, 4.332794189453125, 4.46484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 12.0, 9.0, 9.0, 10.0, 20.0, 22.0, 23.0, 32.0, 44.0, 59.0, 69.0, 74.0, 83.0, 85.0, 83.0, 77.0, 46.0, 48.0, 31.0, 32.0, 30.0, 26.0, 15.0, 9.0, 11.0, 11.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.974609375, -2.865966796875, -2.75732421875, -2.648681640625, -2.5400390625, -2.431396484375, -2.32275390625, -2.214111328125, -2.10546875, -1.996826171875, -1.88818359375, -1.779541015625, -1.6708984375, -1.562255859375, -1.45361328125, -1.344970703125, -1.236328125, -1.127685546875, -1.01904296875, -0.910400390625, -0.8017578125, -0.693115234375, -0.58447265625, -0.475830078125, -0.3671875, -0.258544921875, -0.14990234375, -0.041259765625, 0.0673828125, 0.176025390625, 0.28466796875, 0.393310546875, 0.501953125, 0.610595703125, 0.71923828125, 0.827880859375, 0.9365234375, 1.045166015625, 1.15380859375, 1.262451171875, 1.37109375, 1.479736328125, 1.58837890625, 1.697021484375, 1.8056640625, 1.914306640625, 2.02294921875, 2.131591796875, 2.240234375, 2.348876953125, 2.45751953125, 2.566162109375, 2.6748046875, 2.783447265625, 2.89208984375, 3.000732421875, 3.109375, 3.218017578125, 3.32666015625, 3.435302734375, 3.5439453125, 3.652587890625, 3.76123046875, 3.869873046875, 3.978515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 2.0, 8.0, 7.0, 9.0, 9.0, 11.0, 11.0, 24.0, 30.0, 43.0, 39.0, 61.0, 65.0, 137.0, 171.0, 301.0, 535.0, 1089.0, 2616.0, 7630.0, 34006.0, 308741.0, 613216.0, 61548.0, 11420.0, 3607.0, 1428.0, 678.0, 377.0, 246.0, 128.0, 93.0, 64.0, 47.0, 37.0, 22.0, 25.0, 13.0, 14.0, 11.0, 7.0, 6.0, 2.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.2297515869140625, -1.186065673828125, -1.1423797607421875, -1.09869384765625, -1.0550079345703125, -1.011322021484375, -0.9676361083984375, -0.9239501953125, -0.8802642822265625, -0.836578369140625, -0.7928924560546875, -0.74920654296875, -0.7055206298828125, -0.661834716796875, -0.6181488037109375, -0.574462890625, -0.5307769775390625, -0.487091064453125, -0.4434051513671875, -0.39971923828125, -0.3560333251953125, -0.312347412109375, -0.2686614990234375, -0.2249755859375, -0.1812896728515625, -0.137603759765625, -0.0939178466796875, -0.05023193359375, -0.0065460205078125, 0.037139892578125, 0.0808258056640625, 0.12451171875, 0.1681976318359375, 0.211883544921875, 0.2555694580078125, 0.29925537109375, 0.3429412841796875, 0.386627197265625, 0.4303131103515625, 0.4739990234375, 0.5176849365234375, 0.561370849609375, 0.6050567626953125, 0.64874267578125, 0.6924285888671875, 0.736114501953125, 0.7798004150390625, 0.823486328125, 0.8671722412109375, 0.910858154296875, 0.9545440673828125, 0.99822998046875, 1.0419158935546875, 1.085601806640625, 1.1292877197265625, 1.1729736328125, 1.2166595458984375, 1.260345458984375, 1.3040313720703125, 1.34771728515625, 1.3914031982421875, 1.435089111328125, 1.4787750244140625, 1.5224609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 9.0, 12.0, 14.0, 18.0, 20.0, 20.0, 28.0, 28.0, 33.0, 37.0, 36.0, 39.0, 43.0, 45.0, 44.0, 47.0, 45.0, 43.0, 51.0, 45.0, 48.0, 34.0, 22.0, 34.0, 29.0, 21.0, 29.0, 25.0, 11.0, 17.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.828277587890625, -2.73077392578125, -2.633270263671875, -2.5357666015625, -2.438262939453125, -2.34075927734375, -2.243255615234375, -2.145751953125, -2.048248291015625, -1.95074462890625, -1.853240966796875, -1.7557373046875, -1.658233642578125, -1.56072998046875, -1.463226318359375, -1.36572265625, -1.268218994140625, -1.17071533203125, -1.073211669921875, -0.9757080078125, -0.878204345703125, -0.78070068359375, -0.683197021484375, -0.585693359375, -0.488189697265625, -0.39068603515625, -0.293182373046875, -0.1956787109375, -0.098175048828125, -0.00067138671875, 0.096832275390625, 0.1943359375, 0.291839599609375, 0.38934326171875, 0.486846923828125, 0.5843505859375, 0.681854248046875, 0.77935791015625, 0.876861572265625, 0.974365234375, 1.071868896484375, 1.16937255859375, 1.266876220703125, 1.3643798828125, 1.461883544921875, 1.55938720703125, 1.656890869140625, 1.75439453125, 1.851898193359375, 1.94940185546875, 2.046905517578125, 2.1444091796875, 2.241912841796875, 2.33941650390625, 2.436920166015625, 2.534423828125, 2.631927490234375, 2.72943115234375, 2.826934814453125, 2.9244384765625, 3.021942138671875, 3.11944580078125, 3.216949462890625, 3.314453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 18.0, 28.0, 41.0, 40.0, 79.0, 131.0, 227.0, 465.0, 904.0, 2287.0, 6541.0, 26951.0, 201568.0, 704455.0, 83035.0, 14767.0, 4037.0, 1496.0, 678.0, 342.0, 168.0, 111.0, 56.0, 34.0, 22.0, 23.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.67626953125, -0.6571121215820312, -0.6379547119140625, -0.6187973022460938, -0.599639892578125, -0.5804824829101562, -0.5613250732421875, -0.5421676635742188, -0.52301025390625, -0.5038528442382812, -0.4846954345703125, -0.46553802490234375, -0.446380615234375, -0.42722320556640625, -0.4080657958984375, -0.38890838623046875, -0.3697509765625, -0.35059356689453125, -0.3314361572265625, -0.31227874755859375, -0.293121337890625, -0.27396392822265625, -0.2548065185546875, -0.23564910888671875, -0.21649169921875, -0.19733428955078125, -0.1781768798828125, -0.15901947021484375, -0.139862060546875, -0.12070465087890625, -0.1015472412109375, -0.08238983154296875, -0.063232421875, -0.04407501220703125, -0.0249176025390625, -0.00576019287109375, 0.013397216796875, 0.03255462646484375, 0.0517120361328125, 0.07086944580078125, 0.09002685546875, 0.10918426513671875, 0.1283416748046875, 0.14749908447265625, 0.166656494140625, 0.18581390380859375, 0.2049713134765625, 0.22412872314453125, 0.2432861328125, 0.26244354248046875, 0.2816009521484375, 0.30075836181640625, 0.319915771484375, 0.33907318115234375, 0.3582305908203125, 0.37738800048828125, 0.39654541015625, 0.41570281982421875, 0.4348602294921875, 0.45401763916015625, 0.473175048828125, 0.49233245849609375, 0.5114898681640625, 0.5306472778320312, 0.5498046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 10.0, 4.0, 8.0, 16.0, 16.0, 16.0, 22.0, 43.0, 61.0, 70.0, 108.0, 185.0, 124.0, 85.0, 56.0, 58.0, 25.0, 25.0, 17.0, 18.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.85860824584961e-05, -9.537674486637115e-05, -9.216740727424622e-05, -8.895806968212128e-05, -8.574873208999634e-05, -8.25393944978714e-05, -7.933005690574646e-05, -7.612071931362152e-05, -7.291138172149658e-05, -6.970204412937164e-05, -6.64927065372467e-05, -6.328336894512177e-05, -6.0074031352996826e-05, -5.686469376087189e-05, -5.365535616874695e-05, -5.044601857662201e-05, -4.723668098449707e-05, -4.402734339237213e-05, -4.081800580024719e-05, -3.7608668208122253e-05, -3.4399330615997314e-05, -3.1189993023872375e-05, -2.7980655431747437e-05, -2.4771317839622498e-05, -2.156198024749756e-05, -1.835264265537262e-05, -1.514330506324768e-05, -1.1933967471122742e-05, -8.724629878997803e-06, -5.515292286872864e-06, -2.305954694747925e-06, 9.033828973770142e-07, 4.112720489501953e-06, 7.322058081626892e-06, 1.0531395673751831e-05, 1.374073326587677e-05, 1.695007085800171e-05, 2.0159408450126648e-05, 2.3368746042251587e-05, 2.6578083634376526e-05, 2.9787421226501465e-05, 3.2996758818626404e-05, 3.620609641075134e-05, 3.941543400287628e-05, 4.262477159500122e-05, 4.583410918712616e-05, 4.90434467792511e-05, 5.225278437137604e-05, 5.5462121963500977e-05, 5.8671459555625916e-05, 6.188079714775085e-05, 6.50901347398758e-05, 6.829947233200073e-05, 7.150880992412567e-05, 7.471814751625061e-05, 7.792748510837555e-05, 8.113682270050049e-05, 8.434616029262543e-05, 8.755549788475037e-05, 9.07648354768753e-05, 9.397417306900024e-05, 9.718351066112518e-05, 0.00010039284825325012, 0.00010360218584537506, 0.0001068115234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 16.0, 24.0, 31.0, 43.0, 65.0, 106.0, 158.0, 271.0, 439.0, 881.0, 2043.0, 4717.0, 14346.0, 57948.0, 451630.0, 436531.0, 56821.0, 13943.0, 4611.0, 1875.0, 866.0, 418.0, 259.0, 159.0, 103.0, 66.0, 40.0, 35.0, 21.0, 12.0, 12.0, 6.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48888397216796875, -0.4714202880859375, -0.45395660400390625, -0.436492919921875, -0.41902923583984375, -0.4015655517578125, -0.38410186767578125, -0.36663818359375, -0.34917449951171875, -0.3317108154296875, -0.31424713134765625, -0.296783447265625, -0.27931976318359375, -0.2618560791015625, -0.24439239501953125, -0.2269287109375, -0.20946502685546875, -0.1920013427734375, -0.17453765869140625, -0.157073974609375, -0.13961029052734375, -0.1221466064453125, -0.10468292236328125, -0.08721923828125, -0.06975555419921875, -0.0522918701171875, -0.03482818603515625, -0.017364501953125, 9.918212890625e-05, 0.0175628662109375, 0.03502655029296875, 0.052490234375, 0.06995391845703125, 0.0874176025390625, 0.10488128662109375, 0.122344970703125, 0.13980865478515625, 0.1572723388671875, 0.17473602294921875, 0.19219970703125, 0.20966339111328125, 0.2271270751953125, 0.24459075927734375, 0.262054443359375, 0.27951812744140625, 0.2969818115234375, 0.31444549560546875, 0.3319091796875, 0.34937286376953125, 0.3668365478515625, 0.38430023193359375, 0.401763916015625, 0.41922760009765625, 0.4366912841796875, 0.45415496826171875, 0.47161865234375, 0.48908233642578125, 0.5065460205078125, 0.5240097045898438, 0.541473388671875, 0.5589370727539062, 0.5764007568359375, 0.5938644409179688, 0.611328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 8.0, 13.0, 17.0, 21.0, 28.0, 30.0, 46.0, 50.0, 70.0, 105.0, 125.0, 125.0, 78.0, 53.0, 50.0, 40.0, 27.0, 26.0, 18.0, 10.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3117523193359375, -0.302459716796875, -0.2931671142578125, -0.28387451171875, -0.2745819091796875, -0.265289306640625, -0.2559967041015625, -0.2467041015625, -0.2374114990234375, -0.228118896484375, -0.2188262939453125, -0.20953369140625, -0.2002410888671875, -0.190948486328125, -0.1816558837890625, -0.17236328125, -0.1630706787109375, -0.153778076171875, -0.1444854736328125, -0.13519287109375, -0.1259002685546875, -0.116607666015625, -0.1073150634765625, -0.0980224609375, -0.0887298583984375, -0.079437255859375, -0.0701446533203125, -0.06085205078125, -0.0515594482421875, -0.042266845703125, -0.0329742431640625, -0.023681640625, -0.0143890380859375, -0.005096435546875, 0.0041961669921875, 0.01348876953125, 0.0227813720703125, 0.032073974609375, 0.0413665771484375, 0.0506591796875, 0.0599517822265625, 0.069244384765625, 0.0785369873046875, 0.08782958984375, 0.0971221923828125, 0.106414794921875, 0.1157073974609375, 0.125, 0.1342926025390625, 0.143585205078125, 0.1528778076171875, 0.16217041015625, 0.1714630126953125, 0.180755615234375, 0.1900482177734375, 0.1993408203125, 0.2086334228515625, 0.217926025390625, 0.2272186279296875, 0.23651123046875, 0.2458038330078125, 0.255096435546875, 0.2643890380859375, 0.273681640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 14.0, 29.0, 120.0, 440.0, 288.0, 67.0, 22.0, 9.0, 11.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.458877563476562, -21.000242233276367, -20.541606903076172, -20.08297348022461, -19.624338150024414, -19.16570281982422, -18.707067489624023, -18.248432159423828, -17.789796829223633, -17.331161499023438, -16.872526168823242, -16.413890838623047, -15.955256462097168, -15.496622085571289, -15.037986755371094, -14.579351425170898, -14.12071704864502, -13.662081718444824, -13.203447341918945, -12.74481201171875, -12.286176681518555, -11.82754135131836, -11.36890697479248, -10.910271644592285, -10.451637268066406, -9.993001937866211, -9.534367561340332, -9.075732231140137, -8.617096900939941, -8.158462524414062, -7.699827194213867, -7.241191864013672, -6.782557010650635, -6.323922157287598, -5.865286827087402, -5.406651973724365, -4.948017120361328, -4.489381790161133, -4.030746936798096, -3.5721118450164795, -3.1134767532348633, -2.654841661453247, -2.196206569671631, -1.7375717163085938, -1.2789366245269775, -0.8203015327453613, -0.3616666793823242, 0.09696841239929199, 0.5556035041809082, 1.0142385959625244, 1.472873568534851, 1.9315085411071777, 2.390143632888794, 2.84877872467041, 3.3074135780334473, 3.7660486698150635, 4.22468376159668, 4.683318614959717, 5.141953945159912, 5.600588798522949, 6.0592241287231445, 6.517858982086182, 6.976493835449219, 7.435129165649414, 7.893764019012451]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 10.0, 12.0, 14.0, 16.0, 22.0, 28.0, 25.0, 40.0, 41.0, 45.0, 42.0, 46.0, 41.0, 52.0, 51.0, 53.0, 65.0, 45.0, 46.0, 45.0, 39.0, 28.0, 27.0, 21.0, 29.0, 19.0, 13.0, 23.0, 11.0, 10.0, 6.0, 12.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.503831386566162, -6.293907165527344, -6.083983421325684, -5.874059200286865, -5.664135456085205, -5.454211235046387, -5.244287490844727, -5.034363269805908, -4.824439525604248, -4.61451530456543, -4.4045915603637695, -4.194667339324951, -3.984743595123291, -3.7748193740844727, -3.5648956298828125, -3.354971408843994, -3.145047426223755, -2.9351234436035156, -2.7251994609832764, -2.515275478363037, -2.305351495742798, -2.0954275131225586, -1.8855034112930298, -1.6755794286727905, -1.4656554460525513, -1.255731463432312, -1.0458074808120728, -0.8358834385871887, -0.6259594559669495, -0.41603541374206543, -0.20611143112182617, 0.003812551498413086, 0.21373653411865234, 0.4236605167388916, 0.6335844993591309, 0.8435085415840149, 1.0534324645996094, 1.2633565664291382, 1.4732805490493774, 1.6832045316696167, 1.893128514289856, 2.1030526161193848, 2.312976598739624, 2.5229005813598633, 2.7328245639801025, 2.942748546600342, 3.152672529220581, 3.3625965118408203, 3.5725204944610596, 3.782444477081299, 3.992368459701538, 4.202292442321777, 4.412216663360596, 4.622140407562256, 4.832064628601074, 5.041988372802734, 5.251912593841553, 5.461836814880371, 5.671760559082031, 5.88168478012085, 6.09160852432251, 6.301532745361328, 6.511456489562988, 6.721380710601807, 6.931304454803467]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 11.0, 10.0, 13.0, 29.0, 44.0, 73.0, 90.0, 162.0, 224.0, 452.0, 822.0, 1627.0, 3331.0, 8360.0, 25694.0, 124619.0, 2858370.0, 1060458.0, 78824.0, 18749.0, 6468.0, 2751.0, 1327.0, 696.0, 398.0, 213.0, 175.0, 90.0, 61.0, 52.0, 30.0, 18.0, 13.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9084930419921875, -1.837493896484375, -1.7664947509765625, -1.69549560546875, -1.6244964599609375, -1.553497314453125, -1.4824981689453125, -1.4114990234375, -1.3404998779296875, -1.269500732421875, -1.1985015869140625, -1.12750244140625, -1.0565032958984375, -0.985504150390625, -0.9145050048828125, -0.843505859375, -0.7725067138671875, -0.701507568359375, -0.6305084228515625, -0.55950927734375, -0.4885101318359375, -0.417510986328125, -0.3465118408203125, -0.2755126953125, -0.2045135498046875, -0.133514404296875, -0.0625152587890625, 0.00848388671875, 0.0794830322265625, 0.150482177734375, 0.2214813232421875, 0.29248046875, 0.3634796142578125, 0.434478759765625, 0.5054779052734375, 0.57647705078125, 0.6474761962890625, 0.718475341796875, 0.7894744873046875, 0.8604736328125, 0.9314727783203125, 1.002471923828125, 1.0734710693359375, 1.14447021484375, 1.2154693603515625, 1.286468505859375, 1.3574676513671875, 1.428466796875, 1.4994659423828125, 1.570465087890625, 1.6414642333984375, 1.71246337890625, 1.7834625244140625, 1.854461669921875, 1.9254608154296875, 1.9964599609375, 2.0674591064453125, 2.138458251953125, 2.2094573974609375, 2.28045654296875, 2.3514556884765625, 2.422454833984375, 2.4934539794921875, 2.564453125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 9.0, 4.0, 9.0, 5.0, 13.0, 19.0, 24.0, 37.0, 36.0, 64.0, 78.0, 79.0, 91.0, 85.0, 92.0, 62.0, 65.0, 49.0, 42.0, 34.0, 28.0, 19.0, 10.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.593963623046875, -1.53363037109375, -1.473297119140625, -1.4129638671875, -1.352630615234375, -1.29229736328125, -1.231964111328125, -1.171630859375, -1.111297607421875, -1.05096435546875, -0.990631103515625, -0.9302978515625, -0.869964599609375, -0.80963134765625, -0.749298095703125, -0.68896484375, -0.628631591796875, -0.56829833984375, -0.507965087890625, -0.4476318359375, -0.387298583984375, -0.32696533203125, -0.266632080078125, -0.206298828125, -0.145965576171875, -0.08563232421875, -0.025299072265625, 0.0350341796875, 0.095367431640625, 0.15570068359375, 0.216033935546875, 0.2763671875, 0.336700439453125, 0.39703369140625, 0.457366943359375, 0.5177001953125, 0.578033447265625, 0.63836669921875, 0.698699951171875, 0.759033203125, 0.819366455078125, 0.87969970703125, 0.940032958984375, 1.0003662109375, 1.060699462890625, 1.12103271484375, 1.181365966796875, 1.24169921875, 1.302032470703125, 1.36236572265625, 1.422698974609375, 1.4830322265625, 1.543365478515625, 1.60369873046875, 1.664031982421875, 1.724365234375, 1.784698486328125, 1.84503173828125, 1.905364990234375, 1.9656982421875, 2.026031494140625, 2.08636474609375, 2.146697998046875, 2.20703125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 19.0, 21.0, 27.0, 37.0, 65.0, 85.0, 208.0, 368.0, 819.0, 1960.0, 6276.0, 31812.0, 545448.0, 3519654.0, 71579.0, 10749.0, 2983.0, 1077.0, 467.0, 238.0, 135.0, 89.0, 49.0, 20.0, 23.0, 17.0, 14.0, 11.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.187164306640625, -3.09112548828125, -2.995086669921875, -2.8990478515625, -2.803009033203125, -2.70697021484375, -2.610931396484375, -2.514892578125, -2.418853759765625, -2.32281494140625, -2.226776123046875, -2.1307373046875, -2.034698486328125, -1.93865966796875, -1.842620849609375, -1.74658203125, -1.650543212890625, -1.55450439453125, -1.458465576171875, -1.3624267578125, -1.266387939453125, -1.17034912109375, -1.074310302734375, -0.978271484375, -0.882232666015625, -0.78619384765625, -0.690155029296875, -0.5941162109375, -0.498077392578125, -0.40203857421875, -0.305999755859375, -0.2099609375, -0.113922119140625, -0.01788330078125, 0.078155517578125, 0.1741943359375, 0.270233154296875, 0.36627197265625, 0.462310791015625, 0.558349609375, 0.654388427734375, 0.75042724609375, 0.846466064453125, 0.9425048828125, 1.038543701171875, 1.13458251953125, 1.230621337890625, 1.32666015625, 1.422698974609375, 1.51873779296875, 1.614776611328125, 1.7108154296875, 1.806854248046875, 1.90289306640625, 1.998931884765625, 2.094970703125, 2.191009521484375, 2.28704833984375, 2.383087158203125, 2.4791259765625, 2.575164794921875, 2.67120361328125, 2.767242431640625, 2.86328125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 7.0, 14.0, 18.0, 36.0, 50.0, 60.0, 88.0, 148.0, 240.0, 557.0, 1312.0, 723.0, 319.0, 167.0, 89.0, 82.0, 52.0, 35.0, 22.0, 12.0, 7.0, 9.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6572799682617188, -0.6358489990234375, -0.6144180297851562, -0.592987060546875, -0.5715560913085938, -0.5501251220703125, -0.5286941528320312, -0.50726318359375, -0.48583221435546875, -0.4644012451171875, -0.44297027587890625, -0.421539306640625, -0.40010833740234375, -0.3786773681640625, -0.35724639892578125, -0.3358154296875, -0.31438446044921875, -0.2929534912109375, -0.27152252197265625, -0.250091552734375, -0.22866058349609375, -0.2072296142578125, -0.18579864501953125, -0.16436767578125, -0.14293670654296875, -0.1215057373046875, -0.10007476806640625, -0.078643798828125, -0.05721282958984375, -0.0357818603515625, -0.01435089111328125, 0.007080078125, 0.02851104736328125, 0.0499420166015625, 0.07137298583984375, 0.092803955078125, 0.11423492431640625, 0.1356658935546875, 0.15709686279296875, 0.17852783203125, 0.19995880126953125, 0.2213897705078125, 0.24282073974609375, 0.264251708984375, 0.28568267822265625, 0.3071136474609375, 0.32854461669921875, 0.3499755859375, 0.37140655517578125, 0.3928375244140625, 0.41426849365234375, 0.435699462890625, 0.45713043212890625, 0.4785614013671875, 0.49999237060546875, 0.52142333984375, 0.5428543090820312, 0.5642852783203125, 0.5857162475585938, 0.607147216796875, 0.6285781860351562, 0.6500091552734375, 0.6714401245117188, 0.69287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 8.0, 20.0, 39.0, 82.0, 157.0, 222.0, 194.0, 128.0, 52.0, 22.0, 19.0, 9.0, 16.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.906493186950684, -5.765346050262451, -5.624198913574219, -5.483051300048828, -5.341904163360596, -5.200757026672363, -5.059609889984131, -4.918462753295898, -4.777315139770508, -4.636168003082275, -4.495020866394043, -4.353873252868652, -4.21272611618042, -4.0715789794921875, -3.930431842803955, -3.7892847061157227, -3.6481375694274902, -3.506990432739258, -3.3658430576324463, -3.224695920944214, -3.0835485458374023, -2.94240140914917, -2.8012542724609375, -2.660107135772705, -2.5189597606658936, -2.377812623977661, -2.2366652488708496, -2.095518112182617, -1.9543708562850952, -1.8132236003875732, -1.6720764636993408, -1.5309292078018188, -1.3897817134857178, -1.2486344575881958, -1.1074872016906738, -0.9663400650024414, -0.8251928091049194, -0.6840455532073975, -0.5428983569145203, -0.40175116062164307, -0.2606039047241211, -0.11945667862892151, 0.021690547466278076, 0.16283777356147766, 0.30398499965667725, 0.4451322555541992, 0.5862794518470764, 0.7274266481399536, 0.8685739040374756, 1.0097211599349976, 1.1508684158325195, 1.292015552520752, 1.433162808418274, 1.574310064315796, 1.7154572010040283, 1.8566044569015503, 1.9977517127990723, 2.1388988494873047, 2.280046224594116, 2.4211933612823486, 2.56234073638916, 2.7034878730773926, 2.844635009765625, 2.9857821464538574, 3.126929521560669]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 6.0, 11.0, 11.0, 14.0, 16.0, 28.0, 31.0, 41.0, 25.0, 55.0, 47.0, 56.0, 72.0, 71.0, 61.0, 66.0, 65.0, 60.0, 37.0, 36.0, 36.0, 34.0, 26.0, 20.0, 10.0, 9.0, 7.0, 14.0, 9.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5737828016281128, -1.5160099267959595, -1.4582370519638062, -1.4004642963409424, -1.342691421508789, -1.2849185466766357, -1.2271456718444824, -1.169372797012329, -1.1115999221801758, -1.0538270473480225, -0.9960542321205139, -0.9382813572883606, -0.880508542060852, -0.8227356672286987, -0.7649627923965454, -0.7071899175643921, -0.6494171619415283, -0.591644287109375, -0.5338714718818665, -0.47609859704971313, -0.4183257520198822, -0.36055290699005127, -0.30278003215789795, -0.24500718712806702, -0.18723434209823608, -0.12946149706840515, -0.07168863713741302, -0.013915777206420898, 0.043857067823410034, 0.10162991285324097, 0.1594027876853943, 0.21717563271522522, 0.2749483585357666, 0.33272120356559753, 0.39049404859542847, 0.4482669234275818, 0.5060397386550903, 0.5638126134872437, 0.621585488319397, 0.6793583631515503, 0.7371311783790588, 0.7949040532112122, 0.8526768684387207, 0.910449743270874, 0.9682226181030273, 1.0259954929351807, 1.083768367767334, 1.1415411233901978, 1.199313998222351, 1.2570868730545044, 1.3148597478866577, 1.3726325035095215, 1.4304053783416748, 1.4881782531738281, 1.5459511280059814, 1.6037240028381348, 1.661496877670288, 1.7192697525024414, 1.7770426273345947, 1.834815502166748, 1.8925882577896118, 1.9503611326217651, 2.008133888244629, 2.0659067630767822, 2.1236796379089355]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 9.0, 8.0, 9.0, 17.0, 31.0, 40.0, 60.0, 83.0, 141.0, 273.0, 549.0, 1084.0, 2783.0, 8830.0, 39571.0, 414183.0, 518576.0, 46940.0, 9861.0, 3021.0, 1186.0, 560.0, 301.0, 157.0, 94.0, 65.0, 40.0, 21.0, 20.0, 12.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.2312450408935547, -0.22445297241210938, -0.21766090393066406, -0.21086883544921875, -0.20407676696777344, -0.19728469848632812, -0.1904926300048828, -0.1837005615234375, -0.1769084930419922, -0.17011642456054688, -0.16332435607910156, -0.15653228759765625, -0.14974021911621094, -0.14294815063476562, -0.1361560821533203, -0.129364013671875, -0.12257194519042969, -0.11577987670898438, -0.10898780822753906, -0.10219573974609375, -0.09540367126464844, -0.08861160278320312, -0.08181953430175781, -0.0750274658203125, -0.06823539733886719, -0.061443328857421875, -0.05465126037597656, -0.04785919189453125, -0.04106712341308594, -0.034275054931640625, -0.027482986450195312, -0.02069091796875, -0.013898849487304688, -0.007106781005859375, -0.0003147125244140625, 0.00647735595703125, 0.013269424438476562, 0.020061492919921875, 0.026853561401367188, 0.0336456298828125, 0.04043769836425781, 0.047229766845703125, 0.05402183532714844, 0.06081390380859375, 0.06760597229003906, 0.07439804077148438, 0.08119010925292969, 0.087982177734375, 0.09477424621582031, 0.10156631469726562, 0.10835838317871094, 0.11515045166015625, 0.12194252014160156, 0.12873458862304688, 0.1355266571044922, 0.1423187255859375, 0.1491107940673828, 0.15590286254882812, 0.16269493103027344, 0.16948699951171875, 0.17627906799316406, 0.18307113647460938, 0.1898632049560547, 0.1966552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 5.0, 9.0, 4.0, 8.0, 7.0, 16.0, 17.0, 21.0, 28.0, 57.0, 60.0, 72.0, 75.0, 84.0, 89.0, 89.0, 74.0, 62.0, 49.0, 49.0, 35.0, 18.0, 14.0, 15.0, 15.0, 8.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4140625, -1.3656158447265625, -1.317169189453125, -1.2687225341796875, -1.22027587890625, -1.1718292236328125, -1.123382568359375, -1.0749359130859375, -1.0264892578125, -0.9780426025390625, -0.929595947265625, -0.8811492919921875, -0.83270263671875, -0.7842559814453125, -0.735809326171875, -0.6873626708984375, -0.638916015625, -0.5904693603515625, -0.542022705078125, -0.4935760498046875, -0.44512939453125, -0.3966827392578125, -0.348236083984375, -0.2997894287109375, -0.2513427734375, -0.2028961181640625, -0.154449462890625, -0.1060028076171875, -0.05755615234375, -0.0091094970703125, 0.039337158203125, 0.0877838134765625, 0.13623046875, 0.1846771240234375, 0.233123779296875, 0.2815704345703125, 0.33001708984375, 0.3784637451171875, 0.426910400390625, 0.4753570556640625, 0.5238037109375, 0.5722503662109375, 0.620697021484375, 0.6691436767578125, 0.71759033203125, 0.7660369873046875, 0.814483642578125, 0.8629302978515625, 0.911376953125, 0.9598236083984375, 1.008270263671875, 1.0567169189453125, 1.10516357421875, 1.1536102294921875, 1.202056884765625, 1.2505035400390625, 1.2989501953125, 1.3473968505859375, 1.395843505859375, 1.4442901611328125, 1.49273681640625, 1.5411834716796875, 1.589630126953125, 1.6380767822265625, 1.6865234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 9.0, 13.0, 5.0, 15.0, 14.0, 16.0, 20.0, 33.0, 48.0, 51.0, 61.0, 85.0, 112.0, 149.0, 221.0, 330.0, 597.0, 1674.0, 7520.0, 62003.0, 665243.0, 282469.0, 22150.0, 3363.0, 932.0, 373.0, 244.0, 179.0, 137.0, 113.0, 76.0, 69.0, 54.0, 36.0, 28.0, 29.0, 20.0, 12.0, 7.0, 8.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.181884765625, -0.1761646270751953, -0.17044448852539062, -0.16472434997558594, -0.15900421142578125, -0.15328407287597656, -0.14756393432617188, -0.1418437957763672, -0.1361236572265625, -0.1304035186767578, -0.12468338012695312, -0.11896324157714844, -0.11324310302734375, -0.10752296447753906, -0.10180282592773438, -0.09608268737792969, -0.090362548828125, -0.08464241027832031, -0.07892227172851562, -0.07320213317871094, -0.06748199462890625, -0.06176185607910156, -0.056041717529296875, -0.05032157897949219, -0.0446014404296875, -0.03888130187988281, -0.033161163330078125, -0.027441024780273438, -0.02172088623046875, -0.016000747680664062, -0.010280609130859375, -0.0045604705810546875, 0.00115966796875, 0.0068798065185546875, 0.012599945068359375, 0.018320083618164062, 0.02404022216796875, 0.029760360717773438, 0.035480499267578125, 0.04120063781738281, 0.0469207763671875, 0.05264091491699219, 0.058361053466796875, 0.06408119201660156, 0.06980133056640625, 0.07552146911621094, 0.08124160766601562, 0.08696174621582031, 0.092681884765625, 0.09840202331542969, 0.10412216186523438, 0.10984230041503906, 0.11556243896484375, 0.12128257751464844, 0.12700271606445312, 0.1327228546142578, 0.1384429931640625, 0.1441631317138672, 0.14988327026367188, 0.15560340881347656, 0.16132354736328125, 0.16704368591308594, 0.17276382446289062, 0.1784839630126953, 0.1842041015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 7.0, 10.0, 12.0, 26.0, 25.0, 21.0, 35.0, 26.0, 35.0, 32.0, 55.0, 48.0, 66.0, 60.0, 52.0, 58.0, 53.0, 48.0, 50.0, 35.0, 28.0, 36.0, 39.0, 25.0, 21.0, 16.0, 14.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.0447998046875, -1.978271484375, -1.9117431640625, -1.84521484375, -1.7786865234375, -1.712158203125, -1.6456298828125, -1.5791015625, -1.5125732421875, -1.446044921875, -1.3795166015625, -1.31298828125, -1.2464599609375, -1.179931640625, -1.1134033203125, -1.046875, -0.9803466796875, -0.913818359375, -0.8472900390625, -0.78076171875, -0.7142333984375, -0.647705078125, -0.5811767578125, -0.5146484375, -0.4481201171875, -0.381591796875, -0.3150634765625, -0.24853515625, -0.1820068359375, -0.115478515625, -0.0489501953125, 0.017578125, 0.0841064453125, 0.150634765625, 0.2171630859375, 0.28369140625, 0.3502197265625, 0.416748046875, 0.4832763671875, 0.5498046875, 0.6163330078125, 0.682861328125, 0.7493896484375, 0.81591796875, 0.8824462890625, 0.948974609375, 1.0155029296875, 1.08203125, 1.1485595703125, 1.215087890625, 1.2816162109375, 1.34814453125, 1.4146728515625, 1.481201171875, 1.5477294921875, 1.6142578125, 1.6807861328125, 1.747314453125, 1.8138427734375, 1.88037109375, 1.9468994140625, 2.013427734375, 2.0799560546875, 2.146484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 13.0, 10.0, 20.0, 31.0, 43.0, 56.0, 114.0, 141.0, 277.0, 673.0, 3034.0, 64465.0, 969343.0, 7981.0, 1325.0, 419.0, 192.0, 106.0, 77.0, 61.0, 38.0, 18.0, 13.0, 12.0, 8.0, 8.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06475830078125, -0.06297063827514648, -0.06118297576904297, -0.05939531326293945, -0.05760765075683594, -0.05581998825073242, -0.054032325744628906, -0.05224466323852539, -0.050457000732421875, -0.04866933822631836, -0.046881675720214844, -0.04509401321411133, -0.04330635070800781, -0.0415186882019043, -0.03973102569580078, -0.037943363189697266, -0.03615570068359375, -0.034368038177490234, -0.03258037567138672, -0.030792713165283203, -0.029005050659179688, -0.027217388153076172, -0.025429725646972656, -0.02364206314086914, -0.021854400634765625, -0.02006673812866211, -0.018279075622558594, -0.016491413116455078, -0.014703750610351562, -0.012916088104248047, -0.011128425598144531, -0.009340763092041016, -0.0075531005859375, -0.005765438079833984, -0.003977775573730469, -0.002190113067626953, -0.0004024505615234375, 0.0013852119445800781, 0.0031728744506835938, 0.004960536956787109, 0.006748199462890625, 0.00853586196899414, 0.010323524475097656, 0.012111186981201172, 0.013898849487304688, 0.015686511993408203, 0.01747417449951172, 0.019261837005615234, 0.02104949951171875, 0.022837162017822266, 0.02462482452392578, 0.026412487030029297, 0.028200149536132812, 0.029987812042236328, 0.031775474548339844, 0.03356313705444336, 0.035350799560546875, 0.03713846206665039, 0.038926124572753906, 0.04071378707885742, 0.04250144958496094, 0.04428911209106445, 0.04607677459716797, 0.047864437103271484, 0.049652099609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 7.0, 9.0, 6.0, 16.0, 18.0, 34.0, 35.0, 58.0, 91.0, 105.0, 147.0, 143.0, 96.0, 80.0, 41.0, 31.0, 19.0, 12.0, 10.0, 7.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.1457672119140625e-05, -2.0944513380527496e-05, -2.0431354641914368e-05, -1.991819590330124e-05, -1.940503716468811e-05, -1.889187842607498e-05, -1.8378719687461853e-05, -1.7865560948848724e-05, -1.7352402210235596e-05, -1.6839243471622467e-05, -1.632608473300934e-05, -1.581292599439621e-05, -1.529976725578308e-05, -1.4786608517169952e-05, -1.4273449778556824e-05, -1.3760291039943695e-05, -1.3247132301330566e-05, -1.2733973562717438e-05, -1.2220814824104309e-05, -1.170765608549118e-05, -1.1194497346878052e-05, -1.0681338608264923e-05, -1.0168179869651794e-05, -9.655021131038666e-06, -9.141862392425537e-06, -8.628703653812408e-06, -8.11554491519928e-06, -7.602386176586151e-06, -7.0892274379730225e-06, -6.576068699359894e-06, -6.062909960746765e-06, -5.5497512221336365e-06, -5.036592483520508e-06, -4.523433744907379e-06, -4.0102750062942505e-06, -3.497116267681122e-06, -2.983957529067993e-06, -2.4707987904548645e-06, -1.957640051841736e-06, -1.4444813132286072e-06, -9.313225746154785e-07, -4.1816383600234985e-07, 9.499490261077881e-08, 6.081536412239075e-07, 1.1213123798370361e-06, 1.6344711184501648e-06, 2.1476298570632935e-06, 2.660788595676422e-06, 3.1739473342895508e-06, 3.6871060729026794e-06, 4.200264811515808e-06, 4.713423550128937e-06, 5.2265822887420654e-06, 5.739741027355194e-06, 6.252899765968323e-06, 6.766058504581451e-06, 7.27921724319458e-06, 7.792375981807709e-06, 8.305534720420837e-06, 8.818693459033966e-06, 9.331852197647095e-06, 9.845010936260223e-06, 1.0358169674873352e-05, 1.087132841348648e-05, 1.138448715209961e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 0.0, 3.0, 4.0, 4.0, 12.0, 14.0, 24.0, 25.0, 32.0, 42.0, 76.0, 114.0, 154.0, 260.0, 427.0, 731.0, 1400.0, 2876.0, 7760.0, 30621.0, 591459.0, 372794.0, 26651.0, 7158.0, 2825.0, 1336.0, 669.0, 399.0, 217.0, 154.0, 95.0, 65.0, 44.0, 29.0, 16.0, 12.0, 16.0, 9.0, 10.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042816162109375, -0.04147624969482422, -0.04013633728027344, -0.038796424865722656, -0.037456512451171875, -0.036116600036621094, -0.03477668762207031, -0.03343677520751953, -0.03209686279296875, -0.03075695037841797, -0.029417037963867188, -0.028077125549316406, -0.026737213134765625, -0.025397300720214844, -0.024057388305664062, -0.02271747589111328, -0.0213775634765625, -0.02003765106201172, -0.018697738647460938, -0.017357826232910156, -0.016017913818359375, -0.014678001403808594, -0.013338088989257812, -0.011998176574707031, -0.01065826416015625, -0.009318351745605469, -0.007978439331054688, -0.006638526916503906, -0.005298614501953125, -0.003958702087402344, -0.0026187896728515625, -0.0012788772583007812, 6.103515625e-05, 0.0014009475708007812, 0.0027408599853515625, 0.004080772399902344, 0.005420684814453125, 0.006760597229003906, 0.008100509643554688, 0.009440422058105469, 0.01078033447265625, 0.012120246887207031, 0.013460159301757812, 0.014800071716308594, 0.016139984130859375, 0.017479896545410156, 0.018819808959960938, 0.02015972137451172, 0.0214996337890625, 0.02283954620361328, 0.024179458618164062, 0.025519371032714844, 0.026859283447265625, 0.028199195861816406, 0.029539108276367188, 0.03087902069091797, 0.03221893310546875, 0.03355884552001953, 0.03489875793457031, 0.036238670349121094, 0.037578582763671875, 0.038918495178222656, 0.04025840759277344, 0.04159832000732422, 0.042938232421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 13.0, 14.0, 42.0, 51.0, 89.0, 203.0, 285.0, 79.0, 41.0, 37.0, 28.0, 22.0, 17.0, 6.0, 8.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01181793212890625, -0.011461019515991211, -0.011104106903076172, -0.010747194290161133, -0.010390281677246094, -0.010033369064331055, -0.009676456451416016, -0.009319543838500977, -0.008962631225585938, -0.008605718612670898, -0.00824880599975586, -0.00789189338684082, -0.007534980773925781, -0.007178068161010742, -0.006821155548095703, -0.006464242935180664, -0.006107330322265625, -0.005750417709350586, -0.005393505096435547, -0.005036592483520508, -0.004679679870605469, -0.00432276725769043, -0.003965854644775391, -0.0036089420318603516, -0.0032520294189453125, -0.0028951168060302734, -0.0025382041931152344, -0.0021812915802001953, -0.0018243789672851562, -0.0014674663543701172, -0.0011105537414550781, -0.0007536411285400391, -0.000396728515625, -3.981590270996094e-05, 0.0003170967102050781, 0.0006740093231201172, 0.0010309219360351562, 0.0013878345489501953, 0.0017447471618652344, 0.0021016597747802734, 0.0024585723876953125, 0.0028154850006103516, 0.0031723976135253906, 0.0035293102264404297, 0.0038862228393554688, 0.004243135452270508, 0.004600048065185547, 0.004956960678100586, 0.005313873291015625, 0.005670785903930664, 0.006027698516845703, 0.006384611129760742, 0.006741523742675781, 0.00709843635559082, 0.007455348968505859, 0.0078122615814208984, 0.008169174194335938, 0.008526086807250977, 0.008882999420166016, 0.009239912033081055, 0.009596824645996094, 0.009953737258911133, 0.010310649871826172, 0.010667562484741211, 0.01102447509765625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 26.0, 39.0, 110.0, 270.0, 283.0, 144.0, 45.0, 21.0, 14.0, 11.0, 13.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.824275493621826, -4.7041215896606445, -4.583967685699463, -4.463813781738281, -4.343660354614258, -4.223506450653076, -4.1033525466918945, -3.983198642730713, -3.8630449771881104, -3.7428910732269287, -3.622737407684326, -3.5025835037231445, -3.382429599761963, -3.2622759342193604, -3.1421220302581787, -3.021968364715576, -2.9018144607543945, -2.781660556793213, -2.6615068912506104, -2.5413529872894287, -2.421199083328247, -2.3010454177856445, -2.180891513824463, -2.0607376098632812, -1.9405837059020996, -1.8204299211502075, -1.7002760171890259, -1.5801222324371338, -1.4599684476852417, -1.3398146629333496, -1.219660758972168, -1.0995069742202759, -0.9793531894683838, -0.8591993451118469, -0.7390455603599548, -0.618891716003418, -0.4987379014492035, -0.378584086894989, -0.25843024253845215, -0.13827645778656006, -0.018122613430023193, 0.10203120857477188, 0.22218503057956696, 0.3423388600349426, 0.4624926745891571, 0.5826464891433716, 0.7028003334999084, 0.8229541182518005, 0.9431079626083374, 1.0632617473602295, 1.1834156513214111, 1.3035694360733032, 1.4237232208251953, 1.543877124786377, 1.664030909538269, 1.7841846942901611, 1.9043385982513428, 2.0244925022125244, 2.144646167755127, 2.2648000717163086, 2.3849539756774902, 2.5051076412200928, 2.6252615451812744, 2.745415210723877, 2.8655691146850586]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 5.0, 11.0, 7.0, 11.0, 16.0, 19.0, 29.0, 34.0, 51.0, 63.0, 58.0, 96.0, 96.0, 83.0, 86.0, 88.0, 43.0, 51.0, 41.0, 26.0, 20.0, 15.0, 10.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3058565855026245, -1.257638931274414, -1.2094212770462036, -1.1612036228179932, -1.1129859685897827, -1.0647683143615723, -1.0165506601333618, -0.9683330059051514, -0.9201153516769409, -0.8718976974487305, -0.82368004322052, -0.7754623889923096, -0.7272447347640991, -0.6790270805358887, -0.6308094263076782, -0.5825917720794678, -0.5343741774559021, -0.48615652322769165, -0.4379388689994812, -0.38972121477127075, -0.3415035605430603, -0.29328590631484985, -0.2450682818889618, -0.19685062766075134, -0.1486329734325409, -0.10041531920433044, -0.05219767242670059, -0.00398002564907074, 0.04423762857913971, 0.09245528280735016, 0.14067292213439941, 0.18889057636260986, 0.2371082305908203, 0.28532588481903076, 0.3335435390472412, 0.38176119327545166, 0.4299788475036621, 0.47819650173187256, 0.526414155960083, 0.5746318101882935, 0.6228494644165039, 0.6710671186447144, 0.7192847728729248, 0.7675024271011353, 0.8157200813293457, 0.8639377355575562, 0.9121553897857666, 0.960373044013977, 1.0085906982421875, 1.056808352470398, 1.1050260066986084, 1.1532436609268188, 1.2014613151550293, 1.2496789693832397, 1.2978966236114502, 1.3461142778396606, 1.3943318128585815, 1.442549467086792, 1.4907671213150024, 1.538984775543213, 1.5872024297714233, 1.6354200839996338, 1.6836377382278442, 1.7318553924560547, 1.7800730466842651]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 16.0, 24.0, 39.0, 69.0, 106.0, 188.0, 318.0, 599.0, 1199.0, 2651.0, 6377.0, 17603.0, 61695.0, 296721.0, 510820.0, 105893.0, 27850.0, 9357.0, 3714.0, 1607.0, 724.0, 366.0, 220.0, 132.0, 83.0, 62.0, 26.0, 22.0, 16.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.0084228515625, -0.973876953125, -0.9393310546875, -0.90478515625, -0.8702392578125, -0.835693359375, -0.8011474609375, -0.7666015625, -0.7320556640625, -0.697509765625, -0.6629638671875, -0.62841796875, -0.5938720703125, -0.559326171875, -0.5247802734375, -0.490234375, -0.4556884765625, -0.421142578125, -0.3865966796875, -0.35205078125, -0.3175048828125, -0.282958984375, -0.2484130859375, -0.2138671875, -0.1793212890625, -0.144775390625, -0.1102294921875, -0.07568359375, -0.0411376953125, -0.006591796875, 0.0279541015625, 0.0625, 0.0970458984375, 0.131591796875, 0.1661376953125, 0.20068359375, 0.2352294921875, 0.269775390625, 0.3043212890625, 0.3388671875, 0.3734130859375, 0.407958984375, 0.4425048828125, 0.47705078125, 0.5115966796875, 0.546142578125, 0.5806884765625, 0.615234375, 0.6497802734375, 0.684326171875, 0.7188720703125, 0.75341796875, 0.7879638671875, 0.822509765625, 0.8570556640625, 0.8916015625, 0.9261474609375, 0.960693359375, 0.9952392578125, 1.02978515625, 1.0643310546875, 1.098876953125, 1.1334228515625, 1.16796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 12.0, 13.0, 18.0, 21.0, 28.0, 36.0, 59.0, 63.0, 64.0, 85.0, 89.0, 90.0, 86.0, 75.0, 56.0, 46.0, 37.0, 23.0, 23.0, 11.0, 13.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.625, -3.5108642578125, -3.396728515625, -3.2825927734375, -3.16845703125, -3.0543212890625, -2.940185546875, -2.8260498046875, -2.7119140625, -2.5977783203125, -2.483642578125, -2.3695068359375, -2.25537109375, -2.1412353515625, -2.027099609375, -1.9129638671875, -1.798828125, -1.6846923828125, -1.570556640625, -1.4564208984375, -1.34228515625, -1.2281494140625, -1.114013671875, -0.9998779296875, -0.8857421875, -0.7716064453125, -0.657470703125, -0.5433349609375, -0.42919921875, -0.3150634765625, -0.200927734375, -0.0867919921875, 0.02734375, 0.1414794921875, 0.255615234375, 0.3697509765625, 0.48388671875, 0.5980224609375, 0.712158203125, 0.8262939453125, 0.9404296875, 1.0545654296875, 1.168701171875, 1.2828369140625, 1.39697265625, 1.5111083984375, 1.625244140625, 1.7393798828125, 1.853515625, 1.9676513671875, 2.081787109375, 2.1959228515625, 2.31005859375, 2.4241943359375, 2.538330078125, 2.6524658203125, 2.7666015625, 2.8807373046875, 2.994873046875, 3.1090087890625, 3.22314453125, 3.3372802734375, 3.451416015625, 3.5655517578125, 3.6796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 13.0, 8.0, 6.0, 19.0, 17.0, 25.0, 24.0, 44.0, 39.0, 53.0, 83.0, 95.0, 136.0, 244.0, 347.0, 568.0, 1141.0, 2449.0, 6245.0, 18610.0, 70094.0, 351824.0, 467346.0, 91978.0, 23400.0, 7518.0, 2986.0, 1358.0, 666.0, 360.0, 226.0, 190.0, 111.0, 76.0, 62.0, 38.0, 32.0, 33.0, 18.0, 15.0, 11.0, 6.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8115234375, -0.7862396240234375, -0.760955810546875, -0.7356719970703125, -0.71038818359375, -0.6851043701171875, -0.659820556640625, -0.6345367431640625, -0.6092529296875, -0.5839691162109375, -0.558685302734375, -0.5334014892578125, -0.50811767578125, -0.4828338623046875, -0.457550048828125, -0.4322662353515625, -0.406982421875, -0.3816986083984375, -0.356414794921875, -0.3311309814453125, -0.30584716796875, -0.2805633544921875, -0.255279541015625, -0.2299957275390625, -0.2047119140625, -0.1794281005859375, -0.154144287109375, -0.1288604736328125, -0.10357666015625, -0.0782928466796875, -0.053009033203125, -0.0277252197265625, -0.00244140625, 0.0228424072265625, 0.048126220703125, 0.0734100341796875, 0.09869384765625, 0.1239776611328125, 0.149261474609375, 0.1745452880859375, 0.1998291015625, 0.2251129150390625, 0.250396728515625, 0.2756805419921875, 0.30096435546875, 0.3262481689453125, 0.351531982421875, 0.3768157958984375, 0.402099609375, 0.4273834228515625, 0.452667236328125, 0.4779510498046875, 0.50323486328125, 0.5285186767578125, 0.553802490234375, 0.5790863037109375, 0.6043701171875, 0.6296539306640625, 0.654937744140625, 0.6802215576171875, 0.70550537109375, 0.7307891845703125, 0.756072998046875, 0.7813568115234375, 0.806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 11.0, 3.0, 6.0, 11.0, 15.0, 13.0, 12.0, 17.0, 18.0, 22.0, 16.0, 24.0, 24.0, 28.0, 43.0, 37.0, 42.0, 40.0, 32.0, 36.0, 30.0, 47.0, 44.0, 39.0, 50.0, 28.0, 34.0, 30.0, 37.0, 26.0, 33.0, 28.0, 23.0, 17.0, 23.0, 14.0, 11.0, 8.0, 6.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.90625, -2.821929931640625, -2.73760986328125, -2.653289794921875, -2.5689697265625, -2.484649658203125, -2.40032958984375, -2.316009521484375, -2.231689453125, -2.147369384765625, -2.06304931640625, -1.978729248046875, -1.8944091796875, -1.810089111328125, -1.72576904296875, -1.641448974609375, -1.55712890625, -1.472808837890625, -1.38848876953125, -1.304168701171875, -1.2198486328125, -1.135528564453125, -1.05120849609375, -0.966888427734375, -0.882568359375, -0.798248291015625, -0.71392822265625, -0.629608154296875, -0.5452880859375, -0.460968017578125, -0.37664794921875, -0.292327880859375, -0.2080078125, -0.123687744140625, -0.03936767578125, 0.044952392578125, 0.1292724609375, 0.213592529296875, 0.29791259765625, 0.382232666015625, 0.466552734375, 0.550872802734375, 0.63519287109375, 0.719512939453125, 0.8038330078125, 0.888153076171875, 0.97247314453125, 1.056793212890625, 1.14111328125, 1.225433349609375, 1.30975341796875, 1.394073486328125, 1.4783935546875, 1.562713623046875, 1.64703369140625, 1.731353759765625, 1.815673828125, 1.899993896484375, 1.98431396484375, 2.068634033203125, 2.1529541015625, 2.237274169921875, 2.32159423828125, 2.405914306640625, 2.490234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 13.0, 30.0, 45.0, 46.0, 93.0, 156.0, 236.0, 428.0, 870.0, 1929.0, 5701.0, 26337.0, 266525.0, 676702.0, 54447.0, 9577.0, 2864.0, 1118.0, 586.0, 324.0, 158.0, 93.0, 74.0, 40.0, 33.0, 16.0, 13.0, 10.0, 9.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5947265625, -0.5768051147460938, -0.5588836669921875, -0.5409622192382812, -0.523040771484375, -0.5051193237304688, -0.4871978759765625, -0.46927642822265625, -0.45135498046875, -0.43343353271484375, -0.4155120849609375, -0.39759063720703125, -0.379669189453125, -0.36174774169921875, -0.3438262939453125, -0.32590484619140625, -0.3079833984375, -0.29006195068359375, -0.2721405029296875, -0.25421905517578125, -0.236297607421875, -0.21837615966796875, -0.2004547119140625, -0.18253326416015625, -0.16461181640625, -0.14669036865234375, -0.1287689208984375, -0.11084747314453125, -0.092926025390625, -0.07500457763671875, -0.0570831298828125, -0.03916168212890625, -0.021240234375, -0.00331878662109375, 0.0146026611328125, 0.03252410888671875, 0.050445556640625, 0.06836700439453125, 0.0862884521484375, 0.10420989990234375, 0.12213134765625, 0.14005279541015625, 0.1579742431640625, 0.17589569091796875, 0.193817138671875, 0.21173858642578125, 0.2296600341796875, 0.24758148193359375, 0.2655029296875, 0.28342437744140625, 0.3013458251953125, 0.31926727294921875, 0.337188720703125, 0.35511016845703125, 0.3730316162109375, 0.39095306396484375, 0.40887451171875, 0.42679595947265625, 0.4447174072265625, 0.46263885498046875, 0.480560302734375, 0.49848175048828125, 0.5164031982421875, 0.5343246459960938, 0.55224609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 4.0, 3.0, 12.0, 12.0, 14.0, 24.0, 29.0, 39.0, 54.0, 87.0, 127.0, 130.0, 139.0, 101.0, 53.0, 44.0, 31.0, 16.0, 14.0, 15.0, 13.0, 5.0, 10.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.930133819580078e-05, -9.665079414844513e-05, -9.400025010108948e-05, -9.134970605373383e-05, -8.869916200637817e-05, -8.604861795902252e-05, -8.339807391166687e-05, -8.074752986431122e-05, -7.809698581695557e-05, -7.544644176959991e-05, -7.279589772224426e-05, -7.014535367488861e-05, -6.749480962753296e-05, -6.484426558017731e-05, -6.219372153282166e-05, -5.9543177485466003e-05, -5.689263343811035e-05, -5.42420893907547e-05, -5.159154534339905e-05, -4.8941001296043396e-05, -4.6290457248687744e-05, -4.363991320133209e-05, -4.098936915397644e-05, -3.833882510662079e-05, -3.568828105926514e-05, -3.3037737011909485e-05, -3.0387192964553833e-05, -2.773664891719818e-05, -2.508610486984253e-05, -2.2435560822486877e-05, -1.9785016775131226e-05, -1.7134472727775574e-05, -1.4483928680419922e-05, -1.183338463306427e-05, -9.182840585708618e-06, -6.532296538352966e-06, -3.8817524909973145e-06, -1.2312084436416626e-06, 1.4193356037139893e-06, 4.069879651069641e-06, 6.720423698425293e-06, 9.370967745780945e-06, 1.2021511793136597e-05, 1.4672055840492249e-05, 1.73225998878479e-05, 1.9973143935203552e-05, 2.2623687982559204e-05, 2.5274232029914856e-05, 2.7924776077270508e-05, 3.057532012462616e-05, 3.322586417198181e-05, 3.587640821933746e-05, 3.8526952266693115e-05, 4.117749631404877e-05, 4.382804036140442e-05, 4.647858440876007e-05, 4.912912845611572e-05, 5.1779672503471375e-05, 5.4430216550827026e-05, 5.708076059818268e-05, 5.973130464553833e-05, 6.238184869289398e-05, 6.503239274024963e-05, 6.768293678760529e-05, 7.033348083496094e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 17.0, 22.0, 41.0, 63.0, 125.0, 245.0, 482.0, 1085.0, 2676.0, 9215.0, 55644.0, 738051.0, 211016.0, 21712.0, 4970.0, 1691.0, 675.0, 362.0, 177.0, 90.0, 53.0, 29.0, 19.0, 11.0, 13.0, 3.0, 9.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6298828125, -0.6087188720703125, -0.587554931640625, -0.5663909912109375, -0.54522705078125, -0.5240631103515625, -0.502899169921875, -0.4817352294921875, -0.4605712890625, -0.4394073486328125, -0.418243408203125, -0.3970794677734375, -0.37591552734375, -0.3547515869140625, -0.333587646484375, -0.3124237060546875, -0.291259765625, -0.2700958251953125, -0.248931884765625, -0.2277679443359375, -0.20660400390625, -0.1854400634765625, -0.164276123046875, -0.1431121826171875, -0.1219482421875, -0.1007843017578125, -0.079620361328125, -0.0584564208984375, -0.03729248046875, -0.0161285400390625, 0.005035400390625, 0.0261993408203125, 0.04736328125, 0.0685272216796875, 0.089691162109375, 0.1108551025390625, 0.13201904296875, 0.1531829833984375, 0.174346923828125, 0.1955108642578125, 0.2166748046875, 0.2378387451171875, 0.259002685546875, 0.2801666259765625, 0.30133056640625, 0.3224945068359375, 0.343658447265625, 0.3648223876953125, 0.385986328125, 0.4071502685546875, 0.428314208984375, 0.4494781494140625, 0.47064208984375, 0.4918060302734375, 0.512969970703125, 0.5341339111328125, 0.5552978515625, 0.5764617919921875, 0.597625732421875, 0.6187896728515625, 0.63995361328125, 0.6611175537109375, 0.682281494140625, 0.7034454345703125, 0.724609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 8.0, 17.0, 22.0, 45.0, 51.0, 96.0, 166.0, 193.0, 148.0, 84.0, 48.0, 38.0, 23.0, 18.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42194366455078125, -0.4093170166015625, -0.39669036865234375, -0.384063720703125, -0.37143707275390625, -0.3588104248046875, -0.34618377685546875, -0.33355712890625, -0.32093048095703125, -0.3083038330078125, -0.29567718505859375, -0.283050537109375, -0.27042388916015625, -0.2577972412109375, -0.24517059326171875, -0.2325439453125, -0.21991729736328125, -0.2072906494140625, -0.19466400146484375, -0.182037353515625, -0.16941070556640625, -0.1567840576171875, -0.14415740966796875, -0.13153076171875, -0.11890411376953125, -0.1062774658203125, -0.09365081787109375, -0.081024169921875, -0.06839752197265625, -0.0557708740234375, -0.04314422607421875, -0.030517578125, -0.01789093017578125, -0.0052642822265625, 0.00736236572265625, 0.019989013671875, 0.03261566162109375, 0.0452423095703125, 0.05786895751953125, 0.07049560546875, 0.08312225341796875, 0.0957489013671875, 0.10837554931640625, 0.121002197265625, 0.13362884521484375, 0.1462554931640625, 0.15888214111328125, 0.1715087890625, 0.18413543701171875, 0.1967620849609375, 0.20938873291015625, 0.222015380859375, 0.23464202880859375, 0.2472686767578125, 0.25989532470703125, 0.27252197265625, 0.28514862060546875, 0.2977752685546875, 0.31040191650390625, 0.323028564453125, 0.33565521240234375, 0.3482818603515625, 0.36090850830078125, 0.37353515625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 13.0, 40.0, 597.0, 310.0, 42.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.428099155426025, -6.589502334594727, -5.7509050369262695, -4.912308216094971, -4.073711395263672, -3.235114097595215, -2.396517276763916, -1.557919979095459, -0.7193231582641602, 0.119273841381073, 0.9578708410263062, 1.7964677810668945, 2.6350648403167725, 3.4736618995666504, 4.312258720397949, 5.150856018066406, 5.989452838897705, 6.828049659729004, 7.666646957397461, 8.505243301391602, 9.343840599060059, 10.182437896728516, 11.021034240722656, 11.85963249206543, 12.69822883605957, 13.536826133728027, 14.375422477722168, 15.214019775390625, 16.052616119384766, 16.89121437072754, 17.72981071472168, 18.568408966064453, 19.40700340270996, 20.2455997467041, 21.084197998046875, 21.922794342041016, 22.761390686035156, 23.59998893737793, 24.43858528137207, 25.277183532714844, 26.115779876708984, 26.954376220703125, 27.7929744720459, 28.63157081604004, 29.47016716003418, 30.308765411376953, 31.147361755371094, 31.985958099365234, 32.824554443359375, 33.663150787353516, 34.501747131347656, 35.34034729003906, 36.1789436340332, 37.017539978027344, 37.856136322021484, 38.694732666015625, 39.53333282470703, 40.37192916870117, 41.21052551269531, 42.04912567138672, 42.88772201538086, 43.726318359375, 44.56491470336914, 45.40351104736328, 46.24210739135742]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 11.0, 15.0, 6.0, 7.0, 11.0, 18.0, 21.0, 25.0, 49.0, 38.0, 40.0, 34.0, 45.0, 44.0, 62.0, 53.0, 48.0, 44.0, 49.0, 48.0, 45.0, 38.0, 47.0, 37.0, 23.0, 25.0, 23.0, 21.0, 16.0, 6.0, 16.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.437473297119141, -6.233244895935059, -6.029016017913818, -5.824787616729736, -5.620559215545654, -5.416330337524414, -5.212101936340332, -5.00787353515625, -4.803645133972168, -4.599416732788086, -4.395187854766846, -4.190959453582764, -3.9867310523986816, -3.7825024127960205, -3.5782737731933594, -3.3740453720092773, -3.169816493988037, -2.965587854385376, -2.761359453201294, -2.557130813598633, -2.352902412414551, -2.1486737728118896, -1.9444451332092285, -1.740216612815857, -1.5359880924224854, -1.3317595720291138, -1.1275310516357422, -0.923302412033081, -0.7190738916397095, -0.5148453712463379, -0.31061673164367676, -0.10638821125030518, 0.09784078598022461, 0.3020693361759186, 0.5062978863716125, 0.7105264663696289, 0.9147549867630005, 1.118983507156372, 1.3232121467590332, 1.5274406671524048, 1.7316691875457764, 1.935897707939148, 2.1401262283325195, 2.3443548679351807, 2.548583507537842, 2.752811908721924, 2.957040548324585, 3.161269187927246, 3.365497589111328, 3.5697262287139893, 3.7739546298980713, 3.9781832695007324, 4.1824116706848145, 4.386640548706055, 4.590868949890137, 4.795097351074219, 4.999325752258301, 5.203554153442383, 5.407783031463623, 5.612011432647705, 5.816239833831787, 6.020468711853027, 6.224697113037109, 6.428925514221191, 6.633154392242432]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 3.0, 14.0, 26.0, 28.0, 80.0, 123.0, 196.0, 358.0, 662.0, 1337.0, 2970.0, 7755.0, 27969.0, 177790.0, 3573611.0, 344438.0, 39749.0, 10243.0, 3620.0, 1550.0, 765.0, 441.0, 208.0, 135.0, 80.0, 47.0, 25.0, 20.0, 15.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.38812255859375, -2.3074951171875, -2.22686767578125, -2.146240234375, -2.06561279296875, -1.9849853515625, -1.90435791015625, -1.82373046875, -1.74310302734375, -1.6624755859375, -1.58184814453125, -1.501220703125, -1.42059326171875, -1.3399658203125, -1.25933837890625, -1.1787109375, -1.09808349609375, -1.0174560546875, -0.93682861328125, -0.856201171875, -0.77557373046875, -0.6949462890625, -0.61431884765625, -0.53369140625, -0.45306396484375, -0.3724365234375, -0.29180908203125, -0.211181640625, -0.13055419921875, -0.0499267578125, 0.03070068359375, 0.111328125, 0.19195556640625, 0.2725830078125, 0.35321044921875, 0.433837890625, 0.51446533203125, 0.5950927734375, 0.67572021484375, 0.75634765625, 0.83697509765625, 0.9176025390625, 0.99822998046875, 1.078857421875, 1.15948486328125, 1.2401123046875, 1.32073974609375, 1.4013671875, 1.48199462890625, 1.5626220703125, 1.64324951171875, 1.723876953125, 1.80450439453125, 1.8851318359375, 1.96575927734375, 2.04638671875, 2.12701416015625, 2.2076416015625, 2.28826904296875, 2.368896484375, 2.44952392578125, 2.5301513671875, 2.61077880859375, 2.69140625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 8.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 5.0, 19.0, 14.0, 18.0, 30.0, 30.0, 42.0, 47.0, 78.0, 83.0, 90.0, 90.0, 90.0, 57.0, 68.0, 33.0, 42.0, 36.0, 27.0, 21.0, 11.0, 10.0, 7.0, 5.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423828125, -1.37152099609375, -1.3192138671875, -1.26690673828125, -1.214599609375, -1.16229248046875, -1.1099853515625, -1.05767822265625, -1.00537109375, -0.95306396484375, -0.9007568359375, -0.84844970703125, -0.796142578125, -0.74383544921875, -0.6915283203125, -0.63922119140625, -0.5869140625, -0.53460693359375, -0.4822998046875, -0.42999267578125, -0.377685546875, -0.32537841796875, -0.2730712890625, -0.22076416015625, -0.16845703125, -0.11614990234375, -0.0638427734375, -0.01153564453125, 0.040771484375, 0.09307861328125, 0.1453857421875, 0.19769287109375, 0.25, 0.30230712890625, 0.3546142578125, 0.40692138671875, 0.459228515625, 0.51153564453125, 0.5638427734375, 0.61614990234375, 0.66845703125, 0.72076416015625, 0.7730712890625, 0.82537841796875, 0.877685546875, 0.92999267578125, 0.9822998046875, 1.03460693359375, 1.0869140625, 1.13922119140625, 1.1915283203125, 1.24383544921875, 1.296142578125, 1.34844970703125, 1.4007568359375, 1.45306396484375, 1.50537109375, 1.55767822265625, 1.6099853515625, 1.66229248046875, 1.714599609375, 1.76690673828125, 1.8192138671875, 1.87152099609375, 1.923828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 7.0, 11.0, 17.0, 19.0, 29.0, 43.0, 81.0, 123.0, 212.0, 349.0, 795.0, 1920.0, 6416.0, 34331.0, 879099.0, 3207453.0, 50880.0, 8240.0, 2356.0, 906.0, 409.0, 221.0, 118.0, 70.0, 50.0, 38.0, 21.0, 12.0, 11.0, 10.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.878021240234375, -2.77557373046875, -2.673126220703125, -2.5706787109375, -2.468231201171875, -2.36578369140625, -2.263336181640625, -2.160888671875, -2.058441162109375, -1.95599365234375, -1.853546142578125, -1.7510986328125, -1.648651123046875, -1.54620361328125, -1.443756103515625, -1.34130859375, -1.238861083984375, -1.13641357421875, -1.033966064453125, -0.9315185546875, -0.829071044921875, -0.72662353515625, -0.624176025390625, -0.521728515625, -0.419281005859375, -0.31683349609375, -0.214385986328125, -0.1119384765625, -0.009490966796875, 0.09295654296875, 0.195404052734375, 0.2978515625, 0.400299072265625, 0.50274658203125, 0.605194091796875, 0.7076416015625, 0.810089111328125, 0.91253662109375, 1.014984130859375, 1.117431640625, 1.219879150390625, 1.32232666015625, 1.424774169921875, 1.5272216796875, 1.629669189453125, 1.73211669921875, 1.834564208984375, 1.93701171875, 2.039459228515625, 2.14190673828125, 2.244354248046875, 2.3468017578125, 2.449249267578125, 2.55169677734375, 2.654144287109375, 2.756591796875, 2.859039306640625, 2.96148681640625, 3.063934326171875, 3.1663818359375, 3.268829345703125, 3.37127685546875, 3.473724365234375, 3.576171875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 13.0, 24.0, 40.0, 40.0, 67.0, 112.0, 172.0, 366.0, 1283.0, 1072.0, 377.0, 169.0, 111.0, 82.0, 35.0, 23.0, 22.0, 12.0, 15.0, 9.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7883071899414062, -0.7636260986328125, -0.7389450073242188, -0.714263916015625, -0.6895828247070312, -0.6649017333984375, -0.6402206420898438, -0.61553955078125, -0.5908584594726562, -0.5661773681640625, -0.5414962768554688, -0.516815185546875, -0.49213409423828125, -0.4674530029296875, -0.44277191162109375, -0.4180908203125, -0.39340972900390625, -0.3687286376953125, -0.34404754638671875, -0.319366455078125, -0.29468536376953125, -0.2700042724609375, -0.24532318115234375, -0.22064208984375, -0.19596099853515625, -0.1712799072265625, -0.14659881591796875, -0.121917724609375, -0.09723663330078125, -0.0725555419921875, -0.04787445068359375, -0.023193359375, 0.00148773193359375, 0.0261688232421875, 0.05084991455078125, 0.075531005859375, 0.10021209716796875, 0.1248931884765625, 0.14957427978515625, 0.17425537109375, 0.19893646240234375, 0.2236175537109375, 0.24829864501953125, 0.272979736328125, 0.29766082763671875, 0.3223419189453125, 0.34702301025390625, 0.3717041015625, 0.39638519287109375, 0.4210662841796875, 0.44574737548828125, 0.470428466796875, 0.49510955810546875, 0.5197906494140625, 0.5444717407226562, 0.56915283203125, 0.5938339233398438, 0.6185150146484375, 0.6431961059570312, 0.667877197265625, 0.6925582885742188, 0.7172393798828125, 0.7419204711914062, 0.7666015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 11.0, 17.0, 27.0, 43.0, 86.0, 131.0, 182.0, 201.0, 135.0, 52.0, 35.0, 21.0, 10.0, 11.0, 8.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7479658126831055, -4.625550270080566, -4.503134250640869, -4.38071870803833, -4.258302688598633, -4.135887145996094, -4.0134711265563965, -3.8910553455352783, -3.76863956451416, -3.646223783493042, -3.523808002471924, -3.4013922214508057, -3.2789764404296875, -3.1565606594085693, -3.034144878387451, -2.911729097366333, -2.789313316345215, -2.6668975353240967, -2.5444817543029785, -2.4220659732818604, -2.299650192260742, -2.177234411239624, -2.054818630218506, -1.9324028491973877, -1.8099873065948486, -1.6875715255737305, -1.5651557445526123, -1.4427399635314941, -1.320324182510376, -1.1979084014892578, -1.0754926204681396, -0.9530768990516663, -0.8306610584259033, -0.7082452774047852, -0.585829496383667, -0.4634137451648712, -0.34099796414375305, -0.21858221292495728, -0.09616643190383911, 0.026249349117279053, 0.14866513013839722, 0.2710809111595154, 0.39349669218063354, 0.5159124135971069, 0.6383281946182251, 0.7607439756393433, 0.8831597566604614, 1.0055755376815796, 1.1279913187026978, 1.250407099723816, 1.372822880744934, 1.4952386617660522, 1.6176544427871704, 1.740070104598999, 1.8624858856201172, 1.9849016666412354, 2.1073174476623535, 2.2297332286834717, 2.35214900970459, 2.474564790725708, 2.596980571746826, 2.7193963527679443, 2.8418121337890625, 2.9642279148101807, 3.086643695831299]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 7.0, 15.0, 16.0, 23.0, 31.0, 31.0, 54.0, 60.0, 68.0, 69.0, 81.0, 56.0, 78.0, 76.0, 54.0, 48.0, 38.0, 44.0, 35.0, 34.0, 19.0, 17.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7363262176513672, -1.6730821132659912, -1.6098381280899048, -1.5465940237045288, -1.4833500385284424, -1.4201059341430664, -1.3568618297576904, -1.2936177253723145, -1.230373740196228, -1.167129635810852, -1.1038856506347656, -1.0406415462493896, -0.9773975014686584, -0.9141534566879272, -0.8509093523025513, -0.7876653075218201, -0.7244212627410889, -0.6611772179603577, -0.5979331731796265, -0.5346890687942505, -0.4714450240135193, -0.4082009792327881, -0.3449569046497345, -0.2817128300666809, -0.2184687852859497, -0.1552247256040573, -0.09198066592216492, -0.028736606240272522, 0.03450745344161987, 0.09775149822235107, 0.16099557280540466, 0.22423964738845825, 0.28748393058776855, 0.35072797536849976, 0.41397204995155334, 0.47721612453460693, 0.5404601693153381, 0.6037042140960693, 0.6669483184814453, 0.7301923632621765, 0.7934364080429077, 0.8566804528236389, 0.9199244976043701, 0.9831686019897461, 1.046412706375122, 1.1096566915512085, 1.1729007959365845, 1.236144781112671, 1.2993888854980469, 1.3626329898834229, 1.4258769750595093, 1.4891210794448853, 1.5523650646209717, 1.6156091690063477, 1.6788532733917236, 1.7420973777770996, 1.805341362953186, 1.868585467338562, 1.9318294525146484, 1.9950735569000244, 2.0583176612854004, 2.1215615272521973, 2.1848056316375732, 2.248049736022949, 2.311293840408325]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 21.0, 30.0, 59.0, 84.0, 202.0, 597.0, 2628.0, 29748.0, 900015.0, 108418.0, 5221.0, 942.0, 272.0, 123.0, 72.0, 35.0, 24.0, 10.0, 11.0, 6.0, 6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.34168243408203125, -0.3288726806640625, -0.31606292724609375, -0.303253173828125, -0.29044342041015625, -0.2776336669921875, -0.26482391357421875, -0.25201416015625, -0.23920440673828125, -0.2263946533203125, -0.21358489990234375, -0.200775146484375, -0.18796539306640625, -0.1751556396484375, -0.16234588623046875, -0.1495361328125, -0.13672637939453125, -0.1239166259765625, -0.11110687255859375, -0.098297119140625, -0.08548736572265625, -0.0726776123046875, -0.05986785888671875, -0.04705810546875, -0.03424835205078125, -0.0214385986328125, -0.00862884521484375, 0.004180908203125, 0.01699066162109375, 0.0298004150390625, 0.04261016845703125, 0.055419921875, 0.06822967529296875, 0.0810394287109375, 0.09384918212890625, 0.106658935546875, 0.11946868896484375, 0.1322784423828125, 0.14508819580078125, 0.15789794921875, 0.17070770263671875, 0.1835174560546875, 0.19632720947265625, 0.209136962890625, 0.22194671630859375, 0.2347564697265625, 0.24756622314453125, 0.2603759765625, 0.27318572998046875, 0.2859954833984375, 0.29880523681640625, 0.311614990234375, 0.32442474365234375, 0.3372344970703125, 0.35004425048828125, 0.36285400390625, 0.37566375732421875, 0.3884735107421875, 0.40128326416015625, 0.414093017578125, 0.42690277099609375, 0.4397125244140625, 0.45252227783203125, 0.46533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 5.0, 5.0, 13.0, 15.0, 17.0, 41.0, 34.0, 59.0, 82.0, 100.0, 86.0, 95.0, 106.0, 69.0, 66.0, 52.0, 48.0, 39.0, 22.0, 10.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.448486328125, -1.38916015625, -1.329833984375, -1.2705078125, -1.211181640625, -1.15185546875, -1.092529296875, -1.033203125, -0.973876953125, -0.91455078125, -0.855224609375, -0.7958984375, -0.736572265625, -0.67724609375, -0.617919921875, -0.55859375, -0.499267578125, -0.43994140625, -0.380615234375, -0.3212890625, -0.261962890625, -0.20263671875, -0.143310546875, -0.083984375, -0.024658203125, 0.03466796875, 0.093994140625, 0.1533203125, 0.212646484375, 0.27197265625, 0.331298828125, 0.390625, 0.449951171875, 0.50927734375, 0.568603515625, 0.6279296875, 0.687255859375, 0.74658203125, 0.805908203125, 0.865234375, 0.924560546875, 0.98388671875, 1.043212890625, 1.1025390625, 1.161865234375, 1.22119140625, 1.280517578125, 1.33984375, 1.399169921875, 1.45849609375, 1.517822265625, 1.5771484375, 1.636474609375, 1.69580078125, 1.755126953125, 1.814453125, 1.873779296875, 1.93310546875, 1.992431640625, 2.0517578125, 2.111083984375, 2.17041015625, 2.229736328125, 2.2890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 6.0, 7.0, 14.0, 19.0, 23.0, 26.0, 30.0, 53.0, 77.0, 119.0, 194.0, 280.0, 641.0, 2088.0, 11946.0, 118976.0, 781921.0, 117575.0, 11177.0, 1888.0, 601.0, 291.0, 169.0, 119.0, 83.0, 43.0, 38.0, 26.0, 23.0, 17.0, 13.0, 7.0, 12.0, 6.0, 5.0, 10.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1600341796875, -0.15460777282714844, -0.14918136596679688, -0.1437549591064453, -0.13832855224609375, -0.1329021453857422, -0.12747573852539062, -0.12204933166503906, -0.1166229248046875, -0.11119651794433594, -0.10577011108398438, -0.10034370422363281, -0.09491729736328125, -0.08949089050292969, -0.08406448364257812, -0.07863807678222656, -0.073211669921875, -0.06778526306152344, -0.062358856201171875, -0.05693244934082031, -0.05150604248046875, -0.04607963562011719, -0.040653228759765625, -0.03522682189941406, -0.0298004150390625, -0.024374008178710938, -0.018947601318359375, -0.013521194458007812, -0.00809478759765625, -0.0026683807373046875, 0.002758026123046875, 0.008184432983398438, 0.01361083984375, 0.019037246704101562, 0.024463653564453125, 0.029890060424804688, 0.03531646728515625, 0.04074287414550781, 0.046169281005859375, 0.05159568786621094, 0.0570220947265625, 0.06244850158691406, 0.06787490844726562, 0.07330131530761719, 0.07872772216796875, 0.08415412902832031, 0.08958053588867188, 0.09500694274902344, 0.100433349609375, 0.10585975646972656, 0.11128616333007812, 0.11671257019042969, 0.12213897705078125, 0.1275653839111328, 0.13299179077148438, 0.13841819763183594, 0.1438446044921875, 0.14927101135253906, 0.15469741821289062, 0.1601238250732422, 0.16555023193359375, 0.1709766387939453, 0.17640304565429688, 0.18182945251464844, 0.187255859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 2.0, 6.0, 9.0, 9.0, 4.0, 11.0, 15.0, 15.0, 23.0, 26.0, 28.0, 18.0, 29.0, 36.0, 34.0, 52.0, 44.0, 54.0, 47.0, 51.0, 49.0, 40.0, 59.0, 42.0, 41.0, 35.0, 37.0, 35.0, 25.0, 16.0, 22.0, 19.0, 8.0, 11.0, 8.0, 8.0, 3.0, 6.0, 11.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.79315185546875, -1.7337646484375, -1.67437744140625, -1.614990234375, -1.55560302734375, -1.4962158203125, -1.43682861328125, -1.37744140625, -1.31805419921875, -1.2586669921875, -1.19927978515625, -1.139892578125, -1.08050537109375, -1.0211181640625, -0.96173095703125, -0.90234375, -0.84295654296875, -0.7835693359375, -0.72418212890625, -0.664794921875, -0.60540771484375, -0.5460205078125, -0.48663330078125, -0.42724609375, -0.36785888671875, -0.3084716796875, -0.24908447265625, -0.189697265625, -0.13031005859375, -0.0709228515625, -0.01153564453125, 0.0478515625, 0.10723876953125, 0.1666259765625, 0.22601318359375, 0.285400390625, 0.34478759765625, 0.4041748046875, 0.46356201171875, 0.52294921875, 0.58233642578125, 0.6417236328125, 0.70111083984375, 0.760498046875, 0.81988525390625, 0.8792724609375, 0.93865966796875, 0.998046875, 1.05743408203125, 1.1168212890625, 1.17620849609375, 1.235595703125, 1.29498291015625, 1.3543701171875, 1.41375732421875, 1.47314453125, 1.53253173828125, 1.5919189453125, 1.65130615234375, 1.710693359375, 1.77008056640625, 1.8294677734375, 1.88885498046875, 1.9482421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 7.0, 13.0, 19.0, 20.0, 33.0, 43.0, 52.0, 79.0, 154.0, 304.0, 750.0, 2927.0, 77190.0, 958491.0, 6466.0, 1093.0, 357.0, 184.0, 102.0, 66.0, 42.0, 41.0, 25.0, 21.0, 14.0, 10.0, 7.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.041182518005371094, -0.03960990905761719, -0.03803730010986328, -0.036464691162109375, -0.03489208221435547, -0.03331947326660156, -0.031746864318847656, -0.03017425537109375, -0.028601646423339844, -0.027029037475585938, -0.02545642852783203, -0.023883819580078125, -0.02231121063232422, -0.020738601684570312, -0.019165992736816406, -0.0175933837890625, -0.016020774841308594, -0.014448165893554688, -0.012875556945800781, -0.011302947998046875, -0.009730339050292969, -0.008157730102539062, -0.006585121154785156, -0.00501251220703125, -0.0034399032592773438, -0.0018672943115234375, -0.00029468536376953125, 0.001277923583984375, 0.0028505325317382812, 0.0044231414794921875, 0.005995750427246094, 0.007568359375, 0.009140968322753906, 0.010713577270507812, 0.012286186218261719, 0.013858795166015625, 0.015431404113769531, 0.017004013061523438, 0.018576622009277344, 0.02014923095703125, 0.021721839904785156, 0.023294448852539062, 0.02486705780029297, 0.026439666748046875, 0.02801227569580078, 0.029584884643554688, 0.031157493591308594, 0.0327301025390625, 0.034302711486816406, 0.03587532043457031, 0.03744792938232422, 0.039020538330078125, 0.04059314727783203, 0.04216575622558594, 0.043738365173339844, 0.04531097412109375, 0.046883583068847656, 0.04845619201660156, 0.05002880096435547, 0.051601409912109375, 0.05317401885986328, 0.05474662780761719, 0.056319236755371094, 0.057891845703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 4.0, 13.0, 25.0, 21.0, 33.0, 67.0, 117.0, 160.0, 138.0, 125.0, 89.0, 64.0, 46.0, 29.0, 10.0, 10.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3530254364013672e-05, -1.2949109077453613e-05, -1.2367963790893555e-05, -1.1786818504333496e-05, -1.1205673217773438e-05, -1.0624527931213379e-05, -1.004338264465332e-05, -9.462237358093262e-06, -8.881092071533203e-06, -8.299946784973145e-06, -7.718801498413086e-06, -7.137656211853027e-06, -6.556510925292969e-06, -5.97536563873291e-06, -5.3942203521728516e-06, -4.813075065612793e-06, -4.231929779052734e-06, -3.6507844924926758e-06, -3.069639205932617e-06, -2.4884939193725586e-06, -1.9073486328125e-06, -1.3262033462524414e-06, -7.450580596923828e-07, -1.6391277313232422e-07, 4.172325134277344e-07, 9.98377799987793e-07, 1.5795230865478516e-06, 2.16066837310791e-06, 2.7418136596679688e-06, 3.3229589462280273e-06, 3.904104232788086e-06, 4.4852495193481445e-06, 5.066394805908203e-06, 5.647540092468262e-06, 6.22868537902832e-06, 6.809830665588379e-06, 7.3909759521484375e-06, 7.972121238708496e-06, 8.553266525268555e-06, 9.134411811828613e-06, 9.715557098388672e-06, 1.029670238494873e-05, 1.0877847671508789e-05, 1.1458992958068848e-05, 1.2040138244628906e-05, 1.2621283531188965e-05, 1.3202428817749023e-05, 1.3783574104309082e-05, 1.436471939086914e-05, 1.49458646774292e-05, 1.5527009963989258e-05, 1.6108155250549316e-05, 1.6689300537109375e-05, 1.7270445823669434e-05, 1.7851591110229492e-05, 1.843273639678955e-05, 1.901388168334961e-05, 1.9595026969909668e-05, 2.0176172256469727e-05, 2.0757317543029785e-05, 2.1338462829589844e-05, 2.1919608116149902e-05, 2.250075340270996e-05, 2.308189868927002e-05, 2.3663043975830078e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 12.0, 30.0, 25.0, 42.0, 73.0, 96.0, 188.0, 381.0, 736.0, 2432.0, 13394.0, 902416.0, 118971.0, 6831.0, 1614.0, 560.0, 297.0, 148.0, 85.0, 64.0, 50.0, 31.0, 17.0, 13.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06486892700195312, -0.06253814697265625, -0.060207366943359375, -0.0578765869140625, -0.055545806884765625, -0.05321502685546875, -0.050884246826171875, -0.048553466796875, -0.046222686767578125, -0.04389190673828125, -0.041561126708984375, -0.0392303466796875, -0.036899566650390625, -0.03456878662109375, -0.032238006591796875, -0.0299072265625, -0.027576446533203125, -0.02524566650390625, -0.022914886474609375, -0.0205841064453125, -0.018253326416015625, -0.01592254638671875, -0.013591766357421875, -0.011260986328125, -0.008930206298828125, -0.00659942626953125, -0.004268646240234375, -0.0019378662109375, 0.000392913818359375, 0.00272369384765625, 0.005054473876953125, 0.00738525390625, 0.009716033935546875, 0.01204681396484375, 0.014377593994140625, 0.0167083740234375, 0.019039154052734375, 0.02136993408203125, 0.023700714111328125, 0.026031494140625, 0.028362274169921875, 0.03069305419921875, 0.033023834228515625, 0.0353546142578125, 0.037685394287109375, 0.04001617431640625, 0.042346954345703125, 0.044677734375, 0.047008514404296875, 0.04933929443359375, 0.051670074462890625, 0.0540008544921875, 0.056331634521484375, 0.05866241455078125, 0.060993194580078125, 0.063323974609375, 0.06565475463867188, 0.06798553466796875, 0.07031631469726562, 0.0726470947265625, 0.07497787475585938, 0.07730865478515625, 0.07963943481445312, 0.08197021484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 10.0, 11.0, 14.0, 25.0, 32.0, 38.0, 78.0, 161.0, 183.0, 167.0, 95.0, 53.0, 33.0, 27.0, 23.0, 12.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00777435302734375, -0.007582962512969971, -0.007391571998596191, -0.007200181484222412, -0.007008790969848633, -0.0068174004554748535, -0.006626009941101074, -0.006434619426727295, -0.006243228912353516, -0.006051838397979736, -0.005860447883605957, -0.005669057369232178, -0.0054776668548583984, -0.005286276340484619, -0.00509488582611084, -0.0049034953117370605, -0.004712104797363281, -0.004520714282989502, -0.004329323768615723, -0.004137933254241943, -0.003946542739868164, -0.0037551522254943848, -0.0035637617111206055, -0.003372371196746826, -0.003180980682373047, -0.0029895901679992676, -0.0027981996536254883, -0.002606809139251709, -0.0024154186248779297, -0.0022240281105041504, -0.002032637596130371, -0.0018412470817565918, -0.0016498565673828125, -0.0014584660530090332, -0.001267075538635254, -0.0010756850242614746, -0.0008842945098876953, -0.000692903995513916, -0.0005015134811401367, -0.0003101229667663574, -0.00011873245239257812, 7.265806198120117e-05, 0.00026404857635498047, 0.00045543909072875977, 0.0006468296051025391, 0.0008382201194763184, 0.0010296106338500977, 0.001221001148223877, 0.0014123916625976562, 0.0016037821769714355, 0.0017951726913452148, 0.001986563205718994, 0.0021779537200927734, 0.0023693442344665527, 0.002560734748840332, 0.0027521252632141113, 0.0029435157775878906, 0.00313490629196167, 0.0033262968063354492, 0.0035176873207092285, 0.003709077835083008, 0.003900468349456787, 0.004091858863830566, 0.004283249378204346, 0.004474639892578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 12.0, 17.0, 30.0, 40.0, 101.0, 195.0, 228.0, 194.0, 74.0, 43.0, 16.0, 14.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8177742958068848, -3.7183310985565186, -3.6188876628875732, -3.519444465637207, -3.420001268386841, -3.3205578327178955, -3.2211146354675293, -3.121671199798584, -3.0222280025482178, -2.9227848052978516, -2.8233413696289062, -2.72389817237854, -2.624454975128174, -2.5250115394592285, -2.4255683422088623, -2.326125144958496, -2.226681709289551, -2.1272385120391846, -2.0277950763702393, -1.928351879119873, -1.8289085626602173, -1.7294652462005615, -1.6300220489501953, -1.5305787324905396, -1.431135654449463, -1.3316923379898071, -1.232249140739441, -1.1328058242797852, -1.0333625078201294, -0.9339192509651184, -0.8344759941101074, -0.7350326776504517, -0.6355893611907959, -0.5361461043357849, -0.43670278787612915, -0.33725953102111816, -0.2378162443637848, -0.13837295770645142, -0.03892970085144043, 0.06051361560821533, 0.15995687246322632, 0.2594001591205597, 0.35884344577789307, 0.45828670263290405, 0.557729959487915, 0.6571732759475708, 0.7566165328025818, 0.8560598492622375, 0.9555031061172485, 1.0549464225769043, 1.1543896198272705, 1.2538329362869263, 1.353276252746582, 1.4527194499969482, 1.552162766456604, 1.6516060829162598, 1.751049280166626, 1.8504925966262817, 1.949935793876648, 2.0493791103363037, 2.14882230758667, 2.2482657432556152, 2.3477089405059814, 2.4471521377563477, 2.546595573425293]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 5.0, 15.0, 19.0, 26.0, 34.0, 40.0, 71.0, 72.0, 93.0, 100.0, 81.0, 99.0, 74.0, 52.0, 54.0, 46.0, 37.0, 20.0, 18.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.456957459449768, -1.4033881425857544, -1.3498188257217407, -1.2962493896484375, -1.2426800727844238, -1.1891107559204102, -1.1355414390563965, -1.0819721221923828, -1.0284026861190796, -0.9748333692550659, -0.9212639927864075, -0.8676946759223938, -0.8141252994537354, -0.7605559825897217, -0.706986665725708, -0.6534172892570496, -0.5998479723930359, -0.5462786555290222, -0.49270927906036377, -0.4391399621963501, -0.38557058572769165, -0.332001268863678, -0.2784319221973419, -0.22486257553100586, -0.1712932288646698, -0.11772388219833374, -0.06415454298257828, -0.010585203766822815, 0.042984142899513245, 0.09655347466468811, 0.15012282133102417, 0.20369216799736023, 0.2572615146636963, 0.31083086133003235, 0.3644002079963684, 0.4179695248603821, 0.4715389013290405, 0.5251082181930542, 0.5786775350570679, 0.6322469115257263, 0.6858162879943848, 0.7393856048583984, 0.7929549813270569, 0.8465242981910706, 0.900093674659729, 0.9536629915237427, 1.0072323083877563, 1.0608017444610596, 1.1143710613250732, 1.167940378189087, 1.2215096950531006, 1.2750791311264038, 1.3286484479904175, 1.3822177648544312, 1.4357870817184448, 1.489356517791748, 1.5429257154464722, 1.5964950323104858, 1.6500643491744995, 1.7036337852478027, 1.7572031021118164, 1.81077241897583, 1.8643417358398438, 1.9179110527038574, 1.9714804887771606]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 8.0, 13.0, 17.0, 14.0, 22.0, 26.0, 31.0, 54.0, 84.0, 111.0, 176.0, 222.0, 403.0, 563.0, 841.0, 1422.0, 2252.0, 3897.0, 7671.0, 17071.0, 53099.0, 326071.0, 521631.0, 71639.0, 21178.0, 8709.0, 4460.0, 2472.0, 1487.0, 976.0, 592.0, 429.0, 277.0, 170.0, 124.0, 95.0, 68.0, 47.0, 41.0, 30.0, 17.0, 13.0, 8.0, 8.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.228515625, -1.19140625, -1.154296875, -1.1171875, -1.080078125, -1.04296875, -1.005859375, -0.96875, -0.931640625, -0.89453125, -0.857421875, -0.8203125, -0.783203125, -0.74609375, -0.708984375, -0.671875, -0.634765625, -0.59765625, -0.560546875, -0.5234375, -0.486328125, -0.44921875, -0.412109375, -0.375, -0.337890625, -0.30078125, -0.263671875, -0.2265625, -0.189453125, -0.15234375, -0.115234375, -0.078125, -0.041015625, -0.00390625, 0.033203125, 0.0703125, 0.107421875, 0.14453125, 0.181640625, 0.21875, 0.255859375, 0.29296875, 0.330078125, 0.3671875, 0.404296875, 0.44140625, 0.478515625, 0.515625, 0.552734375, 0.58984375, 0.626953125, 0.6640625, 0.701171875, 0.73828125, 0.775390625, 0.8125, 0.849609375, 0.88671875, 0.923828125, 0.9609375, 0.998046875, 1.03515625, 1.072265625, 1.109375, 1.146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 12.0, 10.0, 12.0, 25.0, 26.0, 37.0, 57.0, 55.0, 87.0, 78.0, 93.0, 97.0, 82.0, 51.0, 62.0, 47.0, 48.0, 39.0, 17.0, 15.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.138671875, -3.033172607421875, -2.92767333984375, -2.822174072265625, -2.7166748046875, -2.611175537109375, -2.50567626953125, -2.400177001953125, -2.294677734375, -2.189178466796875, -2.08367919921875, -1.978179931640625, -1.8726806640625, -1.767181396484375, -1.66168212890625, -1.556182861328125, -1.45068359375, -1.345184326171875, -1.23968505859375, -1.134185791015625, -1.0286865234375, -0.923187255859375, -0.81768798828125, -0.712188720703125, -0.606689453125, -0.501190185546875, -0.39569091796875, -0.290191650390625, -0.1846923828125, -0.079193115234375, 0.02630615234375, 0.131805419921875, 0.2373046875, 0.342803955078125, 0.44830322265625, 0.553802490234375, 0.6593017578125, 0.764801025390625, 0.87030029296875, 0.975799560546875, 1.081298828125, 1.186798095703125, 1.29229736328125, 1.397796630859375, 1.5032958984375, 1.608795166015625, 1.71429443359375, 1.819793701171875, 1.92529296875, 2.030792236328125, 2.13629150390625, 2.241790771484375, 2.3472900390625, 2.452789306640625, 2.55828857421875, 2.663787841796875, 2.769287109375, 2.874786376953125, 2.98028564453125, 3.085784912109375, 3.1912841796875, 3.296783447265625, 3.40228271484375, 3.507781982421875, 3.61328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 5.0, 17.0, 18.0, 16.0, 37.0, 46.0, 79.0, 139.0, 259.0, 549.0, 1151.0, 3040.0, 10414.0, 55376.0, 827832.0, 125984.0, 16092.0, 4599.0, 1491.0, 665.0, 299.0, 160.0, 80.0, 62.0, 47.0, 27.0, 19.0, 11.0, 15.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7138671875, -1.657958984375, -1.60205078125, -1.546142578125, -1.490234375, -1.434326171875, -1.37841796875, -1.322509765625, -1.2666015625, -1.210693359375, -1.15478515625, -1.098876953125, -1.04296875, -0.987060546875, -0.93115234375, -0.875244140625, -0.8193359375, -0.763427734375, -0.70751953125, -0.651611328125, -0.595703125, -0.539794921875, -0.48388671875, -0.427978515625, -0.3720703125, -0.316162109375, -0.26025390625, -0.204345703125, -0.1484375, -0.092529296875, -0.03662109375, 0.019287109375, 0.0751953125, 0.131103515625, 0.18701171875, 0.242919921875, 0.298828125, 0.354736328125, 0.41064453125, 0.466552734375, 0.5224609375, 0.578369140625, 0.63427734375, 0.690185546875, 0.74609375, 0.802001953125, 0.85791015625, 0.913818359375, 0.9697265625, 1.025634765625, 1.08154296875, 1.137451171875, 1.193359375, 1.249267578125, 1.30517578125, 1.361083984375, 1.4169921875, 1.472900390625, 1.52880859375, 1.584716796875, 1.640625, 1.696533203125, 1.75244140625, 1.808349609375, 1.8642578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 3.0, 10.0, 7.0, 12.0, 17.0, 18.0, 25.0, 37.0, 30.0, 27.0, 34.0, 22.0, 32.0, 53.0, 56.0, 47.0, 43.0, 50.0, 33.0, 45.0, 45.0, 39.0, 41.0, 34.0, 33.0, 32.0, 34.0, 20.0, 21.0, 11.0, 11.0, 13.0, 9.0, 13.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2734375, -2.18695068359375, -2.1004638671875, -2.01397705078125, -1.927490234375, -1.84100341796875, -1.7545166015625, -1.66802978515625, -1.58154296875, -1.49505615234375, -1.4085693359375, -1.32208251953125, -1.235595703125, -1.14910888671875, -1.0626220703125, -0.97613525390625, -0.8896484375, -0.80316162109375, -0.7166748046875, -0.63018798828125, -0.543701171875, -0.45721435546875, -0.3707275390625, -0.28424072265625, -0.19775390625, -0.11126708984375, -0.0247802734375, 0.06170654296875, 0.148193359375, 0.23468017578125, 0.3211669921875, 0.40765380859375, 0.494140625, 0.58062744140625, 0.6671142578125, 0.75360107421875, 0.840087890625, 0.92657470703125, 1.0130615234375, 1.09954833984375, 1.18603515625, 1.27252197265625, 1.3590087890625, 1.44549560546875, 1.531982421875, 1.61846923828125, 1.7049560546875, 1.79144287109375, 1.8779296875, 1.96441650390625, 2.0509033203125, 2.13739013671875, 2.223876953125, 2.31036376953125, 2.3968505859375, 2.48333740234375, 2.56982421875, 2.65631103515625, 2.7427978515625, 2.82928466796875, 2.915771484375, 3.00225830078125, 3.0887451171875, 3.17523193359375, 3.26171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 10.0, 6.0, 11.0, 10.0, 12.0, 17.0, 37.0, 62.0, 86.0, 170.0, 392.0, 924.0, 2452.0, 8842.0, 115516.0, 890727.0, 22301.0, 4370.0, 1431.0, 566.0, 274.0, 137.0, 73.0, 36.0, 30.0, 19.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2808074951171875, -1.242279052734375, -1.2037506103515625, -1.16522216796875, -1.1266937255859375, -1.088165283203125, -1.0496368408203125, -1.0111083984375, -0.9725799560546875, -0.934051513671875, -0.8955230712890625, -0.85699462890625, -0.8184661865234375, -0.779937744140625, -0.7414093017578125, -0.702880859375, -0.6643524169921875, -0.625823974609375, -0.5872955322265625, -0.54876708984375, -0.5102386474609375, -0.471710205078125, -0.4331817626953125, -0.3946533203125, -0.3561248779296875, -0.317596435546875, -0.2790679931640625, -0.24053955078125, -0.2020111083984375, -0.163482666015625, -0.1249542236328125, -0.08642578125, -0.0478973388671875, -0.009368896484375, 0.0291595458984375, 0.06768798828125, 0.1062164306640625, 0.144744873046875, 0.1832733154296875, 0.2218017578125, 0.2603302001953125, 0.298858642578125, 0.3373870849609375, 0.37591552734375, 0.4144439697265625, 0.452972412109375, 0.4915008544921875, 0.530029296875, 0.5685577392578125, 0.607086181640625, 0.6456146240234375, 0.68414306640625, 0.7226715087890625, 0.761199951171875, 0.7997283935546875, 0.8382568359375, 0.8767852783203125, 0.915313720703125, 0.9538421630859375, 0.99237060546875, 1.0308990478515625, 1.069427490234375, 1.1079559326171875, 1.146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 6.0, 18.0, 34.0, 65.0, 120.0, 319.0, 217.0, 94.0, 44.0, 19.0, 17.0, 16.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018586963415145874, -0.00018052756786346436, -0.00017518550157546997, -0.00016984343528747559, -0.0001645013689994812, -0.00015915930271148682, -0.00015381723642349243, -0.00014847517013549805, -0.00014313310384750366, -0.00013779103755950928, -0.0001324489712715149, -0.0001271069049835205, -0.00012176483869552612, -0.00011642277240753174, -0.00011108070611953735, -0.00010573863983154297, -0.00010039657354354858, -9.50545072555542e-05, -8.971244096755981e-05, -8.437037467956543e-05, -7.902830839157104e-05, -7.368624210357666e-05, -6.834417581558228e-05, -6.300210952758789e-05, -5.7660043239593506e-05, -5.231797695159912e-05, -4.6975910663604736e-05, -4.163384437561035e-05, -3.629177808761597e-05, -3.094971179962158e-05, -2.5607645511627197e-05, -2.0265579223632812e-05, -1.4923512935638428e-05, -9.581446647644043e-06, -4.239380359649658e-06, 1.1026859283447266e-06, 6.444752216339111e-06, 1.1786818504333496e-05, 1.712888479232788e-05, 2.2470951080322266e-05, 2.781301736831665e-05, 3.3155083656311035e-05, 3.849714994430542e-05, 4.3839216232299805e-05, 4.918128252029419e-05, 5.4523348808288574e-05, 5.986541509628296e-05, 6.520748138427734e-05, 7.054954767227173e-05, 7.589161396026611e-05, 8.12336802482605e-05, 8.657574653625488e-05, 9.191781282424927e-05, 9.725987911224365e-05, 0.00010260194540023804, 0.00010794401168823242, 0.0001132860779762268, 0.00011862814426422119, 0.00012397021055221558, 0.00012931227684020996, 0.00013465434312820435, 0.00013999640941619873, 0.00014533847570419312, 0.0001506805419921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 10.0, 16.0, 14.0, 17.0, 30.0, 31.0, 55.0, 94.0, 128.0, 195.0, 407.0, 834.0, 2122.0, 6401.0, 32086.0, 768428.0, 212721.0, 17541.0, 4284.0, 1566.0, 654.0, 353.0, 185.0, 103.0, 62.0, 55.0, 41.0, 21.0, 13.0, 12.0, 8.0, 9.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.880859375, -0.852294921875, -0.82373046875, -0.795166015625, -0.7666015625, -0.738037109375, -0.70947265625, -0.680908203125, -0.65234375, -0.623779296875, -0.59521484375, -0.566650390625, -0.5380859375, -0.509521484375, -0.48095703125, -0.452392578125, -0.423828125, -0.395263671875, -0.36669921875, -0.338134765625, -0.3095703125, -0.281005859375, -0.25244140625, -0.223876953125, -0.1953125, -0.166748046875, -0.13818359375, -0.109619140625, -0.0810546875, -0.052490234375, -0.02392578125, 0.004638671875, 0.033203125, 0.061767578125, 0.09033203125, 0.118896484375, 0.1474609375, 0.176025390625, 0.20458984375, 0.233154296875, 0.26171875, 0.290283203125, 0.31884765625, 0.347412109375, 0.3759765625, 0.404541015625, 0.43310546875, 0.461669921875, 0.490234375, 0.518798828125, 0.54736328125, 0.575927734375, 0.6044921875, 0.633056640625, 0.66162109375, 0.690185546875, 0.71875, 0.747314453125, 0.77587890625, 0.804443359375, 0.8330078125, 0.861572265625, 0.89013671875, 0.918701171875, 0.947265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 4.0, 8.0, 9.0, 7.0, 13.0, 14.0, 24.0, 45.0, 98.0, 154.0, 264.0, 140.0, 75.0, 45.0, 28.0, 10.0, 10.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37841796875, -0.36554718017578125, -0.3526763916015625, -0.33980560302734375, -0.326934814453125, -0.31406402587890625, -0.3011932373046875, -0.28832244873046875, -0.27545166015625, -0.26258087158203125, -0.2497100830078125, -0.23683929443359375, -0.223968505859375, -0.21109771728515625, -0.1982269287109375, -0.18535614013671875, -0.1724853515625, -0.15961456298828125, -0.1467437744140625, -0.13387298583984375, -0.121002197265625, -0.10813140869140625, -0.0952606201171875, -0.08238983154296875, -0.06951904296875, -0.05664825439453125, -0.0437774658203125, -0.03090667724609375, -0.018035888671875, -0.00516510009765625, 0.0077056884765625, 0.02057647705078125, 0.033447265625, 0.04631805419921875, 0.0591888427734375, 0.07205963134765625, 0.084930419921875, 0.09780120849609375, 0.1106719970703125, 0.12354278564453125, 0.13641357421875, 0.14928436279296875, 0.1621551513671875, 0.17502593994140625, 0.187896728515625, 0.20076751708984375, 0.2136383056640625, 0.22650909423828125, 0.2393798828125, 0.25225067138671875, 0.2651214599609375, 0.27799224853515625, 0.290863037109375, 0.30373382568359375, 0.3166046142578125, 0.32947540283203125, 0.34234619140625, 0.35521697998046875, 0.3680877685546875, 0.38095855712890625, 0.393829345703125, 0.40670013427734375, 0.4195709228515625, 0.43244171142578125, 0.4453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 33.0, 155.0, 506.0, 231.0, 44.0, 15.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.974451065063477, -15.452621459960938, -14.930791854858398, -14.40896224975586, -13.88713264465332, -13.365303039550781, -12.843472480773926, -12.321642875671387, -11.799813270568848, -11.277983665466309, -10.75615406036377, -10.23432445526123, -9.712493896484375, -9.190664291381836, -8.668834686279297, -8.147005081176758, -7.625175476074219, -7.10334587097168, -6.581516265869141, -6.059686183929443, -5.537856578826904, -5.016026973724365, -4.494196891784668, -3.972367286682129, -3.45053768157959, -2.928708076477051, -2.4068782329559326, -1.885048508644104, -1.3632187843322754, -0.8413891792297363, -0.31955933570861816, 0.2022705078125, 0.7240982055664062, 1.2459279298782349, 1.7677576541900635, 2.2895874977111816, 2.8114171028137207, 3.3332467079162598, 3.855076551437378, 4.376906394958496, 4.898736000061035, 5.420565605163574, 5.942395210266113, 6.4642252922058105, 6.98605489730835, 7.507884502410889, 8.029714584350586, 8.551544189453125, 9.073373794555664, 9.595203399658203, 10.117033004760742, 10.638862609863281, 11.16069221496582, 11.68252182006836, 12.204352378845215, 12.726181983947754, 13.248011589050293, 13.769841194152832, 14.291670799255371, 14.81350040435791, 15.335330963134766, 15.857160568237305, 16.378990173339844, 16.900819778442383, 17.422649383544922]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 2.0, 10.0, 10.0, 14.0, 18.0, 19.0, 21.0, 35.0, 34.0, 27.0, 36.0, 53.0, 49.0, 48.0, 61.0, 56.0, 64.0, 47.0, 60.0, 60.0, 38.0, 38.0, 36.0, 32.0, 24.0, 23.0, 19.0, 14.0, 14.0, 11.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.235995769500732, -5.043769836425781, -4.85154390335083, -4.659317970275879, -4.467092514038086, -4.274866580963135, -4.082640647888184, -3.8904147148132324, -3.6981887817382812, -3.50596284866333, -3.313736915588379, -3.121511220932007, -2.9292852878570557, -2.7370593547821045, -2.5448336601257324, -2.3526077270507812, -2.16038179397583, -1.968155860900879, -1.7759300470352173, -1.5837042331695557, -1.3914783000946045, -1.1992523670196533, -1.0070265531539917, -0.8148007392883301, -0.6225748062133789, -0.4303489327430725, -0.2381230592727661, -0.04589718580245972, 0.14632868766784668, 0.3385545611381531, 0.5307804346084595, 0.7230062484741211, 0.9152321815490723, 1.1074581146240234, 1.299683928489685, 1.4919097423553467, 1.6841356754302979, 1.876361608505249, 2.068587303161621, 2.2608132362365723, 2.4530391693115234, 2.6452651023864746, 2.837491035461426, 3.029716730117798, 3.221942663192749, 3.4141685962677, 3.6063942909240723, 3.7986202239990234, 3.9908461570739746, 4.183072090148926, 4.375298023223877, 4.567523956298828, 4.759749412536621, 4.951975345611572, 5.144201278686523, 5.336427211761475, 5.528653144836426, 5.720879077911377, 5.913105010986328, 6.105330944061279, 6.2975568771362305, 6.489782333374023, 6.682008266448975, 6.874234199523926, 7.066460132598877]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 13.0, 14.0, 12.0, 23.0, 29.0, 52.0, 77.0, 141.0, 221.0, 462.0, 916.0, 2317.0, 6905.0, 29545.0, 302855.0, 3683640.0, 139709.0, 18546.0, 5056.0, 1929.0, 853.0, 381.0, 210.0, 145.0, 90.0, 49.0, 28.0, 18.0, 17.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.800384521484375, -2.70819091796875, -2.615997314453125, -2.5238037109375, -2.431610107421875, -2.33941650390625, -2.247222900390625, -2.155029296875, -2.062835693359375, -1.97064208984375, -1.878448486328125, -1.7862548828125, -1.694061279296875, -1.60186767578125, -1.509674072265625, -1.41748046875, -1.325286865234375, -1.23309326171875, -1.140899658203125, -1.0487060546875, -0.956512451171875, -0.86431884765625, -0.772125244140625, -0.679931640625, -0.587738037109375, -0.49554443359375, -0.403350830078125, -0.3111572265625, -0.218963623046875, -0.12677001953125, -0.034576416015625, 0.0576171875, 0.149810791015625, 0.24200439453125, 0.334197998046875, 0.4263916015625, 0.518585205078125, 0.61077880859375, 0.702972412109375, 0.795166015625, 0.887359619140625, 0.97955322265625, 1.071746826171875, 1.1639404296875, 1.256134033203125, 1.34832763671875, 1.440521240234375, 1.53271484375, 1.624908447265625, 1.71710205078125, 1.809295654296875, 1.9014892578125, 1.993682861328125, 2.08587646484375, 2.178070068359375, 2.270263671875, 2.362457275390625, 2.45465087890625, 2.546844482421875, 2.6390380859375, 2.731231689453125, 2.82342529296875, 2.915618896484375, 3.0078125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 8.0, 6.0, 4.0, 15.0, 6.0, 23.0, 28.0, 29.0, 42.0, 62.0, 73.0, 92.0, 74.0, 90.0, 82.0, 67.0, 78.0, 54.0, 41.0, 30.0, 19.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3591461181640625, -1.303253173828125, -1.2473602294921875, -1.19146728515625, -1.1355743408203125, -1.079681396484375, -1.0237884521484375, -0.9678955078125, -0.9120025634765625, -0.856109619140625, -0.8002166748046875, -0.74432373046875, -0.6884307861328125, -0.632537841796875, -0.5766448974609375, -0.520751953125, -0.4648590087890625, -0.408966064453125, -0.3530731201171875, -0.29718017578125, -0.2412872314453125, -0.185394287109375, -0.1295013427734375, -0.0736083984375, -0.0177154541015625, 0.038177490234375, 0.0940704345703125, 0.14996337890625, 0.2058563232421875, 0.261749267578125, 0.3176422119140625, 0.37353515625, 0.4294281005859375, 0.485321044921875, 0.5412139892578125, 0.59710693359375, 0.6529998779296875, 0.708892822265625, 0.7647857666015625, 0.8206787109375, 0.8765716552734375, 0.932464599609375, 0.9883575439453125, 1.04425048828125, 1.1001434326171875, 1.156036376953125, 1.2119293212890625, 1.267822265625, 1.3237152099609375, 1.379608154296875, 1.4355010986328125, 1.49139404296875, 1.5472869873046875, 1.603179931640625, 1.6590728759765625, 1.7149658203125, 1.7708587646484375, 1.826751708984375, 1.8826446533203125, 1.93853759765625, 1.9944305419921875, 2.050323486328125, 2.1062164306640625, 2.162109375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 18.0, 22.0, 37.0, 57.0, 100.0, 204.0, 402.0, 844.0, 2624.0, 11695.0, 129346.0, 3905513.0, 127317.0, 11696.0, 2583.0, 911.0, 387.0, 210.0, 113.0, 60.0, 48.0, 33.0, 20.0, 11.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.922271728515625, -3.80157470703125, -3.680877685546875, -3.5601806640625, -3.439483642578125, -3.31878662109375, -3.198089599609375, -3.077392578125, -2.956695556640625, -2.83599853515625, -2.715301513671875, -2.5946044921875, -2.473907470703125, -2.35321044921875, -2.232513427734375, -2.11181640625, -1.991119384765625, -1.87042236328125, -1.749725341796875, -1.6290283203125, -1.508331298828125, -1.38763427734375, -1.266937255859375, -1.146240234375, -1.025543212890625, -0.90484619140625, -0.784149169921875, -0.6634521484375, -0.542755126953125, -0.42205810546875, -0.301361083984375, -0.1806640625, -0.059967041015625, 0.06072998046875, 0.181427001953125, 0.3021240234375, 0.422821044921875, 0.54351806640625, 0.664215087890625, 0.784912109375, 0.905609130859375, 1.02630615234375, 1.147003173828125, 1.2677001953125, 1.388397216796875, 1.50909423828125, 1.629791259765625, 1.75048828125, 1.871185302734375, 1.99188232421875, 2.112579345703125, 2.2332763671875, 2.353973388671875, 2.47467041015625, 2.595367431640625, 2.716064453125, 2.836761474609375, 2.95745849609375, 3.078155517578125, 3.1988525390625, 3.319549560546875, 3.44024658203125, 3.560943603515625, 3.681640625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 18.0, 9.0, 16.0, 29.0, 40.0, 60.0, 78.0, 134.0, 229.0, 509.0, 1385.0, 740.0, 336.0, 139.0, 105.0, 74.0, 54.0, 29.0, 17.0, 8.0, 18.0, 10.0, 8.0, 8.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.49852752685546875, -0.4755706787109375, -0.45261383056640625, -0.429656982421875, -0.40670013427734375, -0.3837432861328125, -0.36078643798828125, -0.33782958984375, -0.31487274169921875, -0.2919158935546875, -0.26895904541015625, -0.246002197265625, -0.22304534912109375, -0.2000885009765625, -0.17713165283203125, -0.1541748046875, -0.13121795654296875, -0.1082611083984375, -0.08530426025390625, -0.062347412109375, -0.03939056396484375, -0.0164337158203125, 0.00652313232421875, 0.02947998046875, 0.05243682861328125, 0.0753936767578125, 0.09835052490234375, 0.121307373046875, 0.14426422119140625, 0.1672210693359375, 0.19017791748046875, 0.213134765625, 0.23609161376953125, 0.2590484619140625, 0.28200531005859375, 0.304962158203125, 0.32791900634765625, 0.3508758544921875, 0.37383270263671875, 0.39678955078125, 0.41974639892578125, 0.4427032470703125, 0.46566009521484375, 0.488616943359375, 0.5115737915039062, 0.5345306396484375, 0.5574874877929688, 0.5804443359375, 0.6034011840820312, 0.6263580322265625, 0.6493148803710938, 0.672271728515625, 0.6952285766601562, 0.7181854248046875, 0.7411422729492188, 0.76409912109375, 0.7870559692382812, 0.8100128173828125, 0.8329696655273438, 0.855926513671875, 0.8788833618164062, 0.9018402099609375, 0.9247970581054688, 0.94775390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 6.0, 8.0, 17.0, 16.0, 21.0, 35.0, 60.0, 75.0, 132.0, 155.0, 118.0, 115.0, 96.0, 46.0, 21.0, 21.0, 12.0, 6.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.8963539600372314, -3.803611993789673, -3.7108700275421143, -3.6181280612945557, -3.525386095046997, -3.4326441287994385, -3.339901924133301, -3.247159957885742, -3.1544179916381836, -3.061676025390625, -2.9689340591430664, -2.876192092895508, -2.783450126647949, -2.6907081604003906, -2.597966194152832, -2.5052242279052734, -2.412482261657715, -2.3197402954101562, -2.2269983291625977, -2.134256362915039, -2.0415143966674805, -1.9487724304199219, -1.8560303449630737, -1.7632883787155151, -1.6705464124679565, -1.577804446220398, -1.4850624799728394, -1.3923203945159912, -1.2995784282684326, -1.206836462020874, -1.1140944957733154, -1.0213525295257568, -0.9286103248596191, -0.8358683586120605, -0.743126392364502, -0.6503843665122986, -0.55764240026474, -0.4649004340171814, -0.372158408164978, -0.27941644191741943, -0.18667447566986084, -0.09393249452114105, -0.0011905133724212646, 0.09155148267745972, 0.1842934489250183, 0.2770354151725769, 0.3697774410247803, 0.46251940727233887, 0.5552613735198975, 0.648003339767456, 0.7407453060150146, 0.833487331867218, 0.9262292981147766, 1.0189712047576904, 1.1117132902145386, 1.2044552564620972, 1.2971972227096558, 1.3899391889572144, 1.482681155204773, 1.575423240661621, 1.6681652069091797, 1.7609071731567383, 1.8536491394042969, 1.9463911056518555, 2.039133071899414]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 10.0, 10.0, 14.0, 8.0, 23.0, 31.0, 54.0, 52.0, 69.0, 67.0, 86.0, 84.0, 86.0, 70.0, 90.0, 59.0, 50.0, 44.0, 21.0, 23.0, 15.0, 8.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8984811305999756, -1.8194431066513062, -1.7404050827026367, -1.6613669395446777, -1.5823289155960083, -1.5032908916473389, -1.4242527484893799, -1.3452147245407104, -1.266176700592041, -1.1871386766433716, -1.1081006526947021, -1.0290625095367432, -0.9500244855880737, -0.8709864616394043, -0.7919483780860901, -0.7129102945327759, -0.6338722705841064, -0.554834246635437, -0.4757961630821228, -0.396758109331131, -0.31772005558013916, -0.23868200182914734, -0.15964394807815552, -0.08060586452484131, -0.001567840576171875, 0.07747021317481995, 0.15650826692581177, 0.2355463206768036, 0.3145843744277954, 0.39362242817878723, 0.47266048192977905, 0.5516985654830933, 0.6307363510131836, 0.709774374961853, 0.7888124585151672, 0.8678505420684814, 0.9468885660171509, 1.0259265899658203, 1.1049647331237793, 1.1840027570724487, 1.2630407810211182, 1.3420788049697876, 1.421116828918457, 1.500154972076416, 1.5791929960250854, 1.6582310199737549, 1.7372691631317139, 1.8163071870803833, 1.8953452110290527, 1.9743832349777222, 2.0534212589263916, 2.1324594020843506, 2.2114973068237305, 2.2905354499816895, 2.3695735931396484, 2.4486117362976074, 2.5276496410369873, 2.6066877841949463, 2.685725688934326, 2.764763832092285, 2.843801975250244, 2.922839879989624, 3.001878023147583, 3.080915927886963, 3.159954071044922]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 8.0, 15.0, 15.0, 35.0, 75.0, 113.0, 240.0, 649.0, 1943.0, 11430.0, 528160.0, 491580.0, 11360.0, 1804.0, 591.0, 225.0, 134.0, 62.0, 36.0, 27.0, 13.0, 15.0, 4.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4267578125, -0.4145622253417969, -0.40236663818359375, -0.3901710510253906, -0.3779754638671875, -0.3657798767089844, -0.35358428955078125, -0.3413887023925781, -0.329193115234375, -0.3169975280761719, -0.30480194091796875, -0.2926063537597656, -0.2804107666015625, -0.2682151794433594, -0.25601959228515625, -0.24382400512695312, -0.23162841796875, -0.21943283081054688, -0.20723724365234375, -0.19504165649414062, -0.1828460693359375, -0.17065048217773438, -0.15845489501953125, -0.14625930786132812, -0.134063720703125, -0.12186813354492188, -0.10967254638671875, -0.09747695922851562, -0.0852813720703125, -0.07308578491210938, -0.06089019775390625, -0.048694610595703125, -0.0364990234375, -0.024303436279296875, -0.01210784912109375, 8.7738037109375e-05, 0.0122833251953125, 0.024478912353515625, 0.03667449951171875, 0.048870086669921875, 0.061065673828125, 0.07326126098632812, 0.08545684814453125, 0.09765243530273438, 0.1098480224609375, 0.12204360961914062, 0.13423919677734375, 0.14643478393554688, 0.15863037109375, 0.17082595825195312, 0.18302154541015625, 0.19521713256835938, 0.2074127197265625, 0.21960830688476562, 0.23180389404296875, 0.24399948120117188, 0.256195068359375, 0.2683906555175781, 0.28058624267578125, 0.2927818298339844, 0.3049774169921875, 0.3171730041503906, 0.32936859130859375, 0.3415641784667969, 0.353759765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 16.0, 9.0, 24.0, 26.0, 56.0, 79.0, 88.0, 117.0, 113.0, 110.0, 117.0, 71.0, 57.0, 39.0, 26.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9306640625, -1.8579864501953125, -1.785308837890625, -1.7126312255859375, -1.63995361328125, -1.5672760009765625, -1.494598388671875, -1.4219207763671875, -1.3492431640625, -1.2765655517578125, -1.203887939453125, -1.1312103271484375, -1.05853271484375, -0.9858551025390625, -0.913177490234375, -0.8404998779296875, -0.767822265625, -0.6951446533203125, -0.622467041015625, -0.5497894287109375, -0.47711181640625, -0.4044342041015625, -0.331756591796875, -0.2590789794921875, -0.1864013671875, -0.1137237548828125, -0.041046142578125, 0.0316314697265625, 0.10430908203125, 0.1769866943359375, 0.249664306640625, 0.3223419189453125, 0.39501953125, 0.4676971435546875, 0.540374755859375, 0.6130523681640625, 0.68572998046875, 0.7584075927734375, 0.831085205078125, 0.9037628173828125, 0.9764404296875, 1.0491180419921875, 1.121795654296875, 1.1944732666015625, 1.26715087890625, 1.3398284912109375, 1.412506103515625, 1.4851837158203125, 1.557861328125, 1.6305389404296875, 1.703216552734375, 1.7758941650390625, 1.84857177734375, 1.9212493896484375, 1.993927001953125, 2.0666046142578125, 2.1392822265625, 2.2119598388671875, 2.284637451171875, 2.3573150634765625, 2.42999267578125, 2.5026702880859375, 2.575347900390625, 2.6480255126953125, 2.720703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 15.0, 8.0, 18.0, 31.0, 34.0, 37.0, 52.0, 57.0, 83.0, 96.0, 126.0, 210.0, 360.0, 909.0, 3873.0, 32108.0, 520308.0, 458045.0, 26672.0, 3554.0, 856.0, 352.0, 198.0, 138.0, 106.0, 68.0, 48.0, 32.0, 29.0, 28.0, 17.0, 17.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.198486328125, -0.1920795440673828, -0.18567276000976562, -0.17926597595214844, -0.17285919189453125, -0.16645240783691406, -0.16004562377929688, -0.1536388397216797, -0.1472320556640625, -0.1408252716064453, -0.13441848754882812, -0.12801170349121094, -0.12160491943359375, -0.11519813537597656, -0.10879135131835938, -0.10238456726074219, -0.095977783203125, -0.08957099914550781, -0.08316421508789062, -0.07675743103027344, -0.07035064697265625, -0.06394386291503906, -0.057537078857421875, -0.05113029479980469, -0.0447235107421875, -0.03831672668457031, -0.031909942626953125, -0.025503158569335938, -0.01909637451171875, -0.012689590454101562, -0.006282806396484375, 0.0001239776611328125, 0.00653076171875, 0.012937545776367188, 0.019344329833984375, 0.025751113891601562, 0.03215789794921875, 0.03856468200683594, 0.044971466064453125, 0.05137825012207031, 0.0577850341796875, 0.06419181823730469, 0.07059860229492188, 0.07700538635253906, 0.08341217041015625, 0.08981895446777344, 0.09622573852539062, 0.10263252258300781, 0.109039306640625, 0.11544609069824219, 0.12185287475585938, 0.12825965881347656, 0.13466644287109375, 0.14107322692871094, 0.14748001098632812, 0.1538867950439453, 0.1602935791015625, 0.1667003631591797, 0.17310714721679688, 0.17951393127441406, 0.18592071533203125, 0.19232749938964844, 0.19873428344726562, 0.2051410675048828, 0.2115478515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 23.0, 13.0, 28.0, 28.0, 46.0, 31.0, 36.0, 34.0, 39.0, 52.0, 35.0, 60.0, 55.0, 42.0, 43.0, 47.0, 51.0, 34.0, 30.0, 28.0, 36.0, 26.0, 28.0, 14.0, 17.0, 13.0, 10.0, 10.0, 4.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.03765869140625, -1.9718017578125, -1.90594482421875, -1.840087890625, -1.77423095703125, -1.7083740234375, -1.64251708984375, -1.57666015625, -1.51080322265625, -1.4449462890625, -1.37908935546875, -1.313232421875, -1.24737548828125, -1.1815185546875, -1.11566162109375, -1.0498046875, -0.98394775390625, -0.9180908203125, -0.85223388671875, -0.786376953125, -0.72052001953125, -0.6546630859375, -0.58880615234375, -0.52294921875, -0.45709228515625, -0.3912353515625, -0.32537841796875, -0.259521484375, -0.19366455078125, -0.1278076171875, -0.06195068359375, 0.00390625, 0.06976318359375, 0.1356201171875, 0.20147705078125, 0.267333984375, 0.33319091796875, 0.3990478515625, 0.46490478515625, 0.53076171875, 0.59661865234375, 0.6624755859375, 0.72833251953125, 0.794189453125, 0.86004638671875, 0.9259033203125, 0.99176025390625, 1.0576171875, 1.12347412109375, 1.1893310546875, 1.25518798828125, 1.321044921875, 1.38690185546875, 1.4527587890625, 1.51861572265625, 1.58447265625, 1.65032958984375, 1.7161865234375, 1.78204345703125, 1.847900390625, 1.91375732421875, 1.9796142578125, 2.04547119140625, 2.111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 11.0, 17.0, 19.0, 42.0, 78.0, 182.0, 537.0, 3739.0, 1036724.0, 6224.0, 618.0, 149.0, 73.0, 38.0, 16.0, 15.0, 15.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11407470703125, -0.10943317413330078, -0.10479164123535156, -0.10015010833740234, -0.09550857543945312, -0.0908670425415039, -0.08622550964355469, -0.08158397674560547, -0.07694244384765625, -0.07230091094970703, -0.06765937805175781, -0.0630178451538086, -0.058376312255859375, -0.053734779357910156, -0.04909324645996094, -0.04445171356201172, -0.0398101806640625, -0.03516864776611328, -0.030527114868164062, -0.025885581970214844, -0.021244049072265625, -0.016602516174316406, -0.011960983276367188, -0.007319450378417969, -0.00267791748046875, 0.0019636154174804688, 0.0066051483154296875, 0.011246681213378906, 0.015888214111328125, 0.020529747009277344, 0.025171279907226562, 0.02981281280517578, 0.034454345703125, 0.03909587860107422, 0.04373741149902344, 0.048378944396972656, 0.053020477294921875, 0.057662010192871094, 0.06230354309082031, 0.06694507598876953, 0.07158660888671875, 0.07622814178466797, 0.08086967468261719, 0.0855112075805664, 0.09015274047851562, 0.09479427337646484, 0.09943580627441406, 0.10407733917236328, 0.1087188720703125, 0.11336040496826172, 0.11800193786621094, 0.12264347076416016, 0.12728500366210938, 0.1319265365600586, 0.1365680694580078, 0.14120960235595703, 0.14585113525390625, 0.15049266815185547, 0.1551342010498047, 0.1597757339477539, 0.16441726684570312, 0.16905879974365234, 0.17370033264160156, 0.17834186553955078, 0.1829833984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 11.0, 12.0, 21.0, 41.0, 56.0, 103.0, 187.0, 182.0, 168.0, 99.0, 49.0, 25.0, 19.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8789043426513672e-05, -2.7995556592941284e-05, -2.7202069759368896e-05, -2.640858292579651e-05, -2.561509609222412e-05, -2.4821609258651733e-05, -2.4028122425079346e-05, -2.3234635591506958e-05, -2.244114875793457e-05, -2.1647661924362183e-05, -2.0854175090789795e-05, -2.0060688257217407e-05, -1.926720142364502e-05, -1.8473714590072632e-05, -1.7680227756500244e-05, -1.6886740922927856e-05, -1.609325408935547e-05, -1.529976725578308e-05, -1.4506280422210693e-05, -1.3712793588638306e-05, -1.2919306755065918e-05, -1.212581992149353e-05, -1.1332333087921143e-05, -1.0538846254348755e-05, -9.745359420776367e-06, -8.95187258720398e-06, -8.158385753631592e-06, -7.364898920059204e-06, -6.571412086486816e-06, -5.777925252914429e-06, -4.984438419342041e-06, -4.190951585769653e-06, -3.3974647521972656e-06, -2.603977918624878e-06, -1.8104910850524902e-06, -1.0170042514801025e-06, -2.2351741790771484e-07, 5.699694156646729e-07, 1.3634562492370605e-06, 2.1569430828094482e-06, 2.950429916381836e-06, 3.7439167499542236e-06, 4.537403583526611e-06, 5.330890417098999e-06, 6.124377250671387e-06, 6.917864084243774e-06, 7.711350917816162e-06, 8.50483775138855e-06, 9.298324584960938e-06, 1.0091811418533325e-05, 1.0885298252105713e-05, 1.16787850856781e-05, 1.2472271919250488e-05, 1.3265758752822876e-05, 1.4059245586395264e-05, 1.4852732419967651e-05, 1.564621925354004e-05, 1.6439706087112427e-05, 1.7233192920684814e-05, 1.8026679754257202e-05, 1.882016658782959e-05, 1.9613653421401978e-05, 2.0407140254974365e-05, 2.1200627088546753e-05, 2.199411392211914e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 12.0, 14.0, 22.0, 38.0, 73.0, 97.0, 206.0, 330.0, 982.0, 5535.0, 868427.0, 167249.0, 3921.0, 857.0, 324.0, 172.0, 87.0, 48.0, 44.0, 20.0, 24.0, 18.0, 14.0, 15.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1578369140625, -0.1535625457763672, -0.14928817749023438, -0.14501380920410156, -0.14073944091796875, -0.13646507263183594, -0.13219070434570312, -0.1279163360595703, -0.1236419677734375, -0.11936759948730469, -0.11509323120117188, -0.11081886291503906, -0.10654449462890625, -0.10227012634277344, -0.09799575805664062, -0.09372138977050781, -0.089447021484375, -0.08517265319824219, -0.08089828491210938, -0.07662391662597656, -0.07234954833984375, -0.06807518005371094, -0.06380081176757812, -0.05952644348144531, -0.0552520751953125, -0.05097770690917969, -0.046703338623046875, -0.04242897033691406, -0.03815460205078125, -0.03388023376464844, -0.029605865478515625, -0.025331497192382812, -0.02105712890625, -0.016782760620117188, -0.012508392333984375, -0.008234024047851562, -0.00395965576171875, 0.0003147125244140625, 0.004589080810546875, 0.008863449096679688, 0.0131378173828125, 0.017412185668945312, 0.021686553955078125, 0.025960922241210938, 0.03023529052734375, 0.03450965881347656, 0.038784027099609375, 0.04305839538574219, 0.047332763671875, 0.05160713195800781, 0.055881500244140625, 0.06015586853027344, 0.06443023681640625, 0.06870460510253906, 0.07297897338867188, 0.07725334167480469, 0.0815277099609375, 0.08580207824707031, 0.09007644653320312, 0.09435081481933594, 0.09862518310546875, 0.10289955139160156, 0.10717391967773438, 0.11144828796386719, 0.11572265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 57.0, 528.0, 312.0, 44.0, 16.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0416259765625, -0.040738701820373535, -0.03985142707824707, -0.038964152336120605, -0.03807687759399414, -0.037189602851867676, -0.03630232810974121, -0.035415053367614746, -0.03452777862548828, -0.033640503883361816, -0.03275322914123535, -0.03186595439910889, -0.030978679656982422, -0.030091404914855957, -0.029204130172729492, -0.028316855430603027, -0.027429580688476562, -0.026542305946350098, -0.025655031204223633, -0.024767756462097168, -0.023880481719970703, -0.02299320697784424, -0.022105932235717773, -0.02121865749359131, -0.020331382751464844, -0.01944410800933838, -0.018556833267211914, -0.01766955852508545, -0.016782283782958984, -0.01589500904083252, -0.015007734298706055, -0.01412045955657959, -0.013233184814453125, -0.01234591007232666, -0.011458635330200195, -0.01057136058807373, -0.009684085845947266, -0.0087968111038208, -0.007909536361694336, -0.007022261619567871, -0.006134986877441406, -0.005247712135314941, -0.0043604373931884766, -0.0034731626510620117, -0.002585887908935547, -0.001698613166809082, -0.0008113384246826172, 7.593631744384766e-05, 0.0009632110595703125, 0.0018504858016967773, 0.002737760543823242, 0.003625035285949707, 0.004512310028076172, 0.005399584770202637, 0.0062868595123291016, 0.007174134254455566, 0.008061408996582031, 0.008948683738708496, 0.009835958480834961, 0.010723233222961426, 0.01161050796508789, 0.012497782707214355, 0.01338505744934082, 0.014272332191467285, 0.01515960693359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 8.0, 10.0, 21.0, 35.0, 67.0, 144.0, 216.0, 213.0, 146.0, 61.0, 23.0, 15.0, 10.0, 18.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1042208671569824, -3.0072691440582275, -2.9103174209594727, -2.8133656978607178, -2.716413974761963, -2.619462251663208, -2.522510528564453, -2.425558567047119, -2.3286070823669434, -2.2316553592681885, -2.1347036361694336, -2.0377519130706787, -1.9408001899719238, -1.843848466873169, -1.7468966245651245, -1.6499449014663696, -1.5529930591583252, -1.4560413360595703, -1.3590896129608154, -1.2621378898620605, -1.1651861667633057, -1.0682344436645508, -0.9712826013565063, -0.8743308782577515, -0.7773791551589966, -0.6804274320602417, -0.5834757089614868, -0.48652392625808716, -0.3895722031593323, -0.2926204800605774, -0.19566869735717773, -0.09871697425842285, -0.0017652511596679688, 0.09518648684024811, 0.19213822484016418, 0.28908997774124146, 0.38604170083999634, 0.4829934239387512, 0.5799452066421509, 0.6768969297409058, 0.7738486528396606, 0.8708003759384155, 0.9677520990371704, 1.0647039413452148, 1.1616556644439697, 1.2586073875427246, 1.3555591106414795, 1.4525108337402344, 1.5494625568389893, 1.6464142799377441, 1.743366003036499, 1.840317726135254, 1.9372694492340088, 2.0342211723327637, 2.1311731338500977, 2.2281246185302734, 2.3250765800476074, 2.4220283031463623, 2.518980026245117, 2.615931749343872, 2.712883472442627, 2.809835195541382, 2.9067869186401367, 3.0037388801574707, 3.1006903648376465]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 12.0, 12.0, 15.0, 22.0, 28.0, 58.0, 64.0, 88.0, 108.0, 108.0, 99.0, 100.0, 83.0, 64.0, 52.0, 28.0, 16.0, 13.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5358527898788452, -1.4713879823684692, -1.4069232940673828, -1.3424584865570068, -1.2779936790466309, -1.2135288715362549, -1.1490641832351685, -1.0845993757247925, -1.020134687423706, -0.9556699395179749, -0.8912051320075989, -0.8267403841018677, -0.7622755765914917, -0.6978108286857605, -0.6333460807800293, -0.5688812732696533, -0.5044164657592773, -0.43995168805122375, -0.37548691034317017, -0.31102216243743896, -0.24655738472938538, -0.1820926070213318, -0.11762785911560059, -0.053163081407547, 0.011301696300506592, 0.07576646655797958, 0.14023123681545258, 0.20469599962234497, 0.26916077733039856, 0.33362555503845215, 0.39809030294418335, 0.46255508065223694, 0.5270199775695801, 0.5914847254753113, 0.6559495329856873, 0.7204142808914185, 0.7848790884017944, 0.8493438363075256, 0.9138085842132568, 0.9782733917236328, 1.0427381992340088, 1.1072030067443848, 1.1716676950454712, 1.2361325025558472, 1.3005973100662231, 1.3650619983673096, 1.4295268058776855, 1.4939916133880615, 1.558456301689148, 1.622921109199524, 1.6873857975006104, 1.7518506050109863, 1.8163154125213623, 1.8807802200317383, 1.9452449083328247, 2.009709596633911, 2.074174404144287, 2.138639211654663, 2.203104019165039, 2.267568588256836, 2.332033395767212, 2.396498203277588, 2.460963010787964, 2.52542781829834, 2.589892625808716]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 13.0, 14.0, 22.0, 30.0, 61.0, 101.0, 192.0, 408.0, 970.0, 2563.0, 8018.0, 38611.0, 637087.0, 323312.0, 27308.0, 6223.0, 2036.0, 824.0, 307.0, 203.0, 89.0, 65.0, 28.0, 24.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9249496459960938, -0.8845672607421875, -0.8441848754882812, -0.803802490234375, -0.7634201049804688, -0.7230377197265625, -0.6826553344726562, -0.64227294921875, -0.6018905639648438, -0.5615081787109375, -0.5211257934570312, -0.480743408203125, -0.44036102294921875, -0.3999786376953125, -0.35959625244140625, -0.3192138671875, -0.27883148193359375, -0.2384490966796875, -0.19806671142578125, -0.157684326171875, -0.11730194091796875, -0.0769195556640625, -0.03653717041015625, 0.00384521484375, 0.04422760009765625, 0.0846099853515625, 0.12499237060546875, 0.165374755859375, 0.20575714111328125, 0.2461395263671875, 0.28652191162109375, 0.326904296875, 0.36728668212890625, 0.4076690673828125, 0.44805145263671875, 0.488433837890625, 0.5288162231445312, 0.5691986083984375, 0.6095809936523438, 0.64996337890625, 0.6903457641601562, 0.7307281494140625, 0.7711105346679688, 0.811492919921875, 0.8518753051757812, 0.8922576904296875, 0.9326400756835938, 0.9730224609375, 1.0134048461914062, 1.0537872314453125, 1.0941696166992188, 1.134552001953125, 1.1749343872070312, 1.2153167724609375, 1.2556991577148438, 1.29608154296875, 1.3364639282226562, 1.3768463134765625, 1.4172286987304688, 1.457611083984375, 1.4979934692382812, 1.5383758544921875, 1.5787582397460938, 1.619140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 8.0, 13.0, 14.0, 17.0, 34.0, 40.0, 58.0, 57.0, 88.0, 84.0, 100.0, 91.0, 91.0, 65.0, 63.0, 43.0, 41.0, 26.0, 19.0, 7.0, 3.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.46807861328125, -2.3541259765625, -2.24017333984375, -2.126220703125, -2.01226806640625, -1.8983154296875, -1.78436279296875, -1.67041015625, -1.55645751953125, -1.4425048828125, -1.32855224609375, -1.214599609375, -1.10064697265625, -0.9866943359375, -0.87274169921875, -0.7587890625, -0.64483642578125, -0.5308837890625, -0.41693115234375, -0.302978515625, -0.18902587890625, -0.0750732421875, 0.03887939453125, 0.15283203125, 0.26678466796875, 0.3807373046875, 0.49468994140625, 0.608642578125, 0.72259521484375, 0.8365478515625, 0.95050048828125, 1.064453125, 1.17840576171875, 1.2923583984375, 1.40631103515625, 1.520263671875, 1.63421630859375, 1.7481689453125, 1.86212158203125, 1.97607421875, 2.09002685546875, 2.2039794921875, 2.31793212890625, 2.431884765625, 2.54583740234375, 2.6597900390625, 2.77374267578125, 2.8876953125, 3.00164794921875, 3.1156005859375, 3.22955322265625, 3.343505859375, 3.45745849609375, 3.5714111328125, 3.68536376953125, 3.79931640625, 3.91326904296875, 4.0272216796875, 4.14117431640625, 4.255126953125, 4.36907958984375, 4.4830322265625, 4.59698486328125, 4.7109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 7.0, 11.0, 14.0, 19.0, 22.0, 33.0, 41.0, 76.0, 91.0, 182.0, 340.0, 1050.0, 8592.0, 942608.0, 91489.0, 2736.0, 602.0, 227.0, 114.0, 73.0, 55.0, 33.0, 22.0, 19.0, 26.0, 10.0, 12.0, 9.0, 6.0, 2.0, 8.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.7734375, -2.693695068359375, -2.61395263671875, -2.534210205078125, -2.4544677734375, -2.374725341796875, -2.29498291015625, -2.215240478515625, -2.135498046875, -2.055755615234375, -1.97601318359375, -1.896270751953125, -1.8165283203125, -1.736785888671875, -1.65704345703125, -1.577301025390625, -1.49755859375, -1.417816162109375, -1.33807373046875, -1.258331298828125, -1.1785888671875, -1.098846435546875, -1.01910400390625, -0.939361572265625, -0.859619140625, -0.779876708984375, -0.70013427734375, -0.620391845703125, -0.5406494140625, -0.460906982421875, -0.38116455078125, -0.301422119140625, -0.2216796875, -0.141937255859375, -0.06219482421875, 0.017547607421875, 0.0972900390625, 0.177032470703125, 0.25677490234375, 0.336517333984375, 0.416259765625, 0.496002197265625, 0.57574462890625, 0.655487060546875, 0.7352294921875, 0.814971923828125, 0.89471435546875, 0.974456787109375, 1.05419921875, 1.133941650390625, 1.21368408203125, 1.293426513671875, 1.3731689453125, 1.452911376953125, 1.53265380859375, 1.612396240234375, 1.692138671875, 1.771881103515625, 1.85162353515625, 1.931365966796875, 2.0111083984375, 2.090850830078125, 2.17059326171875, 2.250335693359375, 2.330078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 14.0, 10.0, 9.0, 7.0, 17.0, 11.0, 32.0, 22.0, 26.0, 40.0, 48.0, 53.0, 52.0, 60.0, 65.0, 54.0, 59.0, 65.0, 46.0, 42.0, 40.0, 40.0, 26.0, 22.0, 29.0, 22.0, 21.0, 13.0, 12.0, 4.0, 4.0, 8.0, 9.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.501953125, -3.401214599609375, -3.30047607421875, -3.199737548828125, -3.0989990234375, -2.998260498046875, -2.89752197265625, -2.796783447265625, -2.696044921875, -2.595306396484375, -2.49456787109375, -2.393829345703125, -2.2930908203125, -2.192352294921875, -2.09161376953125, -1.990875244140625, -1.89013671875, -1.789398193359375, -1.68865966796875, -1.587921142578125, -1.4871826171875, -1.386444091796875, -1.28570556640625, -1.184967041015625, -1.084228515625, -0.983489990234375, -0.88275146484375, -0.782012939453125, -0.6812744140625, -0.580535888671875, -0.47979736328125, -0.379058837890625, -0.2783203125, -0.177581787109375, -0.07684326171875, 0.023895263671875, 0.1246337890625, 0.225372314453125, 0.32611083984375, 0.426849365234375, 0.527587890625, 0.628326416015625, 0.72906494140625, 0.829803466796875, 0.9305419921875, 1.031280517578125, 1.13201904296875, 1.232757568359375, 1.33349609375, 1.434234619140625, 1.53497314453125, 1.635711669921875, 1.7364501953125, 1.837188720703125, 1.93792724609375, 2.038665771484375, 2.139404296875, 2.240142822265625, 2.34088134765625, 2.441619873046875, 2.5423583984375, 2.643096923828125, 2.74383544921875, 2.844573974609375, 2.9453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 12.0, 30.0, 31.0, 57.0, 130.0, 221.0, 436.0, 1068.0, 3990.0, 28863.0, 876714.0, 122806.0, 10578.0, 2092.0, 739.0, 311.0, 168.0, 80.0, 65.0, 35.0, 35.0, 19.0, 14.0, 5.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83447265625, -0.8129501342773438, -0.7914276123046875, -0.7699050903320312, -0.748382568359375, -0.7268600463867188, -0.7053375244140625, -0.6838150024414062, -0.66229248046875, -0.6407699584960938, -0.6192474365234375, -0.5977249145507812, -0.576202392578125, -0.5546798706054688, -0.5331573486328125, -0.5116348266601562, -0.4901123046875, -0.46858978271484375, -0.4470672607421875, -0.42554473876953125, -0.404022216796875, -0.38249969482421875, -0.3609771728515625, -0.33945465087890625, -0.31793212890625, -0.29640960693359375, -0.2748870849609375, -0.25336456298828125, -0.231842041015625, -0.21031951904296875, -0.1887969970703125, -0.16727447509765625, -0.145751953125, -0.12422943115234375, -0.1027069091796875, -0.08118438720703125, -0.059661865234375, -0.03813934326171875, -0.0166168212890625, 0.00490570068359375, 0.02642822265625, 0.04795074462890625, 0.0694732666015625, 0.09099578857421875, 0.112518310546875, 0.13404083251953125, 0.1555633544921875, 0.17708587646484375, 0.1986083984375, 0.22013092041015625, 0.2416534423828125, 0.26317596435546875, 0.284698486328125, 0.30622100830078125, 0.3277435302734375, 0.34926605224609375, 0.37078857421875, 0.39231109619140625, 0.4138336181640625, 0.43535614013671875, 0.456878662109375, 0.47840118408203125, 0.4999237060546875, 0.5214462280273438, 0.54296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 7.0, 9.0, 9.0, 21.0, 22.0, 24.0, 30.0, 48.0, 129.0, 324.0, 148.0, 74.0, 40.0, 35.0, 23.0, 13.0, 11.0, 9.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.611513137817383e-05, -7.384642958641052e-05, -7.157772779464722e-05, -6.930902600288391e-05, -6.70403242111206e-05, -6.47716224193573e-05, -6.2502920627594e-05, -6.023421883583069e-05, -5.796551704406738e-05, -5.569681525230408e-05, -5.342811346054077e-05, -5.1159411668777466e-05, -4.889070987701416e-05, -4.6622008085250854e-05, -4.435330629348755e-05, -4.208460450172424e-05, -3.981590270996094e-05, -3.754720091819763e-05, -3.5278499126434326e-05, -3.300979733467102e-05, -3.0741095542907715e-05, -2.847239375114441e-05, -2.6203691959381104e-05, -2.3934990167617798e-05, -2.1666288375854492e-05, -1.9397586584091187e-05, -1.712888479232788e-05, -1.4860183000564575e-05, -1.259148120880127e-05, -1.0322779417037964e-05, -8.054077625274658e-06, -5.7853758335113525e-06, -3.516674041748047e-06, -1.2479722499847412e-06, 1.0207295417785645e-06, 3.28943133354187e-06, 5.558133125305176e-06, 7.826834917068481e-06, 1.0095536708831787e-05, 1.2364238500595093e-05, 1.4632940292358398e-05, 1.6901642084121704e-05, 1.917034387588501e-05, 2.1439045667648315e-05, 2.370774745941162e-05, 2.5976449251174927e-05, 2.8245151042938232e-05, 3.0513852834701538e-05, 3.2782554626464844e-05, 3.505125641822815e-05, 3.7319958209991455e-05, 3.958866000175476e-05, 4.1857361793518066e-05, 4.412606358528137e-05, 4.639476537704468e-05, 4.8663467168807983e-05, 5.093216896057129e-05, 5.3200870752334595e-05, 5.54695725440979e-05, 5.7738274335861206e-05, 6.000697612762451e-05, 6.227567791938782e-05, 6.454437971115112e-05, 6.681308150291443e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 16.0, 18.0, 19.0, 33.0, 35.0, 56.0, 73.0, 167.0, 285.0, 546.0, 1393.0, 4731.0, 25177.0, 774678.0, 217716.0, 17747.0, 3625.0, 1119.0, 468.0, 245.0, 137.0, 87.0, 52.0, 37.0, 17.0, 20.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.681640625, -0.6609268188476562, -0.6402130126953125, -0.6194992065429688, -0.598785400390625, -0.5780715942382812, -0.5573577880859375, -0.5366439819335938, -0.51593017578125, -0.49521636962890625, -0.4745025634765625, -0.45378875732421875, -0.433074951171875, -0.41236114501953125, -0.3916473388671875, -0.37093353271484375, -0.3502197265625, -0.32950592041015625, -0.3087921142578125, -0.28807830810546875, -0.267364501953125, -0.24665069580078125, -0.2259368896484375, -0.20522308349609375, -0.18450927734375, -0.16379547119140625, -0.1430816650390625, -0.12236785888671875, -0.101654052734375, -0.08094024658203125, -0.0602264404296875, -0.03951263427734375, -0.018798828125, 0.00191497802734375, 0.0226287841796875, 0.04334259033203125, 0.064056396484375, 0.08477020263671875, 0.1054840087890625, 0.12619781494140625, 0.14691162109375, 0.16762542724609375, 0.1883392333984375, 0.20905303955078125, 0.229766845703125, 0.25048065185546875, 0.2711944580078125, 0.29190826416015625, 0.3126220703125, 0.33333587646484375, 0.3540496826171875, 0.37476348876953125, 0.395477294921875, 0.41619110107421875, 0.4369049072265625, 0.45761871337890625, 0.47833251953125, 0.49904632568359375, 0.5197601318359375, 0.5404739379882812, 0.561187744140625, 0.5819015502929688, 0.6026153564453125, 0.6233291625976562, 0.64404296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 4.0, 11.0, 4.0, 12.0, 18.0, 21.0, 31.0, 55.0, 95.0, 399.0, 157.0, 61.0, 38.0, 17.0, 20.0, 14.0, 7.0, 10.0, 5.0, 4.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2993812561035156, -0.29236602783203125, -0.2853507995605469, -0.2783355712890625, -0.2713203430175781, -0.26430511474609375, -0.2572898864746094, -0.250274658203125, -0.24325942993164062, -0.23624420166015625, -0.22922897338867188, -0.2222137451171875, -0.21519851684570312, -0.20818328857421875, -0.20116806030273438, -0.19415283203125, -0.18713760375976562, -0.18012237548828125, -0.17310714721679688, -0.1660919189453125, -0.15907669067382812, -0.15206146240234375, -0.14504623413085938, -0.138031005859375, -0.13101577758789062, -0.12400054931640625, -0.11698532104492188, -0.1099700927734375, -0.10295486450195312, -0.09593963623046875, -0.08892440795898438, -0.0819091796875, -0.07489395141601562, -0.06787872314453125, -0.060863494873046875, -0.0538482666015625, -0.046833038330078125, -0.03981781005859375, -0.032802581787109375, -0.025787353515625, -0.018772125244140625, -0.01175689697265625, -0.004741668701171875, 0.0022735595703125, 0.009288787841796875, 0.01630401611328125, 0.023319244384765625, 0.03033447265625, 0.037349700927734375, 0.04436492919921875, 0.051380157470703125, 0.0583953857421875, 0.06541061401367188, 0.07242584228515625, 0.07944107055664062, 0.086456298828125, 0.09347152709960938, 0.10048675537109375, 0.10750198364257812, 0.1145172119140625, 0.12153244018554688, 0.12854766845703125, 0.13556289672851562, 0.142578125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 38.0, 187.0, 502.0, 195.0, 45.0, 18.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.789307594299316, -5.288122653961182, -4.786938190460205, -4.28575325012207, -3.7845685482025146, -3.283383846282959, -2.782198905944824, -2.2810142040252686, -1.779829502105713, -1.2786448001861572, -0.777459979057312, -0.2762751579284668, 0.22490954399108887, 0.7260942459106445, 1.2272791862487793, 1.728463888168335, 2.2296485900878906, 2.7308332920074463, 3.232017993927002, 3.7332029342651367, 4.234387397766113, 4.735572338104248, 5.236757278442383, 5.737941741943359, 6.239126682281494, 6.740311622619629, 7.2414960861206055, 7.74268102645874, 8.243865966796875, 8.745050430297852, 9.246234893798828, 9.747420310974121, 10.248603820800781, 10.749788284301758, 11.25097370147705, 11.752158164978027, 12.253342628479004, 12.754528045654297, 13.255712509155273, 13.75689697265625, 14.258081436157227, 14.759265899658203, 15.260451316833496, 15.761635780334473, 16.262821197509766, 16.764005661010742, 17.26519012451172, 17.766374588012695, 18.267559051513672, 18.76874351501465, 19.269927978515625, 19.771114349365234, 20.27229881286621, 20.773483276367188, 21.274667739868164, 21.77585220336914, 22.27703857421875, 22.778223037719727, 23.279407501220703, 23.780593872070312, 24.28177833557129, 24.782962799072266, 25.284147262573242, 25.78533172607422, 26.286516189575195]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 9.0, 15.0, 7.0, 18.0, 22.0, 24.0, 31.0, 43.0, 43.0, 38.0, 42.0, 46.0, 52.0, 44.0, 45.0, 46.0, 54.0, 34.0, 41.0, 45.0, 42.0, 31.0, 31.0, 35.0, 32.0, 20.0, 22.0, 12.0, 13.0, 10.0, 11.0, 0.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.844492435455322, -4.684164524078369, -4.523837089538574, -4.363509178161621, -4.203181743621826, -4.042853832244873, -3.882526159286499, -3.722198486328125, -3.561870574951172, -3.401542901992798, -3.241215229034424, -3.0808873176574707, -2.9205596446990967, -2.7602319717407227, -2.5999042987823486, -2.4395766258239746, -2.2792489528656006, -2.1189212799072266, -1.958593487739563, -1.798265814781189, -1.6379380226135254, -1.4776103496551514, -1.3172826766967773, -1.1569548845291138, -0.9966272115707397, -0.836299479007721, -0.6759717464447021, -0.5156440734863281, -0.3553163409233093, -0.19498860836029053, -0.034660935401916504, 0.12566685676574707, 0.2859945297241211, 0.4463222622871399, 0.6066499948501587, 0.7669776678085327, 0.9273054003715515, 1.0876331329345703, 1.2479608058929443, 1.408288598060608, 1.568616271018982, 1.728943943977356, 1.8892717361450195, 2.0495994091033936, 2.2099270820617676, 2.3702549934387207, 2.5305824279785156, 2.6909103393554688, 2.8512380123138428, 3.011565685272217, 3.171893358230591, 3.332221031188965, 3.492548942565918, 3.652876615524292, 3.813204288482666, 3.973532199859619, 4.133859634399414, 4.294187545776367, 4.454514980316162, 4.614842891693115, 4.77517032623291, 4.935498237609863, 5.095826148986816, 5.256153583526611, 5.4164814949035645]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 15.0, 15.0, 14.0, 17.0, 26.0, 31.0, 44.0, 66.0, 103.0, 172.0, 243.0, 422.0, 953.0, 2078.0, 6010.0, 22741.0, 176040.0, 3697579.0, 250267.0, 26341.0, 6566.0, 2241.0, 952.0, 495.0, 284.0, 161.0, 97.0, 88.0, 37.0, 41.0, 40.0, 24.0, 16.0, 10.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.60546875, -2.52020263671875, -2.4349365234375, -2.34967041015625, -2.264404296875, -2.17913818359375, -2.0938720703125, -2.00860595703125, -1.92333984375, -1.83807373046875, -1.7528076171875, -1.66754150390625, -1.582275390625, -1.49700927734375, -1.4117431640625, -1.32647705078125, -1.2412109375, -1.15594482421875, -1.0706787109375, -0.98541259765625, -0.900146484375, -0.81488037109375, -0.7296142578125, -0.64434814453125, -0.55908203125, -0.47381591796875, -0.3885498046875, -0.30328369140625, -0.218017578125, -0.13275146484375, -0.0474853515625, 0.03778076171875, 0.123046875, 0.20831298828125, 0.2935791015625, 0.37884521484375, 0.464111328125, 0.54937744140625, 0.6346435546875, 0.71990966796875, 0.80517578125, 0.89044189453125, 0.9757080078125, 1.06097412109375, 1.146240234375, 1.23150634765625, 1.3167724609375, 1.40203857421875, 1.4873046875, 1.57257080078125, 1.6578369140625, 1.74310302734375, 1.828369140625, 1.91363525390625, 1.9989013671875, 2.08416748046875, 2.16943359375, 2.25469970703125, 2.3399658203125, 2.42523193359375, 2.510498046875, 2.59576416015625, 2.6810302734375, 2.76629638671875, 2.8515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 1.0, 3.0, 8.0, 14.0, 20.0, 24.0, 46.0, 69.0, 85.0, 115.0, 148.0, 107.0, 109.0, 76.0, 56.0, 35.0, 27.0, 19.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.02960205078125, -1.9537353515625, -1.87786865234375, -1.802001953125, -1.72613525390625, -1.6502685546875, -1.57440185546875, -1.49853515625, -1.42266845703125, -1.3468017578125, -1.27093505859375, -1.195068359375, -1.11920166015625, -1.0433349609375, -0.96746826171875, -0.8916015625, -0.81573486328125, -0.7398681640625, -0.66400146484375, -0.588134765625, -0.51226806640625, -0.4364013671875, -0.36053466796875, -0.28466796875, -0.20880126953125, -0.1329345703125, -0.05706787109375, 0.018798828125, 0.09466552734375, 0.1705322265625, 0.24639892578125, 0.322265625, 0.39813232421875, 0.4739990234375, 0.54986572265625, 0.625732421875, 0.70159912109375, 0.7774658203125, 0.85333251953125, 0.92919921875, 1.00506591796875, 1.0809326171875, 1.15679931640625, 1.232666015625, 1.30853271484375, 1.3843994140625, 1.46026611328125, 1.5361328125, 1.61199951171875, 1.6878662109375, 1.76373291015625, 1.839599609375, 1.91546630859375, 1.9913330078125, 2.06719970703125, 2.14306640625, 2.21893310546875, 2.2947998046875, 2.37066650390625, 2.446533203125, 2.52239990234375, 2.5982666015625, 2.67413330078125, 2.75]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 9.0, 8.0, 11.0, 30.0, 52.0, 78.0, 127.0, 242.0, 515.0, 1633.0, 9900.0, 256773.0, 3883314.0, 36226.0, 3615.0, 905.0, 357.0, 175.0, 106.0, 70.0, 44.0, 27.0, 12.0, 15.0, 7.0, 9.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.3668212890625, -4.186767578125, -4.0067138671875, -3.82666015625, -3.6466064453125, -3.466552734375, -3.2864990234375, -3.1064453125, -2.9263916015625, -2.746337890625, -2.5662841796875, -2.38623046875, -2.2061767578125, -2.026123046875, -1.8460693359375, -1.666015625, -1.4859619140625, -1.305908203125, -1.1258544921875, -0.94580078125, -0.7657470703125, -0.585693359375, -0.4056396484375, -0.2255859375, -0.0455322265625, 0.134521484375, 0.3145751953125, 0.49462890625, 0.6746826171875, 0.854736328125, 1.0347900390625, 1.21484375, 1.3948974609375, 1.574951171875, 1.7550048828125, 1.93505859375, 2.1151123046875, 2.295166015625, 2.4752197265625, 2.6552734375, 2.8353271484375, 3.015380859375, 3.1954345703125, 3.37548828125, 3.5555419921875, 3.735595703125, 3.9156494140625, 4.095703125, 4.2757568359375, 4.455810546875, 4.6358642578125, 4.81591796875, 4.9959716796875, 5.176025390625, 5.3560791015625, 5.5361328125, 5.7161865234375, 5.896240234375, 6.0762939453125, 6.25634765625, 6.4364013671875, 6.616455078125, 6.7965087890625, 6.9765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 11.0, 22.0, 39.0, 80.0, 85.0, 221.0, 600.0, 1618.0, 769.0, 288.0, 134.0, 86.0, 42.0, 20.0, 17.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.543853759765625, -1.50762939453125, -1.471405029296875, -1.4351806640625, -1.398956298828125, -1.36273193359375, -1.326507568359375, -1.290283203125, -1.254058837890625, -1.21783447265625, -1.181610107421875, -1.1453857421875, -1.109161376953125, -1.07293701171875, -1.036712646484375, -1.00048828125, -0.964263916015625, -0.92803955078125, -0.891815185546875, -0.8555908203125, -0.819366455078125, -0.78314208984375, -0.746917724609375, -0.710693359375, -0.674468994140625, -0.63824462890625, -0.602020263671875, -0.5657958984375, -0.529571533203125, -0.49334716796875, -0.457122802734375, -0.4208984375, -0.384674072265625, -0.34844970703125, -0.312225341796875, -0.2760009765625, -0.239776611328125, -0.20355224609375, -0.167327880859375, -0.131103515625, -0.094879150390625, -0.05865478515625, -0.022430419921875, 0.0137939453125, 0.050018310546875, 0.08624267578125, 0.122467041015625, 0.15869140625, 0.194915771484375, 0.23114013671875, 0.267364501953125, 0.3035888671875, 0.339813232421875, 0.37603759765625, 0.412261962890625, 0.448486328125, 0.484710693359375, 0.52093505859375, 0.557159423828125, 0.5933837890625, 0.629608154296875, 0.66583251953125, 0.702056884765625, 0.73828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 10.0, 4.0, 15.0, 17.0, 27.0, 46.0, 89.0, 114.0, 128.0, 153.0, 118.0, 109.0, 65.0, 33.0, 23.0, 16.0, 8.0, 12.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.197394371032715, -4.085183143615723, -3.9729719161987305, -3.860760450363159, -3.748549222946167, -3.636337995529175, -3.5241265296936035, -3.4119153022766113, -3.299704074859619, -3.187492847442627, -3.0752816200256348, -2.9630701541900635, -2.8508589267730713, -2.738647699356079, -2.626436233520508, -2.5142250061035156, -2.4020137786865234, -2.2898025512695312, -2.177591323852539, -2.0653798580169678, -1.9531686305999756, -1.8409574031829834, -1.7287460565567017, -1.61653470993042, -1.5043234825134277, -1.3921122550964355, -1.2799009084701538, -1.167689561843872, -1.0554783344268799, -0.9432670474052429, -0.831055760383606, -0.718844473361969, -0.6066329479217529, -0.49442166090011597, -0.382210373878479, -0.26999908685684204, -0.15778779983520508, -0.045576512813568115, 0.06663477420806885, 0.1788460612297058, 0.2910573482513428, 0.40326863527297974, 0.5154799222946167, 0.6276912093162537, 0.7399024963378906, 0.8521137833595276, 0.9643250703811646, 1.0765364170074463, 1.1887476444244385, 1.3009588718414307, 1.4131702184677124, 1.5253815650939941, 1.6375927925109863, 1.7498040199279785, 1.8620153665542603, 1.974226713180542, 2.086437940597534, 2.1986491680145264, 2.3108606338500977, 2.42307186126709, 2.535283088684082, 2.647494316101074, 2.7597055435180664, 2.8719170093536377, 2.98412823677063]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 16.0, 6.0, 13.0, 19.0, 27.0, 24.0, 33.0, 46.0, 55.0, 52.0, 52.0, 61.0, 75.0, 79.0, 62.0, 70.0, 56.0, 50.0, 26.0, 43.0, 45.0, 23.0, 16.0, 13.0, 13.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341423749923706, -1.4624698162078857, -1.3907971382141113, -1.3191245794296265, -1.2474520206451416, -1.1757793426513672, -1.1041067838668823, -1.0324342250823975, -0.9607616066932678, -0.8890889883041382, -0.8174164295196533, -0.7457438111305237, -0.674071192741394, -0.6023986339569092, -0.5307260155677795, -0.4590534567832947, -0.38738083839416504, -0.3157082498073578, -0.24403564631938934, -0.1723630428314209, -0.10069045424461365, -0.029017865657806396, 0.04265475273132324, 0.1143273115158081, 0.18599992990493774, 0.257672518491745, 0.32934510707855225, 0.4010177254676819, 0.47269031405448914, 0.5443629026412964, 0.616035521030426, 0.6877080798149109, 0.759380578994751, 0.8310531973838806, 0.9027257561683655, 0.9743983745574951, 1.04607093334198, 1.1177434921264648, 1.1894161701202393, 1.2610887289047241, 1.332761287689209, 1.4044338464736938, 1.4761065244674683, 1.5477790832519531, 1.619451642036438, 1.6911242008209229, 1.7627968788146973, 1.8344694375991821, 1.9061421155929565, 1.9778146743774414, 2.049487352371216, 2.1211600303649902, 2.1928324699401855, 2.26450514793396, 2.3361778259277344, 2.4078502655029297, 2.479522943496704, 2.5511956214904785, 2.622868061065674, 2.6945407390594482, 2.7662134170532227, 2.837885856628418, 2.9095585346221924, 2.981231212615967, 3.052903652191162]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 7.0, 11.0, 8.0, 28.0, 42.0, 51.0, 86.0, 118.0, 178.0, 358.0, 654.0, 1396.0, 4644.0, 45974.0, 868781.0, 115027.0, 7473.0, 1882.0, 745.0, 435.0, 239.0, 126.0, 99.0, 66.0, 49.0, 21.0, 16.0, 3.0, 7.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4521484375, -0.43829345703125, -0.4244384765625, -0.41058349609375, -0.396728515625, -0.38287353515625, -0.3690185546875, -0.35516357421875, -0.34130859375, -0.32745361328125, -0.3135986328125, -0.29974365234375, -0.285888671875, -0.27203369140625, -0.2581787109375, -0.24432373046875, -0.23046875, -0.21661376953125, -0.2027587890625, -0.18890380859375, -0.175048828125, -0.16119384765625, -0.1473388671875, -0.13348388671875, -0.11962890625, -0.10577392578125, -0.0919189453125, -0.07806396484375, -0.064208984375, -0.05035400390625, -0.0364990234375, -0.02264404296875, -0.0087890625, 0.00506591796875, 0.0189208984375, 0.03277587890625, 0.046630859375, 0.06048583984375, 0.0743408203125, 0.08819580078125, 0.10205078125, 0.11590576171875, 0.1297607421875, 0.14361572265625, 0.157470703125, 0.17132568359375, 0.1851806640625, 0.19903564453125, 0.212890625, 0.22674560546875, 0.2406005859375, 0.25445556640625, 0.268310546875, 0.28216552734375, 0.2960205078125, 0.30987548828125, 0.32373046875, 0.33758544921875, 0.3514404296875, 0.36529541015625, 0.379150390625, 0.39300537109375, 0.4068603515625, 0.42071533203125, 0.4345703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 14.0, 10.0, 15.0, 15.0, 26.0, 41.0, 39.0, 49.0, 55.0, 73.0, 73.0, 65.0, 68.0, 76.0, 64.0, 69.0, 53.0, 44.0, 35.0, 34.0, 18.0, 15.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4208984375, -1.3621063232421875, -1.303314208984375, -1.2445220947265625, -1.18572998046875, -1.1269378662109375, -1.068145751953125, -1.0093536376953125, -0.9505615234375, -0.8917694091796875, -0.832977294921875, -0.7741851806640625, -0.71539306640625, -0.6566009521484375, -0.597808837890625, -0.5390167236328125, -0.480224609375, -0.4214324951171875, -0.362640380859375, -0.3038482666015625, -0.24505615234375, -0.1862640380859375, -0.127471923828125, -0.0686798095703125, -0.0098876953125, 0.0489044189453125, 0.107696533203125, 0.1664886474609375, 0.22528076171875, 0.2840728759765625, 0.342864990234375, 0.4016571044921875, 0.46044921875, 0.5192413330078125, 0.578033447265625, 0.6368255615234375, 0.69561767578125, 0.7544097900390625, 0.813201904296875, 0.8719940185546875, 0.9307861328125, 0.9895782470703125, 1.048370361328125, 1.1071624755859375, 1.16595458984375, 1.2247467041015625, 1.283538818359375, 1.3423309326171875, 1.401123046875, 1.4599151611328125, 1.518707275390625, 1.5774993896484375, 1.63629150390625, 1.6950836181640625, 1.753875732421875, 1.8126678466796875, 1.8714599609375, 1.9302520751953125, 1.989044189453125, 2.0478363037109375, 2.10662841796875, 2.1654205322265625, 2.224212646484375, 2.2830047607421875, 2.341796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 5.0, 8.0, 5.0, 11.0, 12.0, 23.0, 22.0, 31.0, 53.0, 64.0, 74.0, 100.0, 157.0, 268.0, 445.0, 984.0, 3913.0, 30603.0, 445018.0, 523953.0, 35686.0, 4715.0, 1091.0, 402.0, 264.0, 172.0, 125.0, 94.0, 69.0, 37.0, 23.0, 24.0, 19.0, 12.0, 15.0, 12.0, 7.0, 5.0, 6.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.237060546875, -0.2296600341796875, -0.222259521484375, -0.2148590087890625, -0.20745849609375, -0.2000579833984375, -0.192657470703125, -0.1852569580078125, -0.1778564453125, -0.1704559326171875, -0.163055419921875, -0.1556549072265625, -0.14825439453125, -0.1408538818359375, -0.133453369140625, -0.1260528564453125, -0.11865234375, -0.1112518310546875, -0.103851318359375, -0.0964508056640625, -0.08905029296875, -0.0816497802734375, -0.074249267578125, -0.0668487548828125, -0.0594482421875, -0.0520477294921875, -0.044647216796875, -0.0372467041015625, -0.02984619140625, -0.0224456787109375, -0.015045166015625, -0.0076446533203125, -0.000244140625, 0.0071563720703125, 0.014556884765625, 0.0219573974609375, 0.02935791015625, 0.0367584228515625, 0.044158935546875, 0.0515594482421875, 0.0589599609375, 0.0663604736328125, 0.073760986328125, 0.0811614990234375, 0.08856201171875, 0.0959625244140625, 0.103363037109375, 0.1107635498046875, 0.1181640625, 0.1255645751953125, 0.132965087890625, 0.1403656005859375, 0.14776611328125, 0.1551666259765625, 0.162567138671875, 0.1699676513671875, 0.1773681640625, 0.1847686767578125, 0.192169189453125, 0.1995697021484375, 0.20697021484375, 0.2143707275390625, 0.221771240234375, 0.2291717529296875, 0.236572265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 17.0, 14.0, 10.0, 23.0, 23.0, 20.0, 29.0, 27.0, 27.0, 31.0, 37.0, 37.0, 45.0, 45.0, 35.0, 50.0, 43.0, 42.0, 49.0, 33.0, 36.0, 48.0, 42.0, 29.0, 26.0, 20.0, 19.0, 23.0, 19.0, 9.0, 9.0, 11.0, 4.0, 13.0, 5.0, 8.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.32421875, -2.24969482421875, -2.1751708984375, -2.10064697265625, -2.026123046875, -1.95159912109375, -1.8770751953125, -1.80255126953125, -1.72802734375, -1.65350341796875, -1.5789794921875, -1.50445556640625, -1.429931640625, -1.35540771484375, -1.2808837890625, -1.20635986328125, -1.1318359375, -1.05731201171875, -0.9827880859375, -0.90826416015625, -0.833740234375, -0.75921630859375, -0.6846923828125, -0.61016845703125, -0.53564453125, -0.46112060546875, -0.3865966796875, -0.31207275390625, -0.237548828125, -0.16302490234375, -0.0885009765625, -0.01397705078125, 0.060546875, 0.13507080078125, 0.2095947265625, 0.28411865234375, 0.358642578125, 0.43316650390625, 0.5076904296875, 0.58221435546875, 0.65673828125, 0.73126220703125, 0.8057861328125, 0.88031005859375, 0.954833984375, 1.02935791015625, 1.1038818359375, 1.17840576171875, 1.2529296875, 1.32745361328125, 1.4019775390625, 1.47650146484375, 1.551025390625, 1.62554931640625, 1.7000732421875, 1.77459716796875, 1.84912109375, 1.92364501953125, 1.9981689453125, 2.07269287109375, 2.147216796875, 2.22174072265625, 2.2962646484375, 2.37078857421875, 2.4453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 10.0, 17.0, 22.0, 47.0, 54.0, 79.0, 144.0, 251.0, 587.0, 2457.0, 745711.0, 295746.0, 2235.0, 550.0, 245.0, 132.0, 84.0, 47.0, 41.0, 25.0, 16.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093505859375, -0.09075260162353516, -0.08799934387207031, -0.08524608612060547, -0.08249282836914062, -0.07973957061767578, -0.07698631286621094, -0.0742330551147461, -0.07147979736328125, -0.0687265396118164, -0.06597328186035156, -0.06322002410888672, -0.060466766357421875, -0.05771350860595703, -0.05496025085449219, -0.052206993103027344, -0.0494537353515625, -0.046700477600097656, -0.04394721984863281, -0.04119396209716797, -0.038440704345703125, -0.03568744659423828, -0.03293418884277344, -0.030180931091308594, -0.02742767333984375, -0.024674415588378906, -0.021921157836914062, -0.01916790008544922, -0.016414642333984375, -0.013661384582519531, -0.010908126831054688, -0.008154869079589844, -0.005401611328125, -0.0026483535766601562, 0.0001049041748046875, 0.0028581619262695312, 0.005611419677734375, 0.008364677429199219, 0.011117935180664062, 0.013871192932128906, 0.01662445068359375, 0.019377708435058594, 0.022130966186523438, 0.02488422393798828, 0.027637481689453125, 0.03039073944091797, 0.03314399719238281, 0.035897254943847656, 0.0386505126953125, 0.041403770446777344, 0.04415702819824219, 0.04691028594970703, 0.049663543701171875, 0.05241680145263672, 0.05517005920410156, 0.057923316955566406, 0.06067657470703125, 0.0634298324584961, 0.06618309020996094, 0.06893634796142578, 0.07168960571289062, 0.07444286346435547, 0.07719612121582031, 0.07994937896728516, 0.08270263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 13.0, 4.0, 18.0, 21.0, 32.0, 31.0, 55.0, 48.0, 80.0, 83.0, 84.0, 85.0, 72.0, 74.0, 48.0, 54.0, 33.0, 35.0, 24.0, 16.0, 14.0, 8.0, 9.0, 8.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, -1.5635043382644653e-05, -1.5176832675933838e-05, -1.4718621969223022e-05, -1.4260411262512207e-05, -1.3802200555801392e-05, -1.3343989849090576e-05, -1.288577914237976e-05, -1.2427568435668945e-05, -1.196935772895813e-05, -1.1511147022247314e-05, -1.1052936315536499e-05, -1.0594725608825684e-05, -1.0136514902114868e-05, -9.678304195404053e-06, -9.220093488693237e-06, -8.761882781982422e-06, -8.303672075271606e-06, -7.845461368560791e-06, -7.387250661849976e-06, -6.92903995513916e-06, -6.470829248428345e-06, -6.012618541717529e-06, -5.554407835006714e-06, -5.0961971282958984e-06, -4.637986421585083e-06, -4.179775714874268e-06, -3.721565008163452e-06, -3.2633543014526367e-06, -2.8051435947418213e-06, -2.346932888031006e-06, -1.8887221813201904e-06, -1.430511474609375e-06, -9.723007678985596e-07, -5.140900611877441e-07, -5.587935447692871e-08, 4.023313522338867e-07, 8.605420589447021e-07, 1.3187527656555176e-06, 1.776963472366333e-06, 2.2351741790771484e-06, 2.693384885787964e-06, 3.1515955924987793e-06, 3.6098062992095947e-06, 4.06801700592041e-06, 4.526227712631226e-06, 4.984438419342041e-06, 5.4426491260528564e-06, 5.900859832763672e-06, 6.359070539474487e-06, 6.817281246185303e-06, 7.275491952896118e-06, 7.733702659606934e-06, 8.191913366317749e-06, 8.650124073028564e-06, 9.10833477973938e-06, 9.566545486450195e-06, 1.002475619316101e-05, 1.0482966899871826e-05, 1.0941177606582642e-05, 1.1399388313293457e-05, 1.1857599020004272e-05, 1.2315809726715088e-05, 1.2774020433425903e-05, 1.3232231140136719e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 10.0, 15.0, 21.0, 32.0, 45.0, 95.0, 168.0, 268.0, 528.0, 1244.0, 3449.0, 14183.0, 154093.0, 834176.0, 30694.0, 5986.0, 1862.0, 778.0, 377.0, 207.0, 113.0, 71.0, 33.0, 27.0, 18.0, 8.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08190536499023438, -0.07964324951171875, -0.07738113403320312, -0.0751190185546875, -0.07285690307617188, -0.07059478759765625, -0.06833267211914062, -0.066070556640625, -0.06380844116210938, -0.06154632568359375, -0.059284210205078125, -0.0570220947265625, -0.054759979248046875, -0.05249786376953125, -0.050235748291015625, -0.0479736328125, -0.045711517333984375, -0.04344940185546875, -0.041187286376953125, -0.0389251708984375, -0.036663055419921875, -0.03440093994140625, -0.032138824462890625, -0.029876708984375, -0.027614593505859375, -0.02535247802734375, -0.023090362548828125, -0.0208282470703125, -0.018566131591796875, -0.01630401611328125, -0.014041900634765625, -0.01177978515625, -0.009517669677734375, -0.00725555419921875, -0.004993438720703125, -0.0027313232421875, -0.000469207763671875, 0.00179290771484375, 0.004055023193359375, 0.006317138671875, 0.008579254150390625, 0.01084136962890625, 0.013103485107421875, 0.0153656005859375, 0.017627716064453125, 0.01988983154296875, 0.022151947021484375, 0.0244140625, 0.026676177978515625, 0.02893829345703125, 0.031200408935546875, 0.0334625244140625, 0.035724639892578125, 0.03798675537109375, 0.040248870849609375, 0.042510986328125, 0.044773101806640625, 0.04703521728515625, 0.049297332763671875, 0.0515594482421875, 0.053821563720703125, 0.05608367919921875, 0.058345794677734375, 0.06060791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 16.0, 25.0, 44.0, 95.0, 302.0, 284.0, 76.0, 45.0, 22.0, 14.0, 17.0, 9.0, 7.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017661094665527344, -0.016981124877929688, -0.01630115509033203, -0.015621185302734375, -0.014941215515136719, -0.014261245727539062, -0.013581275939941406, -0.01290130615234375, -0.012221336364746094, -0.011541366577148438, -0.010861396789550781, -0.010181427001953125, -0.009501457214355469, -0.008821487426757812, -0.008141517639160156, -0.0074615478515625, -0.006781578063964844, -0.0061016082763671875, -0.005421638488769531, -0.004741668701171875, -0.004061698913574219, -0.0033817291259765625, -0.0027017593383789062, -0.00202178955078125, -0.0013418197631835938, -0.0006618499755859375, 1.811981201171875e-05, 0.000698089599609375, 0.0013780593872070312, 0.0020580291748046875, 0.0027379989624023438, 0.00341796875, 0.004097938537597656, 0.0047779083251953125, 0.005457878112792969, 0.006137847900390625, 0.006817817687988281, 0.0074977874755859375, 0.008177757263183594, 0.00885772705078125, 0.009537696838378906, 0.010217666625976562, 0.010897636413574219, 0.011577606201171875, 0.012257575988769531, 0.012937545776367188, 0.013617515563964844, 0.0142974853515625, 0.014977455139160156, 0.015657424926757812, 0.01633739471435547, 0.017017364501953125, 0.01769733428955078, 0.018377304077148438, 0.019057273864746094, 0.01973724365234375, 0.020417213439941406, 0.021097183227539062, 0.02177715301513672, 0.022457122802734375, 0.02313709259033203, 0.023817062377929688, 0.024497032165527344, 0.025177001953125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 26.0, 40.0, 90.0, 160.0, 200.0, 183.0, 150.0, 65.0, 29.0, 15.0, 14.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3721532821655273, -3.2513275146484375, -3.1305019855499268, -3.009676218032837, -2.888850450515747, -2.7680249214172363, -2.6471991539001465, -2.5263733863830566, -2.405547618865967, -2.284721851348877, -2.163896322250366, -2.0430705547332764, -1.9222447872161865, -1.8014191389083862, -1.680593490600586, -1.559767723083496, -1.4389420747756958, -1.3181164264678955, -1.1972906589508057, -1.0764650106430054, -0.9556392431259155, -0.8348135948181152, -0.7139878869056702, -0.5931621789932251, -0.47233647108078003, -0.35151076316833496, -0.2306850701570511, -0.10985937714576721, 0.010966330766677856, 0.13179200887680054, 0.2526177167892456, 0.3734434247016907, 0.49426913261413574, 0.6150948405265808, 0.7359205484390259, 0.8567461967468262, 0.977571964263916, 1.0983976125717163, 1.2192232608795166, 1.3400490283966064, 1.4608747959136963, 1.5817004442214966, 1.7025262117385864, 1.8233518600463867, 1.9441776275634766, 2.0650033950805664, 2.185828924179077, 2.306654691696167, 2.4274802207946777, 2.5483059883117676, 2.6691315174102783, 2.789957284927368, 2.910783052444458, 3.0316085815429688, 3.1524343490600586, 3.2732601165771484, 3.3940858840942383, 3.514911651611328, 3.635737180709839, 3.7565629482269287, 3.8773887157440186, 3.9982142448425293, 4.119040012359619, 4.239865779876709, 4.360691547393799]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 11.0, 10.0, 19.0, 25.0, 31.0, 42.0, 43.0, 71.0, 59.0, 73.0, 80.0, 89.0, 78.0, 66.0, 68.0, 46.0, 42.0, 41.0, 28.0, 19.0, 16.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2674089670181274, -1.2077746391296387, -1.1481401920318604, -1.0885058641433716, -1.0288715362548828, -0.969237208366394, -0.9096028208732605, -0.849968433380127, -0.7903341054916382, -0.7306997776031494, -0.6710653901100159, -0.6114310026168823, -0.5517966747283936, -0.4921623170375824, -0.43252795934677124, -0.3728936016559601, -0.3132592439651489, -0.25362488627433777, -0.1939905285835266, -0.13435617089271545, -0.0747218132019043, -0.01508745551109314, 0.04454690217971802, 0.10418125987052917, 0.16381561756134033, 0.2234499752521515, 0.28308433294296265, 0.3427186906337738, 0.40235304832458496, 0.4619874060153961, 0.5216217637062073, 0.5812561511993408, 0.64089035987854, 0.7005246877670288, 0.7601590752601624, 0.8197934627532959, 0.8794277906417847, 0.9390621185302734, 0.998696506023407, 1.0583308935165405, 1.1179652214050293, 1.177599549293518, 1.2372338771820068, 1.2968683242797852, 1.356502652168274, 1.4161369800567627, 1.475771427154541, 1.5354057550430298, 1.5950400829315186, 1.6546744108200073, 1.714308738708496, 1.7739431858062744, 1.8335775136947632, 1.893211841583252, 1.9528462886810303, 2.0124804973602295, 2.072114944458008, 2.131749391555786, 2.1913836002349854, 2.2510180473327637, 2.310652256011963, 2.370286703109741, 2.4299211502075195, 2.4895553588867188, 2.549189805984497]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 12.0, 12.0, 16.0, 27.0, 39.0, 59.0, 104.0, 189.0, 332.0, 623.0, 1203.0, 2634.0, 6313.0, 18643.0, 78836.0, 616603.0, 261881.0, 41115.0, 11555.0, 4319.0, 1895.0, 972.0, 513.0, 234.0, 160.0, 89.0, 52.0, 34.0, 24.0, 13.0, 19.0, 8.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.21087646484375, -1.1639404296875, -1.11700439453125, -1.070068359375, -1.02313232421875, -0.9761962890625, -0.92926025390625, -0.88232421875, -0.83538818359375, -0.7884521484375, -0.74151611328125, -0.694580078125, -0.64764404296875, -0.6007080078125, -0.55377197265625, -0.5068359375, -0.45989990234375, -0.4129638671875, -0.36602783203125, -0.319091796875, -0.27215576171875, -0.2252197265625, -0.17828369140625, -0.13134765625, -0.08441162109375, -0.0374755859375, 0.00946044921875, 0.056396484375, 0.10333251953125, 0.1502685546875, 0.19720458984375, 0.244140625, 0.29107666015625, 0.3380126953125, 0.38494873046875, 0.431884765625, 0.47882080078125, 0.5257568359375, 0.57269287109375, 0.61962890625, 0.66656494140625, 0.7135009765625, 0.76043701171875, 0.807373046875, 0.85430908203125, 0.9012451171875, 0.94818115234375, 0.9951171875, 1.04205322265625, 1.0889892578125, 1.13592529296875, 1.182861328125, 1.22979736328125, 1.2767333984375, 1.32366943359375, 1.37060546875, 1.41754150390625, 1.4644775390625, 1.51141357421875, 1.558349609375, 1.60528564453125, 1.6522216796875, 1.69915771484375, 1.74609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 14.0, 22.0, 35.0, 45.0, 49.0, 49.0, 57.0, 80.0, 82.0, 82.0, 80.0, 85.0, 45.0, 63.0, 49.0, 32.0, 23.0, 18.0, 15.0, 15.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.65142822265625, -2.5333251953125, -2.41522216796875, -2.297119140625, -2.17901611328125, -2.0609130859375, -1.94281005859375, -1.82470703125, -1.70660400390625, -1.5885009765625, -1.47039794921875, -1.352294921875, -1.23419189453125, -1.1160888671875, -0.99798583984375, -0.8798828125, -0.76177978515625, -0.6436767578125, -0.52557373046875, -0.407470703125, -0.28936767578125, -0.1712646484375, -0.05316162109375, 0.06494140625, 0.18304443359375, 0.3011474609375, 0.41925048828125, 0.537353515625, 0.65545654296875, 0.7735595703125, 0.89166259765625, 1.009765625, 1.12786865234375, 1.2459716796875, 1.36407470703125, 1.482177734375, 1.60028076171875, 1.7183837890625, 1.83648681640625, 1.95458984375, 2.07269287109375, 2.1907958984375, 2.30889892578125, 2.427001953125, 2.54510498046875, 2.6632080078125, 2.78131103515625, 2.8994140625, 3.01751708984375, 3.1356201171875, 3.25372314453125, 3.371826171875, 3.48992919921875, 3.6080322265625, 3.72613525390625, 3.84423828125, 3.96234130859375, 4.0804443359375, 4.19854736328125, 4.316650390625, 4.43475341796875, 4.5528564453125, 4.67095947265625, 4.7890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 11.0, 7.0, 7.0, 10.0, 22.0, 14.0, 29.0, 27.0, 36.0, 48.0, 72.0, 100.0, 175.0, 359.0, 1380.0, 14634.0, 929708.0, 96949.0, 3598.0, 639.0, 215.0, 157.0, 96.0, 57.0, 47.0, 31.0, 25.0, 22.0, 19.0, 10.0, 11.0, 7.0, 3.0, 8.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0], "bins": [-5.64453125, -5.49884033203125, -5.3531494140625, -5.20745849609375, -5.061767578125, -4.91607666015625, -4.7703857421875, -4.62469482421875, -4.47900390625, -4.33331298828125, -4.1876220703125, -4.04193115234375, -3.896240234375, -3.75054931640625, -3.6048583984375, -3.45916748046875, -3.3134765625, -3.16778564453125, -3.0220947265625, -2.87640380859375, -2.730712890625, -2.58502197265625, -2.4393310546875, -2.29364013671875, -2.14794921875, -2.00225830078125, -1.8565673828125, -1.71087646484375, -1.565185546875, -1.41949462890625, -1.2738037109375, -1.12811279296875, -0.982421875, -0.83673095703125, -0.6910400390625, -0.54534912109375, -0.399658203125, -0.25396728515625, -0.1082763671875, 0.03741455078125, 0.18310546875, 0.32879638671875, 0.4744873046875, 0.62017822265625, 0.765869140625, 0.91156005859375, 1.0572509765625, 1.20294189453125, 1.3486328125, 1.49432373046875, 1.6400146484375, 1.78570556640625, 1.931396484375, 2.07708740234375, 2.2227783203125, 2.36846923828125, 2.51416015625, 2.65985107421875, 2.8055419921875, 2.95123291015625, 3.096923828125, 3.24261474609375, 3.3883056640625, 3.53399658203125, 3.6796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 9.0, 16.0, 24.0, 24.0, 19.0, 23.0, 36.0, 40.0, 39.0, 48.0, 47.0, 42.0, 49.0, 59.0, 36.0, 51.0, 57.0, 39.0, 32.0, 38.0, 32.0, 35.0, 19.0, 19.0, 27.0, 18.0, 15.0, 16.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.86328125, -3.758331298828125, -3.65338134765625, -3.548431396484375, -3.4434814453125, -3.338531494140625, -3.23358154296875, -3.128631591796875, -3.023681640625, -2.918731689453125, -2.81378173828125, -2.708831787109375, -2.6038818359375, -2.498931884765625, -2.39398193359375, -2.289031982421875, -2.18408203125, -2.079132080078125, -1.97418212890625, -1.869232177734375, -1.7642822265625, -1.659332275390625, -1.55438232421875, -1.449432373046875, -1.344482421875, -1.239532470703125, -1.13458251953125, -1.029632568359375, -0.9246826171875, -0.819732666015625, -0.71478271484375, -0.609832763671875, -0.5048828125, -0.399932861328125, -0.29498291015625, -0.190032958984375, -0.0850830078125, 0.019866943359375, 0.12481689453125, 0.229766845703125, 0.334716796875, 0.439666748046875, 0.54461669921875, 0.649566650390625, 0.7545166015625, 0.859466552734375, 0.96441650390625, 1.069366455078125, 1.17431640625, 1.279266357421875, 1.38421630859375, 1.489166259765625, 1.5941162109375, 1.699066162109375, 1.80401611328125, 1.908966064453125, 2.013916015625, 2.118865966796875, 2.22381591796875, 2.328765869140625, 2.4337158203125, 2.538665771484375, 2.64361572265625, 2.748565673828125, 2.853515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 9.0, 13.0, 15.0, 21.0, 31.0, 48.0, 66.0, 120.0, 199.0, 390.0, 1222.0, 5085.0, 35100.0, 727144.0, 254676.0, 19467.0, 3258.0, 844.0, 357.0, 179.0, 95.0, 47.0, 35.0, 27.0, 20.0, 14.0, 14.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0439453125, -1.0139999389648438, -0.9840545654296875, -0.9541091918945312, -0.924163818359375, -0.8942184448242188, -0.8642730712890625, -0.8343276977539062, -0.80438232421875, -0.7744369506835938, -0.7444915771484375, -0.7145462036132812, -0.684600830078125, -0.6546554565429688, -0.6247100830078125, -0.5947647094726562, -0.5648193359375, -0.5348739624023438, -0.5049285888671875, -0.47498321533203125, -0.445037841796875, -0.41509246826171875, -0.3851470947265625, -0.35520172119140625, -0.32525634765625, -0.29531097412109375, -0.2653656005859375, -0.23542022705078125, -0.205474853515625, -0.17552947998046875, -0.1455841064453125, -0.11563873291015625, -0.085693359375, -0.05574798583984375, -0.0258026123046875, 0.00414276123046875, 0.034088134765625, 0.06403350830078125, 0.0939788818359375, 0.12392425537109375, 0.15386962890625, 0.18381500244140625, 0.2137603759765625, 0.24370574951171875, 0.273651123046875, 0.30359649658203125, 0.3335418701171875, 0.36348724365234375, 0.3934326171875, 0.42337799072265625, 0.4533233642578125, 0.48326873779296875, 0.513214111328125, 0.5431594848632812, 0.5731048583984375, 0.6030502319335938, 0.63299560546875, 0.6629409790039062, 0.6928863525390625, 0.7228317260742188, 0.752777099609375, 0.7827224731445312, 0.8126678466796875, 0.8426132202148438, 0.87255859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 16.0, 19.0, 27.0, 49.0, 112.0, 344.0, 235.0, 98.0, 38.0, 27.0, 14.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002760887145996094, -0.00026978179812431335, -0.00026347488164901733, -0.0002571679651737213, -0.0002508610486984253, -0.00024455413222312927, -0.00023824721574783325, -0.00023194029927253723, -0.0002256333827972412, -0.0002193264663219452, -0.00021301954984664917, -0.00020671263337135315, -0.00020040571689605713, -0.0001940988004207611, -0.0001877918839454651, -0.00018148496747016907, -0.00017517805099487305, -0.00016887113451957703, -0.000162564218044281, -0.00015625730156898499, -0.00014995038509368896, -0.00014364346861839294, -0.00013733655214309692, -0.0001310296356678009, -0.00012472271919250488, -0.00011841580271720886, -0.00011210888624191284, -0.00010580196976661682, -9.94950532913208e-05, -9.318813681602478e-05, -8.688122034072876e-05, -8.057430386543274e-05, -7.426738739013672e-05, -6.79604709148407e-05, -6.165355443954468e-05, -5.534663796424866e-05, -4.903972148895264e-05, -4.2732805013656616e-05, -3.6425888538360596e-05, -3.0118972063064575e-05, -2.3812055587768555e-05, -1.7505139112472534e-05, -1.1198222637176514e-05, -4.891306161880493e-06, 1.4156103134155273e-06, 7.722526788711548e-06, 1.4029443264007568e-05, 2.033635973930359e-05, 2.664327621459961e-05, 3.295019268989563e-05, 3.925710916519165e-05, 4.556402564048767e-05, 5.187094211578369e-05, 5.817785859107971e-05, 6.448477506637573e-05, 7.079169154167175e-05, 7.709860801696777e-05, 8.34055244922638e-05, 8.971244096755981e-05, 9.601935744285583e-05, 0.00010232627391815186, 0.00010863319039344788, 0.0001149401068687439, 0.00012124702334403992, 0.00012755393981933594]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 4.0, 17.0, 28.0, 26.0, 51.0, 74.0, 127.0, 210.0, 384.0, 865.0, 2052.0, 5369.0, 16789.0, 67644.0, 608188.0, 282141.0, 45135.0, 12299.0, 4038.0, 1563.0, 693.0, 345.0, 197.0, 91.0, 66.0, 41.0, 27.0, 25.0, 10.0, 12.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5126571655273438, -0.4935760498046875, -0.47449493408203125, -0.455413818359375, -0.43633270263671875, -0.4172515869140625, -0.39817047119140625, -0.37908935546875, -0.36000823974609375, -0.3409271240234375, -0.32184600830078125, -0.302764892578125, -0.28368377685546875, -0.2646026611328125, -0.24552154541015625, -0.2264404296875, -0.20735931396484375, -0.1882781982421875, -0.16919708251953125, -0.150115966796875, -0.13103485107421875, -0.1119537353515625, -0.09287261962890625, -0.07379150390625, -0.05471038818359375, -0.0356292724609375, -0.01654815673828125, 0.002532958984375, 0.02161407470703125, 0.0406951904296875, 0.05977630615234375, 0.078857421875, 0.09793853759765625, 0.1170196533203125, 0.13610076904296875, 0.155181884765625, 0.17426300048828125, 0.1933441162109375, 0.21242523193359375, 0.23150634765625, 0.25058746337890625, 0.2696685791015625, 0.28874969482421875, 0.307830810546875, 0.32691192626953125, 0.3459930419921875, 0.36507415771484375, 0.3841552734375, 0.40323638916015625, 0.4223175048828125, 0.44139862060546875, 0.460479736328125, 0.47956085205078125, 0.4986419677734375, 0.5177230834960938, 0.53680419921875, 0.5558853149414062, 0.5749664306640625, 0.5940475463867188, 0.613128662109375, 0.6322097778320312, 0.6512908935546875, 0.6703720092773438, 0.689453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 6.0, 13.0, 15.0, 25.0, 22.0, 40.0, 52.0, 80.0, 141.0, 234.0, 119.0, 68.0, 42.0, 38.0, 20.0, 17.0, 18.0, 12.0, 10.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412353515625, -0.40128326416015625, -0.3902130126953125, -0.37914276123046875, -0.368072509765625, -0.35700225830078125, -0.3459320068359375, -0.33486175537109375, -0.32379150390625, -0.31272125244140625, -0.3016510009765625, -0.29058074951171875, -0.279510498046875, -0.26844024658203125, -0.2573699951171875, -0.24629974365234375, -0.2352294921875, -0.22415924072265625, -0.2130889892578125, -0.20201873779296875, -0.190948486328125, -0.17987823486328125, -0.1688079833984375, -0.15773773193359375, -0.14666748046875, -0.13559722900390625, -0.1245269775390625, -0.11345672607421875, -0.102386474609375, -0.09131622314453125, -0.0802459716796875, -0.06917572021484375, -0.05810546875, -0.04703521728515625, -0.0359649658203125, -0.02489471435546875, -0.013824462890625, -0.00275421142578125, 0.0083160400390625, 0.01938629150390625, 0.03045654296875, 0.04152679443359375, 0.0525970458984375, 0.06366729736328125, 0.074737548828125, 0.08580780029296875, 0.0968780517578125, 0.10794830322265625, 0.1190185546875, 0.13008880615234375, 0.1411590576171875, 0.15222930908203125, 0.163299560546875, 0.17436981201171875, 0.1854400634765625, 0.19651031494140625, 0.20758056640625, 0.21865081787109375, 0.2297210693359375, 0.24079132080078125, 0.251861572265625, 0.26293182373046875, 0.2740020751953125, 0.28507232666015625, 0.296142578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 32.0, 100.0, 293.0, 351.0, 159.0, 45.0, 16.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.670278072357178, -6.201328754425049, -5.73237943649292, -5.263430595397949, -4.79448127746582, -4.325531959533691, -3.8565826416015625, -3.3876333236694336, -2.9186840057373047, -2.449734687805176, -1.9807854890823364, -1.511836290359497, -1.0428869724273682, -0.5739376544952393, -0.10498857498168945, 0.36396074295043945, 0.8329100608825684, 1.3018593788146973, 1.7708085775375366, 2.239757776260376, 2.708707094192505, 3.177656412124634, 3.6466054916381836, 4.1155548095703125, 4.584504127502441, 5.05345344543457, 5.522402763366699, 5.991352081298828, 6.460301399230957, 6.929250717163086, 7.398199558258057, 7.8671488761901855, 8.336097717285156, 8.805047035217285, 9.273996353149414, 9.742945671081543, 10.211894989013672, 10.6808443069458, 11.14979362487793, 11.618741989135742, 12.087692260742188, 12.556641578674316, 13.025590896606445, 13.494540214538574, 13.963489532470703, 14.432438850402832, 14.901388168334961, 15.370336532592773, 15.839285850524902, 16.30823516845703, 16.777183532714844, 17.24613380432129, 17.7150821685791, 18.184032440185547, 18.65298080444336, 19.121931076049805, 19.590879440307617, 20.05982780456543, 20.528778076171875, 20.997726440429688, 21.466676712036133, 21.935625076293945, 22.40457534790039, 22.873523712158203, 23.34247398376465]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 5.0, 3.0, 11.0, 10.0, 10.0, 24.0, 26.0, 24.0, 33.0, 27.0, 18.0, 45.0, 32.0, 48.0, 41.0, 36.0, 43.0, 48.0, 52.0, 49.0, 47.0, 34.0, 42.0, 27.0, 37.0, 47.0, 29.0, 16.0, 21.0, 22.0, 20.0, 18.0, 9.0, 10.0, 9.0, 5.0, 4.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.781528949737549, -4.603460788726807, -4.425393104553223, -4.2473249435424805, -4.069256782531738, -3.8911890983581543, -3.713120937347412, -3.535053014755249, -3.356985092163086, -3.178917169570923, -3.0008490085601807, -2.8227810859680176, -2.6447131633758545, -2.4666452407836914, -2.288577079772949, -2.110509157180786, -1.932440996170044, -1.7543729543685913, -1.5763050317764282, -1.3982369899749756, -1.2201690673828125, -1.0421010255813599, -0.8640329837799072, -0.6859650611877441, -0.5078970193862915, -0.32982903718948364, -0.1517610251903534, 0.026306986808776855, 0.20437496900558472, 0.3824429512023926, 0.5605109930038452, 0.7385789155960083, 0.9166469573974609, 1.0947149991989136, 1.2727829217910767, 1.4508509635925293, 1.6289188861846924, 1.806986927986145, 1.9850549697875977, 2.1631228923797607, 2.341190814971924, 2.519258737564087, 2.697326898574829, 2.875394821166992, 3.0534627437591553, 3.2315306663513184, 3.4095988273620605, 3.5876667499542236, 3.765734910964966, 3.943802833557129, 4.121870994567871, 4.299939155578613, 4.478006839752197, 4.6560750007629395, 4.834142684936523, 5.012210845947266, 5.190279006958008, 5.36834716796875, 5.546414852142334, 5.724483013153076, 5.902551174163818, 6.080618858337402, 6.2586870193481445, 6.436755180358887, 6.614822864532471]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 15.0, 13.0, 23.0, 21.0, 24.0, 31.0, 44.0, 57.0, 84.0, 127.0, 158.0, 253.0, 355.0, 515.0, 951.0, 1815.0, 3513.0, 8597.0, 25557.0, 116232.0, 1669861.0, 2187792.0, 134549.0, 26826.0, 8538.0, 3703.0, 1689.0, 965.0, 585.0, 393.0, 260.0, 180.0, 110.0, 104.0, 86.0, 59.0, 43.0, 38.0, 36.0, 18.0, 15.0, 10.0, 15.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.046875, -1.973876953125, -1.90087890625, -1.827880859375, -1.7548828125, -1.681884765625, -1.60888671875, -1.535888671875, -1.462890625, -1.389892578125, -1.31689453125, -1.243896484375, -1.1708984375, -1.097900390625, -1.02490234375, -0.951904296875, -0.87890625, -0.805908203125, -0.73291015625, -0.659912109375, -0.5869140625, -0.513916015625, -0.44091796875, -0.367919921875, -0.294921875, -0.221923828125, -0.14892578125, -0.075927734375, -0.0029296875, 0.070068359375, 0.14306640625, 0.216064453125, 0.2890625, 0.362060546875, 0.43505859375, 0.508056640625, 0.5810546875, 0.654052734375, 0.72705078125, 0.800048828125, 0.873046875, 0.946044921875, 1.01904296875, 1.092041015625, 1.1650390625, 1.238037109375, 1.31103515625, 1.384033203125, 1.45703125, 1.530029296875, 1.60302734375, 1.676025390625, 1.7490234375, 1.822021484375, 1.89501953125, 1.968017578125, 2.041015625, 2.114013671875, 2.18701171875, 2.260009765625, 2.3330078125, 2.406005859375, 2.47900390625, 2.552001953125, 2.625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 18.0, 45.0, 42.0, 41.0, 64.0, 98.0, 90.0, 100.0, 107.0, 78.0, 75.0, 48.0, 47.0, 24.0, 29.0, 19.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.254669189453125, -1.18707275390625, -1.119476318359375, -1.0518798828125, -0.984283447265625, -0.91668701171875, -0.849090576171875, -0.781494140625, -0.713897705078125, -0.64630126953125, -0.578704833984375, -0.5111083984375, -0.443511962890625, -0.37591552734375, -0.308319091796875, -0.24072265625, -0.173126220703125, -0.10552978515625, -0.037933349609375, 0.0296630859375, 0.097259521484375, 0.16485595703125, 0.232452392578125, 0.300048828125, 0.367645263671875, 0.43524169921875, 0.502838134765625, 0.5704345703125, 0.638031005859375, 0.70562744140625, 0.773223876953125, 0.8408203125, 0.908416748046875, 0.97601318359375, 1.043609619140625, 1.1112060546875, 1.178802490234375, 1.24639892578125, 1.313995361328125, 1.381591796875, 1.449188232421875, 1.51678466796875, 1.584381103515625, 1.6519775390625, 1.719573974609375, 1.78717041015625, 1.854766845703125, 1.92236328125, 1.989959716796875, 2.05755615234375, 2.125152587890625, 2.1927490234375, 2.260345458984375, 2.32794189453125, 2.395538330078125, 2.463134765625, 2.530731201171875, 2.59832763671875, 2.665924072265625, 2.7335205078125, 2.801116943359375, 2.86871337890625, 2.936309814453125, 3.00390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 7.0, 21.0, 27.0, 62.0, 99.0, 143.0, 260.0, 582.0, 1286.0, 4037.0, 21820.0, 454698.0, 3614012.0, 84027.0, 9089.0, 2264.0, 941.0, 397.0, 207.0, 104.0, 64.0, 37.0, 21.0, 12.0, 10.0, 8.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.91015625, -4.75311279296875, -4.5960693359375, -4.43902587890625, -4.281982421875, -4.12493896484375, -3.9678955078125, -3.81085205078125, -3.65380859375, -3.49676513671875, -3.3397216796875, -3.18267822265625, -3.025634765625, -2.86859130859375, -2.7115478515625, -2.55450439453125, -2.3974609375, -2.24041748046875, -2.0833740234375, -1.92633056640625, -1.769287109375, -1.61224365234375, -1.4552001953125, -1.29815673828125, -1.14111328125, -0.98406982421875, -0.8270263671875, -0.66998291015625, -0.512939453125, -0.35589599609375, -0.1988525390625, -0.04180908203125, 0.115234375, 0.27227783203125, 0.4293212890625, 0.58636474609375, 0.743408203125, 0.90045166015625, 1.0574951171875, 1.21453857421875, 1.37158203125, 1.52862548828125, 1.6856689453125, 1.84271240234375, 1.999755859375, 2.15679931640625, 2.3138427734375, 2.47088623046875, 2.6279296875, 2.78497314453125, 2.9420166015625, 3.09906005859375, 3.256103515625, 3.41314697265625, 3.5701904296875, 3.72723388671875, 3.88427734375, 4.04132080078125, 4.1983642578125, 4.35540771484375, 4.512451171875, 4.66949462890625, 4.8265380859375, 4.98358154296875, 5.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 17.0, 22.0, 31.0, 40.0, 70.0, 102.0, 160.0, 265.0, 541.0, 834.0, 776.0, 441.0, 277.0, 157.0, 117.0, 58.0, 47.0, 27.0, 24.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0794525146484375, -1.048553466796875, -1.0176544189453125, -0.98675537109375, -0.9558563232421875, -0.924957275390625, -0.8940582275390625, -0.8631591796875, -0.8322601318359375, -0.801361083984375, -0.7704620361328125, -0.73956298828125, -0.7086639404296875, -0.677764892578125, -0.6468658447265625, -0.615966796875, -0.5850677490234375, -0.554168701171875, -0.5232696533203125, -0.49237060546875, -0.4614715576171875, -0.430572509765625, -0.3996734619140625, -0.3687744140625, -0.3378753662109375, -0.306976318359375, -0.2760772705078125, -0.24517822265625, -0.2142791748046875, -0.183380126953125, -0.1524810791015625, -0.12158203125, -0.0906829833984375, -0.059783935546875, -0.0288848876953125, 0.00201416015625, 0.0329132080078125, 0.063812255859375, 0.0947113037109375, 0.1256103515625, 0.1565093994140625, 0.187408447265625, 0.2183074951171875, 0.24920654296875, 0.2801055908203125, 0.311004638671875, 0.3419036865234375, 0.372802734375, 0.4037017822265625, 0.434600830078125, 0.4654998779296875, 0.49639892578125, 0.5272979736328125, 0.558197021484375, 0.5890960693359375, 0.6199951171875, 0.6508941650390625, 0.681793212890625, 0.7126922607421875, 0.74359130859375, 0.7744903564453125, 0.805389404296875, 0.8362884521484375, 0.8671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 9.0, 13.0, 20.0, 20.0, 25.0, 25.0, 52.0, 52.0, 60.0, 66.0, 80.0, 70.0, 71.0, 86.0, 68.0, 73.0, 49.0, 31.0, 25.0, 29.0, 16.0, 10.0, 7.0, 9.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.405890464782715, -2.3250732421875, -2.244256019592285, -2.1634387969970703, -2.0826215744018555, -2.0018043518066406, -1.9209871292114258, -1.840169906616211, -1.759352684020996, -1.6785354614257812, -1.5977182388305664, -1.5169010162353516, -1.4360837936401367, -1.3552665710449219, -1.274449348449707, -1.1936321258544922, -1.1128149032592773, -1.0319976806640625, -0.9511804580688477, -0.8703632354736328, -0.789546012878418, -0.7087287902832031, -0.6279115676879883, -0.5470943450927734, -0.4662771224975586, -0.38545989990234375, -0.3046426773071289, -0.22382545471191406, -0.14300823211669922, -0.062191009521484375, 0.01862621307373047, 0.09944343566894531, 0.18026089668273926, 0.2610781192779541, 0.34189534187316895, 0.4227125644683838, 0.5035297870635986, 0.5843470096588135, 0.6651642322540283, 0.7459814548492432, 0.826798677444458, 0.9076159000396729, 0.9884331226348877, 1.0692503452301025, 1.1500675678253174, 1.2308847904205322, 1.311702013015747, 1.392519235610962, 1.4733364582061768, 1.5541536808013916, 1.6349709033966064, 1.7157881259918213, 1.7966053485870361, 1.877422571182251, 1.9582397937774658, 2.0390570163726807, 2.1198742389678955, 2.2006914615631104, 2.281508684158325, 2.36232590675354, 2.443143129348755, 2.5239603519439697, 2.6047775745391846, 2.6855947971343994, 2.7664120197296143]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 8.0, 14.0, 20.0, 34.0, 33.0, 38.0, 56.0, 53.0, 57.0, 69.0, 71.0, 63.0, 56.0, 62.0, 71.0, 50.0, 54.0, 41.0, 40.0, 34.0, 24.0, 12.0, 11.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.071363925933838, -1.985168695449829, -1.8989734649658203, -1.8127782344818115, -1.7265828847885132, -1.6403876543045044, -1.5541924238204956, -1.4679970741271973, -1.3818018436431885, -1.2956066131591797, -1.209411382675171, -1.123216152191162, -1.0370208024978638, -0.950825572013855, -0.8646303415298462, -0.7784350514411926, -0.6922398805618286, -0.6060446500778198, -0.5198493599891663, -0.43365412950515747, -0.3474588692188263, -0.2612636089324951, -0.17506837844848633, -0.08887308835983276, -0.0026778578758239746, 0.0835173949599266, 0.16971264779567719, 0.25590789318084717, 0.34210315346717834, 0.4282984137535095, 0.5144936442375183, 0.6006889343261719, 0.6868841648101807, 0.7730793952941895, 0.859274685382843, 0.9454699158668518, 1.0316652059555054, 1.1178604364395142, 1.204055666923523, 1.2902510166168213, 1.37644624710083, 1.4626414775848389, 1.5488367080688477, 1.6350319385528564, 1.7212272882461548, 1.8074225187301636, 1.8936177492141724, 1.9798130989074707, 2.0660080909729004, 2.152203321456909, 2.238398551940918, 2.3245937824249268, 2.4107890129089355, 2.4969844818115234, 2.583179473876953, 2.669374942779541, 2.75557017326355, 2.8417654037475586, 2.9279606342315674, 3.014155864715576, 3.100351095199585, 3.1865463256835938, 3.2727417945861816, 3.3589370250701904, 3.445132255554199]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 18.0, 29.0, 36.0, 54.0, 97.0, 183.0, 354.0, 885.0, 2959.0, 18904.0, 565457.0, 438939.0, 16394.0, 2645.0, 800.0, 354.0, 163.0, 102.0, 58.0, 35.0, 20.0, 17.0, 15.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3390541076660156, -0.32288360595703125, -0.3067131042480469, -0.2905426025390625, -0.2743721008300781, -0.25820159912109375, -0.24203109741210938, -0.225860595703125, -0.20969009399414062, -0.19351959228515625, -0.17734909057617188, -0.1611785888671875, -0.14500808715820312, -0.12883758544921875, -0.11266708374023438, -0.09649658203125, -0.08032608032226562, -0.06415557861328125, -0.047985076904296875, -0.0318145751953125, -0.015644073486328125, 0.00052642822265625, 0.016696929931640625, 0.032867431640625, 0.049037933349609375, 0.06520843505859375, 0.08137893676757812, 0.0975494384765625, 0.11371994018554688, 0.12989044189453125, 0.14606094360351562, 0.1622314453125, 0.17840194702148438, 0.19457244873046875, 0.21074295043945312, 0.2269134521484375, 0.24308395385742188, 0.25925445556640625, 0.2754249572753906, 0.291595458984375, 0.3077659606933594, 0.32393646240234375, 0.3401069641113281, 0.3562774658203125, 0.3724479675292969, 0.38861846923828125, 0.4047889709472656, 0.42095947265625, 0.4371299743652344, 0.45330047607421875, 0.4694709777832031, 0.4856414794921875, 0.5018119812011719, 0.5179824829101562, 0.5341529846191406, 0.550323486328125, 0.5664939880371094, 0.5826644897460938, 0.5988349914550781, 0.6150054931640625, 0.6311759948730469, 0.6473464965820312, 0.6635169982910156, 0.6796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 12.0, 9.0, 23.0, 26.0, 29.0, 52.0, 50.0, 57.0, 68.0, 70.0, 85.0, 69.0, 81.0, 66.0, 65.0, 59.0, 50.0, 39.0, 31.0, 15.0, 14.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3081207275390625, -1.246124267578125, -1.1841278076171875, -1.12213134765625, -1.0601348876953125, -0.998138427734375, -0.9361419677734375, -0.8741455078125, -0.8121490478515625, -0.750152587890625, -0.6881561279296875, -0.62615966796875, -0.5641632080078125, -0.502166748046875, -0.4401702880859375, -0.378173828125, -0.3161773681640625, -0.254180908203125, -0.1921844482421875, -0.13018798828125, -0.0681915283203125, -0.006195068359375, 0.0558013916015625, 0.1177978515625, 0.1797943115234375, 0.241790771484375, 0.3037872314453125, 0.36578369140625, 0.4277801513671875, 0.489776611328125, 0.5517730712890625, 0.61376953125, 0.6757659912109375, 0.737762451171875, 0.7997589111328125, 0.86175537109375, 0.9237518310546875, 0.985748291015625, 1.0477447509765625, 1.1097412109375, 1.1717376708984375, 1.233734130859375, 1.2957305908203125, 1.35772705078125, 1.4197235107421875, 1.481719970703125, 1.5437164306640625, 1.605712890625, 1.6677093505859375, 1.729705810546875, 1.7917022705078125, 1.85369873046875, 1.9156951904296875, 1.977691650390625, 2.0396881103515625, 2.1016845703125, 2.1636810302734375, 2.225677490234375, 2.2876739501953125, 2.34967041015625, 2.4116668701171875, 2.473663330078125, 2.5356597900390625, 2.59765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 9.0, 11.0, 10.0, 16.0, 12.0, 23.0, 21.0, 32.0, 58.0, 46.0, 88.0, 124.0, 166.0, 282.0, 430.0, 994.0, 4642.0, 48591.0, 796180.0, 182880.0, 10697.0, 1533.0, 576.0, 309.0, 206.0, 138.0, 123.0, 83.0, 73.0, 47.0, 38.0, 17.0, 24.0, 24.0, 15.0, 4.0, 5.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24874114990234375, -0.2394256591796875, -0.23011016845703125, -0.220794677734375, -0.21147918701171875, -0.2021636962890625, -0.19284820556640625, -0.18353271484375, -0.17421722412109375, -0.1649017333984375, -0.15558624267578125, -0.146270751953125, -0.13695526123046875, -0.1276397705078125, -0.11832427978515625, -0.1090087890625, -0.09969329833984375, -0.0903778076171875, -0.08106231689453125, -0.071746826171875, -0.06243133544921875, -0.0531158447265625, -0.04380035400390625, -0.03448486328125, -0.02516937255859375, -0.0158538818359375, -0.00653839111328125, 0.002777099609375, 0.01209259033203125, 0.0214080810546875, 0.03072357177734375, 0.0400390625, 0.04935455322265625, 0.0586700439453125, 0.06798553466796875, 0.077301025390625, 0.08661651611328125, 0.0959320068359375, 0.10524749755859375, 0.11456298828125, 0.12387847900390625, 0.1331939697265625, 0.14250946044921875, 0.151824951171875, 0.16114044189453125, 0.1704559326171875, 0.17977142333984375, 0.1890869140625, 0.19840240478515625, 0.2077178955078125, 0.21703338623046875, 0.226348876953125, 0.23566436767578125, 0.2449798583984375, 0.25429534912109375, 0.26361083984375, 0.27292633056640625, 0.2822418212890625, 0.29155731201171875, 0.300872802734375, 0.31018829345703125, 0.3195037841796875, 0.32881927490234375, 0.338134765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 6.0, 6.0, 14.0, 5.0, 13.0, 18.0, 17.0, 32.0, 26.0, 37.0, 35.0, 40.0, 56.0, 60.0, 42.0, 50.0, 43.0, 55.0, 66.0, 53.0, 41.0, 35.0, 33.0, 33.0, 33.0, 21.0, 21.0, 24.0, 10.0, 10.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.341094970703125, -2.25054931640625, -2.160003662109375, -2.0694580078125, -1.978912353515625, -1.88836669921875, -1.797821044921875, -1.707275390625, -1.616729736328125, -1.52618408203125, -1.435638427734375, -1.3450927734375, -1.254547119140625, -1.16400146484375, -1.073455810546875, -0.98291015625, -0.892364501953125, -0.80181884765625, -0.711273193359375, -0.6207275390625, -0.530181884765625, -0.43963623046875, -0.349090576171875, -0.258544921875, -0.167999267578125, -0.07745361328125, 0.013092041015625, 0.1036376953125, 0.194183349609375, 0.28472900390625, 0.375274658203125, 0.4658203125, 0.556365966796875, 0.64691162109375, 0.737457275390625, 0.8280029296875, 0.918548583984375, 1.00909423828125, 1.099639892578125, 1.190185546875, 1.280731201171875, 1.37127685546875, 1.461822509765625, 1.5523681640625, 1.642913818359375, 1.73345947265625, 1.824005126953125, 1.91455078125, 2.005096435546875, 2.09564208984375, 2.186187744140625, 2.2767333984375, 2.367279052734375, 2.45782470703125, 2.548370361328125, 2.638916015625, 2.729461669921875, 2.82000732421875, 2.910552978515625, 3.0010986328125, 3.091644287109375, 3.18218994140625, 3.272735595703125, 3.36328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 9.0, 12.0, 20.0, 24.0, 39.0, 57.0, 97.0, 192.0, 394.0, 981.0, 13344.0, 1023689.0, 8018.0, 880.0, 306.0, 157.0, 104.0, 77.0, 54.0, 26.0, 20.0, 8.0, 9.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.16002655029296875, -0.1553802490234375, -0.15073394775390625, -0.146087646484375, -0.14144134521484375, -0.1367950439453125, -0.13214874267578125, -0.12750244140625, -0.12285614013671875, -0.1182098388671875, -0.11356353759765625, -0.108917236328125, -0.10427093505859375, -0.0996246337890625, -0.09497833251953125, -0.09033203125, -0.08568572998046875, -0.0810394287109375, -0.07639312744140625, -0.071746826171875, -0.06710052490234375, -0.0624542236328125, -0.05780792236328125, -0.05316162109375, -0.04851531982421875, -0.0438690185546875, -0.03922271728515625, -0.034576416015625, -0.02993011474609375, -0.0252838134765625, -0.02063751220703125, -0.0159912109375, -0.01134490966796875, -0.0066986083984375, -0.00205230712890625, 0.002593994140625, 0.00724029541015625, 0.0118865966796875, 0.01653289794921875, 0.02117919921875, 0.02582550048828125, 0.0304718017578125, 0.03511810302734375, 0.039764404296875, 0.04441070556640625, 0.0490570068359375, 0.05370330810546875, 0.058349609375, 0.06299591064453125, 0.0676422119140625, 0.07228851318359375, 0.076934814453125, 0.08158111572265625, 0.0862274169921875, 0.09087371826171875, 0.09552001953125, 0.10016632080078125, 0.1048126220703125, 0.10945892333984375, 0.114105224609375, 0.11875152587890625, 0.1233978271484375, 0.12804412841796875, 0.1326904296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 15.0, 21.0, 20.0, 44.0, 76.0, 169.0, 221.0, 165.0, 114.0, 49.0, 34.0, 17.0, 19.0, 14.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.791615694761276e-05, -5.652569234371185e-05, -5.5135227739810944e-05, -5.3744763135910034e-05, -5.2354298532009125e-05, -5.0963833928108215e-05, -4.9573369324207306e-05, -4.8182904720306396e-05, -4.679244011640549e-05, -4.540197551250458e-05, -4.401151090860367e-05, -4.262104630470276e-05, -4.123058170080185e-05, -3.984011709690094e-05, -3.844965249300003e-05, -3.705918788909912e-05, -3.566872328519821e-05, -3.42782586812973e-05, -3.288779407739639e-05, -3.1497329473495483e-05, -3.0106864869594574e-05, -2.8716400265693665e-05, -2.7325935661792755e-05, -2.5935471057891846e-05, -2.4545006453990936e-05, -2.3154541850090027e-05, -2.1764077246189117e-05, -2.0373612642288208e-05, -1.89831480383873e-05, -1.759268343448639e-05, -1.620221883058548e-05, -1.481175422668457e-05, -1.3421289622783661e-05, -1.2030825018882751e-05, -1.0640360414981842e-05, -9.249895811080933e-06, -7.859431207180023e-06, -6.468966603279114e-06, -5.078501999378204e-06, -3.688037395477295e-06, -2.2975727915763855e-06, -9.071081876754761e-07, 4.833564162254333e-07, 1.8738210201263428e-06, 3.264285624027252e-06, 4.654750227928162e-06, 6.045214831829071e-06, 7.4356794357299805e-06, 8.82614403963089e-06, 1.02166086435318e-05, 1.1607073247432709e-05, 1.2997537851333618e-05, 1.4388002455234528e-05, 1.5778467059135437e-05, 1.7168931663036346e-05, 1.8559396266937256e-05, 1.9949860870838165e-05, 2.1340325474739075e-05, 2.2730790078639984e-05, 2.4121254682540894e-05, 2.5511719286441803e-05, 2.6902183890342712e-05, 2.8292648494243622e-05, 2.968311309814453e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 11.0, 10.0, 22.0, 29.0, 59.0, 73.0, 149.0, 246.0, 413.0, 807.0, 1691.0, 4619.0, 18023.0, 275116.0, 713034.0, 24600.0, 5710.0, 1947.0, 874.0, 485.0, 259.0, 138.0, 95.0, 52.0, 33.0, 24.0, 18.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1229248046875, -0.11951828002929688, -0.11611175537109375, -0.11270523071289062, -0.1092987060546875, -0.10589218139648438, -0.10248565673828125, -0.09907913208007812, -0.095672607421875, -0.09226608276367188, -0.08885955810546875, -0.08545303344726562, -0.0820465087890625, -0.07863998413085938, -0.07523345947265625, -0.07182693481445312, -0.06842041015625, -0.06501388549804688, -0.06160736083984375, -0.058200836181640625, -0.0547943115234375, -0.051387786865234375, -0.04798126220703125, -0.044574737548828125, -0.041168212890625, -0.037761688232421875, -0.03435516357421875, -0.030948638916015625, -0.0275421142578125, -0.024135589599609375, -0.02072906494140625, -0.017322540283203125, -0.013916015625, -0.010509490966796875, -0.00710296630859375, -0.003696441650390625, -0.0002899169921875, 0.003116607666015625, 0.00652313232421875, 0.009929656982421875, 0.013336181640625, 0.016742706298828125, 0.02014923095703125, 0.023555755615234375, 0.0269622802734375, 0.030368804931640625, 0.03377532958984375, 0.037181854248046875, 0.04058837890625, 0.043994903564453125, 0.04740142822265625, 0.050807952880859375, 0.0542144775390625, 0.057621002197265625, 0.06102752685546875, 0.06443405151367188, 0.067840576171875, 0.07124710083007812, 0.07465362548828125, 0.07806015014648438, 0.0814666748046875, 0.08487319946289062, 0.08827972412109375, 0.09168624877929688, 0.0950927734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 9.0, 2.0, 7.0, 3.0, 9.0, 11.0, 16.0, 21.0, 51.0, 96.0, 313.0, 258.0, 96.0, 41.0, 24.0, 18.0, 5.0, 6.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03143310546875, -0.030305862426757812, -0.029178619384765625, -0.028051376342773438, -0.02692413330078125, -0.025796890258789062, -0.024669647216796875, -0.023542404174804688, -0.0224151611328125, -0.021287918090820312, -0.020160675048828125, -0.019033432006835938, -0.01790618896484375, -0.016778945922851562, -0.015651702880859375, -0.014524459838867188, -0.013397216796875, -0.012269973754882812, -0.011142730712890625, -0.010015487670898438, -0.00888824462890625, -0.0077610015869140625, -0.006633758544921875, -0.0055065155029296875, -0.0043792724609375, -0.0032520294189453125, -0.002124786376953125, -0.0009975433349609375, 0.00012969970703125, 0.0012569427490234375, 0.002384185791015625, 0.0035114288330078125, 0.004638671875, 0.0057659149169921875, 0.006893157958984375, 0.008020401000976562, 0.00914764404296875, 0.010274887084960938, 0.011402130126953125, 0.012529373168945312, 0.0136566162109375, 0.014783859252929688, 0.015911102294921875, 0.017038345336914062, 0.01816558837890625, 0.019292831420898438, 0.020420074462890625, 0.021547317504882812, 0.022674560546875, 0.023801803588867188, 0.024929046630859375, 0.026056289672851562, 0.02718353271484375, 0.028310775756835938, 0.029438018798828125, 0.030565261840820312, 0.0316925048828125, 0.03281974792480469, 0.033946990966796875, 0.03507423400878906, 0.03620147705078125, 0.03732872009277344, 0.038455963134765625, 0.03958320617675781, 0.04071044921875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 11.0, 15.0, 22.0, 29.0, 36.0, 72.0, 80.0, 76.0, 126.0, 94.0, 112.0, 96.0, 78.0, 50.0, 22.0, 29.0, 17.0, 8.0, 3.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5251941680908203, -2.455779790878296, -2.3863654136657715, -2.316951274871826, -2.2475368976593018, -2.1781225204467773, -2.108708143234253, -2.0392937660217285, -1.9698795080184937, -1.9004651308059692, -1.8310508728027344, -1.76163649559021, -1.6922221183776855, -1.6228078603744507, -1.5533934831619263, -1.4839792251586914, -1.414564847946167, -1.3451504707336426, -1.2757362127304077, -1.2063218355178833, -1.1369075775146484, -1.067493200302124, -0.9980788230895996, -0.92866450548172, -0.8592501878738403, -0.7898358702659607, -0.720421552658081, -0.6510071754455566, -0.581592857837677, -0.5121785402297974, -0.44276419281959534, -0.3733498454093933, -0.3039356470108032, -0.2345213145017624, -0.16510698199272156, -0.09569264948368073, -0.026278316974639893, 0.043136000633239746, 0.11255034804344177, 0.1819646954536438, 0.25137901306152344, 0.3207933306694031, 0.3902076780796051, 0.45962202548980713, 0.5290363430976868, 0.5984506607055664, 0.6678650379180908, 0.7372793555259705, 0.8066936731338501, 0.8761079907417297, 0.9455223083496094, 1.0149366855621338, 1.0843510627746582, 1.153765320777893, 1.2231796979904175, 1.2925939559936523, 1.3620083332061768, 1.4314227104187012, 1.500836968421936, 1.5702513456344604, 1.6396656036376953, 1.7090799808502197, 1.7784943580627441, 1.8479087352752686, 1.9173229932785034]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 6.0, 26.0, 25.0, 33.0, 47.0, 52.0, 64.0, 74.0, 69.0, 76.0, 69.0, 75.0, 75.0, 59.0, 59.0, 47.0, 40.0, 30.0, 20.0, 13.0, 9.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3186020851135254, -1.2591097354888916, -1.1996172666549683, -1.1401249170303345, -1.0806325674057007, -1.0211400985717773, -0.9616477489471436, -0.9021553993225098, -0.8426629900932312, -0.7831705808639526, -0.7236782312393188, -0.6641858220100403, -0.6046934127807617, -0.5452010631561279, -0.48570865392684937, -0.4262162744998932, -0.366723895072937, -0.30723151564598083, -0.24773912131786346, -0.1882467269897461, -0.12875434756278992, -0.06926196813583374, -0.009769558906555176, 0.049722820520401, 0.10921519994735718, 0.16870757937431335, 0.22819997370243073, 0.2876923680305481, 0.3471847474575043, 0.40667712688446045, 0.466169536113739, 0.5256619453430176, 0.5851542949676514, 0.6446467041969299, 0.7041390538215637, 0.7636314630508423, 0.8231238126754761, 0.8826162219047546, 0.9421086311340332, 1.001600980758667, 1.0610933303833008, 1.1205856800079346, 1.180078148841858, 1.2395704984664917, 1.2990628480911255, 1.3585553169250488, 1.4180476665496826, 1.4775400161743164, 1.5370324850082397, 1.5965248346328735, 1.6560173034667969, 1.7155096530914307, 1.7750020027160645, 1.8344943523406982, 1.8939868211746216, 1.9534791707992554, 2.0129716396331787, 2.0724639892578125, 2.1319563388824463, 2.19144868850708, 2.250941276550293, 2.3104336261749268, 2.3699259757995605, 2.4294183254241943, 2.488910675048828]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 12.0, 23.0, 27.0, 35.0, 42.0, 77.0, 106.0, 136.0, 215.0, 317.0, 439.0, 666.0, 1109.0, 1686.0, 2792.0, 4821.0, 8745.0, 16475.0, 35723.0, 92560.0, 386242.0, 342871.0, 84285.0, 33156.0, 15657.0, 8216.0, 4579.0, 2707.0, 1689.0, 1068.0, 691.0, 413.0, 302.0, 191.0, 131.0, 91.0, 81.0, 57.0, 26.0, 23.0, 16.0, 15.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6640625, -1.6135711669921875, -1.563079833984375, -1.5125885009765625, -1.46209716796875, -1.4116058349609375, -1.361114501953125, -1.3106231689453125, -1.2601318359375, -1.2096405029296875, -1.159149169921875, -1.1086578369140625, -1.05816650390625, -1.0076751708984375, -0.957183837890625, -0.9066925048828125, -0.856201171875, -0.8057098388671875, -0.755218505859375, -0.7047271728515625, -0.65423583984375, -0.6037445068359375, -0.553253173828125, -0.5027618408203125, -0.4522705078125, -0.4017791748046875, -0.351287841796875, -0.3007965087890625, -0.25030517578125, -0.1998138427734375, -0.149322509765625, -0.0988311767578125, -0.04833984375, 0.0021514892578125, 0.052642822265625, 0.1031341552734375, 0.15362548828125, 0.2041168212890625, 0.254608154296875, 0.3050994873046875, 0.3555908203125, 0.4060821533203125, 0.456573486328125, 0.5070648193359375, 0.55755615234375, 0.6080474853515625, 0.658538818359375, 0.7090301513671875, 0.759521484375, 0.8100128173828125, 0.860504150390625, 0.9109954833984375, 0.96148681640625, 1.0119781494140625, 1.062469482421875, 1.1129608154296875, 1.1634521484375, 1.2139434814453125, 1.264434814453125, 1.3149261474609375, 1.36541748046875, 1.4159088134765625, 1.466400146484375, 1.5168914794921875, 1.5673828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 16.0, 14.0, 36.0, 32.0, 41.0, 60.0, 61.0, 65.0, 71.0, 74.0, 65.0, 83.0, 56.0, 70.0, 44.0, 47.0, 41.0, 27.0, 23.0, 18.0, 8.0, 9.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.185882568359375, -3.07293701171875, -2.959991455078125, -2.8470458984375, -2.734100341796875, -2.62115478515625, -2.508209228515625, -2.395263671875, -2.282318115234375, -2.16937255859375, -2.056427001953125, -1.9434814453125, -1.830535888671875, -1.71759033203125, -1.604644775390625, -1.49169921875, -1.378753662109375, -1.26580810546875, -1.152862548828125, -1.0399169921875, -0.926971435546875, -0.81402587890625, -0.701080322265625, -0.588134765625, -0.475189208984375, -0.36224365234375, -0.249298095703125, -0.1363525390625, -0.023406982421875, 0.08953857421875, 0.202484130859375, 0.3154296875, 0.428375244140625, 0.54132080078125, 0.654266357421875, 0.7672119140625, 0.880157470703125, 0.99310302734375, 1.106048583984375, 1.218994140625, 1.331939697265625, 1.44488525390625, 1.557830810546875, 1.6707763671875, 1.783721923828125, 1.89666748046875, 2.009613037109375, 2.12255859375, 2.235504150390625, 2.34844970703125, 2.461395263671875, 2.5743408203125, 2.687286376953125, 2.80023193359375, 2.913177490234375, 3.026123046875, 3.139068603515625, 3.25201416015625, 3.364959716796875, 3.4779052734375, 3.590850830078125, 3.70379638671875, 3.816741943359375, 3.9296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 20.0, 19.0, 51.0, 62.0, 104.0, 218.0, 381.0, 805.0, 2014.0, 5645.0, 21378.0, 112933.0, 762737.0, 111559.0, 21301.0, 5680.0, 1947.0, 821.0, 371.0, 202.0, 118.0, 72.0, 38.0, 22.0, 11.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0], "bins": [-4.62109375, -4.517242431640625, -4.41339111328125, -4.309539794921875, -4.2056884765625, -4.101837158203125, -3.99798583984375, -3.894134521484375, -3.790283203125, -3.686431884765625, -3.58258056640625, -3.478729248046875, -3.3748779296875, -3.271026611328125, -3.16717529296875, -3.063323974609375, -2.95947265625, -2.855621337890625, -2.75177001953125, -2.647918701171875, -2.5440673828125, -2.440216064453125, -2.33636474609375, -2.232513427734375, -2.128662109375, -2.024810791015625, -1.92095947265625, -1.817108154296875, -1.7132568359375, -1.609405517578125, -1.50555419921875, -1.401702880859375, -1.2978515625, -1.194000244140625, -1.09014892578125, -0.986297607421875, -0.8824462890625, -0.778594970703125, -0.67474365234375, -0.570892333984375, -0.467041015625, -0.363189697265625, -0.25933837890625, -0.155487060546875, -0.0516357421875, 0.052215576171875, 0.15606689453125, 0.259918212890625, 0.36376953125, 0.467620849609375, 0.57147216796875, 0.675323486328125, 0.7791748046875, 0.883026123046875, 0.98687744140625, 1.090728759765625, 1.194580078125, 1.298431396484375, 1.40228271484375, 1.506134033203125, 1.6099853515625, 1.713836669921875, 1.81768798828125, 1.921539306640625, 2.025390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 8.0, 7.0, 3.0, 8.0, 9.0, 9.0, 11.0, 20.0, 25.0, 34.0, 36.0, 35.0, 47.0, 40.0, 55.0, 49.0, 66.0, 56.0, 55.0, 59.0, 54.0, 59.0, 45.0, 40.0, 27.0, 28.0, 32.0, 19.0, 18.0, 16.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34765625, -4.21820068359375, -4.0887451171875, -3.95928955078125, -3.829833984375, -3.70037841796875, -3.5709228515625, -3.44146728515625, -3.31201171875, -3.18255615234375, -3.0531005859375, -2.92364501953125, -2.794189453125, -2.66473388671875, -2.5352783203125, -2.40582275390625, -2.2763671875, -2.14691162109375, -2.0174560546875, -1.88800048828125, -1.758544921875, -1.62908935546875, -1.4996337890625, -1.37017822265625, -1.24072265625, -1.11126708984375, -0.9818115234375, -0.85235595703125, -0.722900390625, -0.59344482421875, -0.4639892578125, -0.33453369140625, -0.205078125, -0.07562255859375, 0.0538330078125, 0.18328857421875, 0.312744140625, 0.44219970703125, 0.5716552734375, 0.70111083984375, 0.83056640625, 0.96002197265625, 1.0894775390625, 1.21893310546875, 1.348388671875, 1.47784423828125, 1.6072998046875, 1.73675537109375, 1.8662109375, 1.99566650390625, 2.1251220703125, 2.25457763671875, 2.384033203125, 2.51348876953125, 2.6429443359375, 2.77239990234375, 2.90185546875, 3.03131103515625, 3.1607666015625, 3.29022216796875, 3.419677734375, 3.54913330078125, 3.6785888671875, 3.80804443359375, 3.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 11.0, 5.0, 11.0, 25.0, 24.0, 39.0, 63.0, 95.0, 137.0, 241.0, 471.0, 1007.0, 2280.0, 5677.0, 18008.0, 69757.0, 357520.0, 471756.0, 87746.0, 21825.0, 6731.0, 2611.0, 1174.0, 574.0, 278.0, 151.0, 112.0, 62.0, 43.0, 27.0, 21.0, 11.0, 13.0, 10.0, 12.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.71337890625, -0.69244384765625, -0.6715087890625, -0.65057373046875, -0.629638671875, -0.60870361328125, -0.5877685546875, -0.56683349609375, -0.5458984375, -0.52496337890625, -0.5040283203125, -0.48309326171875, -0.462158203125, -0.44122314453125, -0.4202880859375, -0.39935302734375, -0.37841796875, -0.35748291015625, -0.3365478515625, -0.31561279296875, -0.294677734375, -0.27374267578125, -0.2528076171875, -0.23187255859375, -0.2109375, -0.19000244140625, -0.1690673828125, -0.14813232421875, -0.127197265625, -0.10626220703125, -0.0853271484375, -0.06439208984375, -0.04345703125, -0.02252197265625, -0.0015869140625, 0.01934814453125, 0.040283203125, 0.06121826171875, 0.0821533203125, 0.10308837890625, 0.1240234375, 0.14495849609375, 0.1658935546875, 0.18682861328125, 0.207763671875, 0.22869873046875, 0.2496337890625, 0.27056884765625, 0.29150390625, 0.31243896484375, 0.3333740234375, 0.35430908203125, 0.375244140625, 0.39617919921875, 0.4171142578125, 0.43804931640625, 0.458984375, 0.47991943359375, 0.5008544921875, 0.52178955078125, 0.542724609375, 0.56365966796875, 0.5845947265625, 0.60552978515625, 0.62646484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 8.0, 12.0, 12.0, 18.0, 32.0, 36.0, 48.0, 42.0, 83.0, 118.0, 127.0, 98.0, 84.0, 56.0, 56.0, 30.0, 29.0, 15.0, 12.0, 11.0, 14.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010097026824951172, -9.754952043294907e-05, -9.412877261638641e-05, -9.070802479982376e-05, -8.728727698326111e-05, -8.386652916669846e-05, -8.04457813501358e-05, -7.702503353357315e-05, -7.36042857170105e-05, -7.018353790044785e-05, -6.676279008388519e-05, -6.334204226732254e-05, -5.992129445075989e-05, -5.6500546634197235e-05, -5.307979881763458e-05, -4.965905100107193e-05, -4.623830318450928e-05, -4.2817555367946625e-05, -3.939680755138397e-05, -3.597605973482132e-05, -3.255531191825867e-05, -2.9134564101696014e-05, -2.5713816285133362e-05, -2.229306846857071e-05, -1.8872320652008057e-05, -1.5451572835445404e-05, -1.2030825018882751e-05, -8.610077202320099e-06, -5.189329385757446e-06, -1.7685815691947937e-06, 1.6521662473678589e-06, 5.0729140639305115e-06, 8.493661880493164e-06, 1.1914409697055817e-05, 1.533515751361847e-05, 1.8755905330181122e-05, 2.2176653146743774e-05, 2.5597400963306427e-05, 2.901814877986908e-05, 3.243889659643173e-05, 3.5859644412994385e-05, 3.928039222955704e-05, 4.270114004611969e-05, 4.612188786268234e-05, 4.9542635679244995e-05, 5.296338349580765e-05, 5.63841313123703e-05, 5.980487912893295e-05, 6.32256269454956e-05, 6.664637476205826e-05, 7.006712257862091e-05, 7.348787039518356e-05, 7.690861821174622e-05, 8.032936602830887e-05, 8.375011384487152e-05, 8.717086166143417e-05, 9.059160947799683e-05, 9.401235729455948e-05, 9.743310511112213e-05, 0.00010085385292768478, 0.00010427460074424744, 0.00010769534856081009, 0.00011111609637737274, 0.0001145368441939354, 0.00011795759201049805]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 24.0, 38.0, 71.0, 143.0, 278.0, 608.0, 1494.0, 4389.0, 15382.0, 70665.0, 458457.0, 411332.0, 64713.0, 14231.0, 4074.0, 1425.0, 564.0, 267.0, 125.0, 72.0, 52.0, 20.0, 15.0, 16.0, 5.0, 12.0, 9.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85791015625, -0.8326568603515625, -0.807403564453125, -0.7821502685546875, -0.75689697265625, -0.7316436767578125, -0.706390380859375, -0.6811370849609375, -0.6558837890625, -0.6306304931640625, -0.605377197265625, -0.5801239013671875, -0.55487060546875, -0.5296173095703125, -0.504364013671875, -0.4791107177734375, -0.453857421875, -0.4286041259765625, -0.403350830078125, -0.3780975341796875, -0.35284423828125, -0.3275909423828125, -0.302337646484375, -0.2770843505859375, -0.2518310546875, -0.2265777587890625, -0.201324462890625, -0.1760711669921875, -0.15081787109375, -0.1255645751953125, -0.100311279296875, -0.0750579833984375, -0.0498046875, -0.0245513916015625, 0.000701904296875, 0.0259552001953125, 0.05120849609375, 0.0764617919921875, 0.101715087890625, 0.1269683837890625, 0.1522216796875, 0.1774749755859375, 0.202728271484375, 0.2279815673828125, 0.25323486328125, 0.2784881591796875, 0.303741455078125, 0.3289947509765625, 0.354248046875, 0.3795013427734375, 0.404754638671875, 0.4300079345703125, 0.45526123046875, 0.4805145263671875, 0.505767822265625, 0.5310211181640625, 0.5562744140625, 0.5815277099609375, 0.606781005859375, 0.6320343017578125, 0.65728759765625, 0.6825408935546875, 0.707794189453125, 0.7330474853515625, 0.75830078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 4.0, 8.0, 14.0, 12.0, 18.0, 16.0, 22.0, 28.0, 32.0, 35.0, 49.0, 73.0, 77.0, 122.0, 83.0, 90.0, 54.0, 56.0, 38.0, 25.0, 26.0, 18.0, 13.0, 12.0, 21.0, 9.0, 2.0, 6.0, 4.0, 2.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.37451171875, -0.364105224609375, -0.35369873046875, -0.343292236328125, -0.3328857421875, -0.322479248046875, -0.31207275390625, -0.301666259765625, -0.291259765625, -0.280853271484375, -0.27044677734375, -0.260040283203125, -0.2496337890625, -0.239227294921875, -0.22882080078125, -0.218414306640625, -0.2080078125, -0.197601318359375, -0.18719482421875, -0.176788330078125, -0.1663818359375, -0.155975341796875, -0.14556884765625, -0.135162353515625, -0.124755859375, -0.114349365234375, -0.10394287109375, -0.093536376953125, -0.0831298828125, -0.072723388671875, -0.06231689453125, -0.051910400390625, -0.04150390625, -0.031097412109375, -0.02069091796875, -0.010284423828125, 0.0001220703125, 0.010528564453125, 0.02093505859375, 0.031341552734375, 0.041748046875, 0.052154541015625, 0.06256103515625, 0.072967529296875, 0.0833740234375, 0.093780517578125, 0.10418701171875, 0.114593505859375, 0.125, 0.135406494140625, 0.14581298828125, 0.156219482421875, 0.1666259765625, 0.177032470703125, 0.18743896484375, 0.197845458984375, 0.208251953125, 0.218658447265625, 0.22906494140625, 0.239471435546875, 0.2498779296875, 0.260284423828125, 0.27069091796875, 0.281097412109375, 0.29150390625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 41.0, 407.0, 490.0, 67.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0273895263671875, -3.052302837371826, -2.077216148376465, -1.1021292209625244, -0.12704253196716309, 0.8480443954467773, 1.8231310844421387, 2.7982177734375, 3.7733044624328613, 4.748391151428223, 5.723477840423584, 6.698564529418945, 7.673651695251465, 8.648738861083984, 9.623825073242188, 10.59891128540039, 11.57399845123291, 12.54908561706543, 13.524171829223633, 14.499258995056152, 15.474345207214355, 16.449432373046875, 17.424518585205078, 18.39960479736328, 19.374692916870117, 20.34977912902832, 21.324867248535156, 22.29995346069336, 23.275039672851562, 24.250125885009766, 25.2252140045166, 26.200300216674805, 27.175386428833008, 28.15047264099121, 29.125560760498047, 30.10064697265625, 31.075733184814453, 32.050819396972656, 33.02590560913086, 34.00099182128906, 34.97608184814453, 35.951168060302734, 36.92625427246094, 37.90134048461914, 38.87643051147461, 39.85151672363281, 40.826602935791016, 41.80168914794922, 42.77677536010742, 43.751861572265625, 44.72694778442383, 45.70203399658203, 46.6771240234375, 47.6522102355957, 48.627296447753906, 49.60238265991211, 50.57746887207031, 51.552555084228516, 52.52764129638672, 53.50272750854492, 54.47781753540039, 55.452903747558594, 56.4279899597168, 57.403076171875, 58.3781623840332]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 12.0, 8.0, 9.0, 24.0, 17.0, 25.0, 21.0, 27.0, 24.0, 43.0, 24.0, 27.0, 35.0, 34.0, 47.0, 44.0, 37.0, 32.0, 33.0, 34.0, 41.0, 36.0, 46.0, 35.0, 33.0, 28.0, 18.0, 24.0, 25.0, 22.0, 27.0, 19.0, 17.0, 11.0, 10.0, 3.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.838257312774658, -5.665676116943359, -5.4930949211120605, -5.320513725280762, -5.147933006286621, -4.975351810455322, -4.802770614624023, -4.630189418792725, -4.457608222961426, -4.285027027130127, -4.112445831298828, -3.9398648738861084, -3.7672836780548096, -3.5947024822235107, -3.422121524810791, -3.249540328979492, -3.0769591331481934, -2.9043779373168945, -2.7317967414855957, -2.559215784072876, -2.386634588241577, -2.2140533924102783, -2.0414724349975586, -1.8688912391662598, -1.696310043334961, -1.523728847503662, -1.3511477708816528, -1.1785666942596436, -1.0059854984283447, -0.8334043622016907, -0.6608232259750366, -0.48824214935302734, -0.3156609535217285, -0.14307981729507446, 0.02950131893157959, 0.20208245515823364, 0.3746635913848877, 0.5472447276115417, 0.7198258638381958, 0.8924069404602051, 1.064988136291504, 1.2375693321228027, 1.410150408744812, 1.5827314853668213, 1.7553126811981201, 1.927893877029419, 2.1004748344421387, 2.2730560302734375, 2.4456372261047363, 2.618218421936035, 2.790799617767334, 2.9633805751800537, 3.1359617710113525, 3.3085429668426514, 3.481123924255371, 3.65370512008667, 3.8262863159179688, 3.9988675117492676, 4.171448707580566, 4.344029903411865, 4.516611099243164, 4.689191818237305, 4.8617730140686035, 5.034354209899902, 5.206935405731201]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 5.0, 10.0, 22.0, 20.0, 38.0, 51.0, 78.0, 130.0, 407.0, 1600.0, 11294.0, 458804.0, 3682739.0, 34607.0, 3283.0, 702.0, 221.0, 82.0, 65.0, 47.0, 31.0, 14.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.8817138671875, -4.661865234375, -4.4420166015625, -4.22216796875, -4.0023193359375, -3.782470703125, -3.5626220703125, -3.3427734375, -3.1229248046875, -2.903076171875, -2.6832275390625, -2.46337890625, -2.2435302734375, -2.023681640625, -1.8038330078125, -1.583984375, -1.3641357421875, -1.144287109375, -0.9244384765625, -0.70458984375, -0.4847412109375, -0.264892578125, -0.0450439453125, 0.1748046875, 0.3946533203125, 0.614501953125, 0.8343505859375, 1.05419921875, 1.2740478515625, 1.493896484375, 1.7137451171875, 1.93359375, 2.1534423828125, 2.373291015625, 2.5931396484375, 2.81298828125, 3.0328369140625, 3.252685546875, 3.4725341796875, 3.6923828125, 3.9122314453125, 4.132080078125, 4.3519287109375, 4.57177734375, 4.7916259765625, 5.011474609375, 5.2313232421875, 5.451171875, 5.6710205078125, 5.890869140625, 6.1107177734375, 6.33056640625, 6.5504150390625, 6.770263671875, 6.9901123046875, 7.2099609375, 7.4298095703125, 7.649658203125, 7.8695068359375, 8.08935546875, 8.3092041015625, 8.529052734375, 8.7489013671875, 8.96875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 1.0, 6.0, 10.0, 13.0, 17.0, 27.0, 32.0, 38.0, 58.0, 38.0, 57.0, 74.0, 69.0, 74.0, 68.0, 73.0, 60.0, 61.0, 47.0, 44.0, 34.0, 27.0, 30.0, 10.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4636077880859375, -1.412567138671875, -1.3615264892578125, -1.31048583984375, -1.2594451904296875, -1.208404541015625, -1.1573638916015625, -1.1063232421875, -1.0552825927734375, -1.004241943359375, -0.9532012939453125, -0.90216064453125, -0.8511199951171875, -0.800079345703125, -0.7490386962890625, -0.697998046875, -0.6469573974609375, -0.595916748046875, -0.5448760986328125, -0.49383544921875, -0.4427947998046875, -0.391754150390625, -0.3407135009765625, -0.2896728515625, -0.2386322021484375, -0.187591552734375, -0.1365509033203125, -0.08551025390625, -0.0344696044921875, 0.016571044921875, 0.0676116943359375, 0.11865234375, 0.1696929931640625, 0.220733642578125, 0.2717742919921875, 0.32281494140625, 0.3738555908203125, 0.424896240234375, 0.4759368896484375, 0.5269775390625, 0.5780181884765625, 0.629058837890625, 0.6800994873046875, 0.73114013671875, 0.7821807861328125, 0.833221435546875, 0.8842620849609375, 0.935302734375, 0.9863433837890625, 1.037384033203125, 1.0884246826171875, 1.13946533203125, 1.1905059814453125, 1.241546630859375, 1.2925872802734375, 1.3436279296875, 1.3946685791015625, 1.445709228515625, 1.4967498779296875, 1.54779052734375, 1.5988311767578125, 1.649871826171875, 1.7009124755859375, 1.751953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 12.0, 21.0, 23.0, 43.0, 58.0, 96.0, 139.0, 271.0, 652.0, 1904.0, 9090.0, 76131.0, 2773924.0, 1277031.0, 45817.0, 6301.0, 1575.0, 546.0, 263.0, 141.0, 61.0, 50.0, 33.0, 20.0, 21.0, 6.0, 11.0, 4.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.02734375, -3.87762451171875, -3.7279052734375, -3.57818603515625, -3.428466796875, -3.27874755859375, -3.1290283203125, -2.97930908203125, -2.82958984375, -2.67987060546875, -2.5301513671875, -2.38043212890625, -2.230712890625, -2.08099365234375, -1.9312744140625, -1.78155517578125, -1.6318359375, -1.48211669921875, -1.3323974609375, -1.18267822265625, -1.032958984375, -0.88323974609375, -0.7335205078125, -0.58380126953125, -0.43408203125, -0.28436279296875, -0.1346435546875, 0.01507568359375, 0.164794921875, 0.31451416015625, 0.4642333984375, 0.61395263671875, 0.763671875, 0.91339111328125, 1.0631103515625, 1.21282958984375, 1.362548828125, 1.51226806640625, 1.6619873046875, 1.81170654296875, 1.96142578125, 2.11114501953125, 2.2608642578125, 2.41058349609375, 2.560302734375, 2.71002197265625, 2.8597412109375, 3.00946044921875, 3.1591796875, 3.30889892578125, 3.4586181640625, 3.60833740234375, 3.758056640625, 3.90777587890625, 4.0574951171875, 4.20721435546875, 4.35693359375, 4.50665283203125, 4.6563720703125, 4.80609130859375, 4.955810546875, 5.10552978515625, 5.2552490234375, 5.40496826171875, 5.5546875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 12.0, 18.0, 27.0, 25.0, 57.0, 85.0, 113.0, 191.0, 228.0, 368.0, 549.0, 690.0, 518.0, 395.0, 228.0, 168.0, 105.0, 77.0, 50.0, 43.0, 30.0, 21.0, 19.0, 6.0, 9.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0788192749023438, -1.0492401123046875, -1.0196609497070312, -0.990081787109375, -0.9605026245117188, -0.9309234619140625, -0.9013442993164062, -0.87176513671875, -0.8421859741210938, -0.8126068115234375, -0.7830276489257812, -0.753448486328125, -0.7238693237304688, -0.6942901611328125, -0.6647109985351562, -0.6351318359375, -0.6055526733398438, -0.5759735107421875, -0.5463943481445312, -0.516815185546875, -0.48723602294921875, -0.4576568603515625, -0.42807769775390625, -0.39849853515625, -0.36891937255859375, -0.3393402099609375, -0.30976104736328125, -0.280181884765625, -0.25060272216796875, -0.2210235595703125, -0.19144439697265625, -0.161865234375, -0.13228607177734375, -0.1027069091796875, -0.07312774658203125, -0.043548583984375, -0.01396942138671875, 0.0156097412109375, 0.04518890380859375, 0.07476806640625, 0.10434722900390625, 0.1339263916015625, 0.16350555419921875, 0.193084716796875, 0.22266387939453125, 0.2522430419921875, 0.28182220458984375, 0.3114013671875, 0.34098052978515625, 0.3705596923828125, 0.40013885498046875, 0.429718017578125, 0.45929718017578125, 0.4888763427734375, 0.5184555053710938, 0.54803466796875, 0.5776138305664062, 0.6071929931640625, 0.6367721557617188, 0.666351318359375, 0.6959304809570312, 0.7255096435546875, 0.7550888061523438, 0.78466796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 11.0, 29.0, 31.0, 36.0, 54.0, 66.0, 67.0, 86.0, 85.0, 90.0, 92.0, 67.0, 54.0, 52.0, 46.0, 28.0, 31.0, 15.0, 13.0, 10.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7800548076629639, -1.679813027381897, -1.57957124710083, -1.4793293476104736, -1.3790875673294067, -1.2788457870483398, -1.1786038875579834, -1.0783621072769165, -0.9781203269958496, -0.8778785467147827, -0.777636706829071, -0.6773948669433594, -0.5771530866622925, -0.4769113063812256, -0.3766694664955139, -0.27642762660980225, -0.17618584632873535, -0.07594403624534607, 0.024297773838043213, 0.1245395839214325, 0.22478139400482178, 0.32502317428588867, 0.42526501417160034, 0.525506854057312, 0.6257486343383789, 0.7259904146194458, 0.8262322545051575, 0.9264740943908691, 1.026715874671936, 1.126957654953003, 1.2271995544433594, 1.3274413347244263, 1.4276833534240723, 1.5279251337051392, 1.628166913986206, 1.7284088134765625, 1.8286505937576294, 1.9288923740386963, 2.0291342735290527, 2.12937593460083, 2.2296178340911865, 2.329859733581543, 2.4301013946533203, 2.5303432941436768, 2.630585193634033, 2.7308268547058105, 2.831068754196167, 2.9313106536865234, 3.031552314758301, 3.1317942142486572, 3.2320358753204346, 3.332277774810791, 3.4325194358825684, 3.532761335372925, 3.6330032348632812, 3.7332448959350586, 3.833486795425415, 3.9337286949157715, 4.033970355987549, 4.134212017059326, 4.234454154968262, 4.334695816040039, 4.434937477111816, 4.535179615020752, 4.635421276092529]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 9.0, 12.0, 9.0, 18.0, 20.0, 18.0, 24.0, 34.0, 35.0, 25.0, 44.0, 45.0, 49.0, 34.0, 43.0, 36.0, 45.0, 45.0, 59.0, 40.0, 33.0, 38.0, 37.0, 43.0, 21.0, 32.0, 22.0, 20.0, 17.0, 11.0, 6.0, 14.0, 10.0, 3.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4243059158325195, -1.3674544095993042, -1.3106030225753784, -1.253751516342163, -1.1969001293182373, -1.140048623085022, -1.0831971168518066, -1.0263457298278809, -0.9694942235946655, -0.912642776966095, -0.8557913303375244, -0.7989398241043091, -0.7420883774757385, -0.685236930847168, -0.6283854842185974, -0.5715340375900269, -0.5146825909614563, -0.45783114433288574, -0.4009796679019928, -0.34412822127342224, -0.2872767448425293, -0.23042529821395874, -0.17357385158538818, -0.11672237515449524, -0.05987092852592468, -0.0030194707214832306, 0.05383198708295822, 0.11068344116210938, 0.16753490269184113, 0.22438636422157288, 0.28123781085014343, 0.3380892872810364, 0.39494073390960693, 0.4517921805381775, 0.508643627166748, 0.5654951333999634, 0.6223465800285339, 0.6791980266571045, 0.736049473285675, 0.7929009199142456, 0.8497524261474609, 0.9066038727760315, 0.963455319404602, 1.0203068256378174, 1.0771582126617432, 1.1340097188949585, 1.1908612251281738, 1.2477126121520996, 1.3045639991760254, 1.3614155054092407, 1.4182668924331665, 1.4751183986663818, 1.5319697856903076, 1.588821291923523, 1.6456727981567383, 1.702524185180664, 1.7593756914138794, 1.8162271976470947, 1.8730785846710205, 1.9299300909042358, 1.9867814779281616, 2.043632984161377, 2.1004843711853027, 2.1573359966278076, 2.2141873836517334]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 10.0, 12.0, 19.0, 18.0, 32.0, 55.0, 64.0, 126.0, 190.0, 305.0, 506.0, 1159.0, 7431.0, 843226.0, 190102.0, 3215.0, 951.0, 388.0, 251.0, 159.0, 98.0, 67.0, 52.0, 26.0, 23.0, 18.0, 12.0, 14.0, 4.0, 3.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9079055786132812, -0.8802642822265625, -0.8526229858398438, -0.824981689453125, -0.7973403930664062, -0.7696990966796875, -0.7420578002929688, -0.71441650390625, -0.6867752075195312, -0.6591339111328125, -0.6314926147460938, -0.603851318359375, -0.5762100219726562, -0.5485687255859375, -0.5209274291992188, -0.4932861328125, -0.46564483642578125, -0.4380035400390625, -0.41036224365234375, -0.382720947265625, -0.35507965087890625, -0.3274383544921875, -0.29979705810546875, -0.27215576171875, -0.24451446533203125, -0.2168731689453125, -0.18923187255859375, -0.161590576171875, -0.13394927978515625, -0.1063079833984375, -0.07866668701171875, -0.051025390625, -0.02338409423828125, 0.0042572021484375, 0.03189849853515625, 0.059539794921875, 0.08718109130859375, 0.1148223876953125, 0.14246368408203125, 0.17010498046875, 0.19774627685546875, 0.2253875732421875, 0.25302886962890625, 0.280670166015625, 0.30831146240234375, 0.3359527587890625, 0.36359405517578125, 0.3912353515625, 0.41887664794921875, 0.4465179443359375, 0.47415924072265625, 0.501800537109375, 0.5294418334960938, 0.5570831298828125, 0.5847244262695312, 0.61236572265625, 0.6400070190429688, 0.6676483154296875, 0.6952896118164062, 0.722930908203125, 0.7505722045898438, 0.7782135009765625, 0.8058547973632812, 0.83349609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 5.0, 7.0, 14.0, 15.0, 12.0, 15.0, 27.0, 20.0, 35.0, 44.0, 53.0, 47.0, 65.0, 57.0, 72.0, 64.0, 55.0, 65.0, 58.0, 63.0, 47.0, 34.0, 29.0, 30.0, 21.0, 11.0, 11.0, 10.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.71929931640625, -1.6641845703125, -1.60906982421875, -1.553955078125, -1.49884033203125, -1.4437255859375, -1.38861083984375, -1.33349609375, -1.27838134765625, -1.2232666015625, -1.16815185546875, -1.113037109375, -1.05792236328125, -1.0028076171875, -0.94769287109375, -0.892578125, -0.83746337890625, -0.7823486328125, -0.72723388671875, -0.672119140625, -0.61700439453125, -0.5618896484375, -0.50677490234375, -0.45166015625, -0.39654541015625, -0.3414306640625, -0.28631591796875, -0.231201171875, -0.17608642578125, -0.1209716796875, -0.06585693359375, -0.0107421875, 0.04437255859375, 0.0994873046875, 0.15460205078125, 0.209716796875, 0.26483154296875, 0.3199462890625, 0.37506103515625, 0.43017578125, 0.48529052734375, 0.5404052734375, 0.59552001953125, 0.650634765625, 0.70574951171875, 0.7608642578125, 0.81597900390625, 0.87109375, 0.92620849609375, 0.9813232421875, 1.03643798828125, 1.091552734375, 1.14666748046875, 1.2017822265625, 1.25689697265625, 1.31201171875, 1.36712646484375, 1.4222412109375, 1.47735595703125, 1.532470703125, 1.58758544921875, 1.6427001953125, 1.69781494140625, 1.7529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 8.0, 5.0, 3.0, 4.0, 5.0, 14.0, 12.0, 7.0, 24.0, 20.0, 32.0, 30.0, 48.0, 53.0, 84.0, 90.0, 129.0, 138.0, 218.0, 351.0, 558.0, 1521.0, 7984.0, 79778.0, 764801.0, 175249.0, 13520.0, 1907.0, 638.0, 338.0, 222.0, 199.0, 150.0, 108.0, 71.0, 60.0, 43.0, 26.0, 31.0, 29.0, 17.0, 9.0, 11.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.32958984375, -0.32007598876953125, -0.3105621337890625, -0.30104827880859375, -0.291534423828125, -0.28202056884765625, -0.2725067138671875, -0.26299285888671875, -0.25347900390625, -0.24396514892578125, -0.2344512939453125, -0.22493743896484375, -0.215423583984375, -0.20590972900390625, -0.1963958740234375, -0.18688201904296875, -0.1773681640625, -0.16785430908203125, -0.1583404541015625, -0.14882659912109375, -0.139312744140625, -0.12979888916015625, -0.1202850341796875, -0.11077117919921875, -0.10125732421875, -0.09174346923828125, -0.0822296142578125, -0.07271575927734375, -0.063201904296875, -0.05368804931640625, -0.0441741943359375, -0.03466033935546875, -0.025146484375, -0.01563262939453125, -0.0061187744140625, 0.00339508056640625, 0.012908935546875, 0.02242279052734375, 0.0319366455078125, 0.04145050048828125, 0.05096435546875, 0.06047821044921875, 0.0699920654296875, 0.07950592041015625, 0.089019775390625, 0.09853363037109375, 0.1080474853515625, 0.11756134033203125, 0.1270751953125, 0.13658905029296875, 0.1461029052734375, 0.15561676025390625, 0.165130615234375, 0.17464447021484375, 0.1841583251953125, 0.19367218017578125, 0.20318603515625, 0.21269989013671875, 0.2222137451171875, 0.23172760009765625, 0.241241455078125, 0.25075531005859375, 0.2602691650390625, 0.26978302001953125, 0.279296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 4.0, 5.0, 5.0, 9.0, 15.0, 9.0, 13.0, 13.0, 22.0, 29.0, 22.0, 29.0, 44.0, 47.0, 35.0, 47.0, 41.0, 42.0, 31.0, 55.0, 46.0, 31.0, 53.0, 40.0, 33.0, 32.0, 37.0, 27.0, 38.0, 15.0, 24.0, 21.0, 19.0, 12.0, 11.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.913818359375, -2.82177734375, -2.729736328125, -2.6376953125, -2.545654296875, -2.45361328125, -2.361572265625, -2.26953125, -2.177490234375, -2.08544921875, -1.993408203125, -1.9013671875, -1.809326171875, -1.71728515625, -1.625244140625, -1.533203125, -1.441162109375, -1.34912109375, -1.257080078125, -1.1650390625, -1.072998046875, -0.98095703125, -0.888916015625, -0.796875, -0.704833984375, -0.61279296875, -0.520751953125, -0.4287109375, -0.336669921875, -0.24462890625, -0.152587890625, -0.060546875, 0.031494140625, 0.12353515625, 0.215576171875, 0.3076171875, 0.399658203125, 0.49169921875, 0.583740234375, 0.67578125, 0.767822265625, 0.85986328125, 0.951904296875, 1.0439453125, 1.135986328125, 1.22802734375, 1.320068359375, 1.412109375, 1.504150390625, 1.59619140625, 1.688232421875, 1.7802734375, 1.872314453125, 1.96435546875, 2.056396484375, 2.1484375, 2.240478515625, 2.33251953125, 2.424560546875, 2.5166015625, 2.608642578125, 2.70068359375, 2.792724609375, 2.884765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 6.0, 10.0, 6.0, 12.0, 20.0, 37.0, 75.0, 186.0, 671.0, 6441.0, 1037429.0, 2890.0, 471.0, 165.0, 69.0, 19.0, 11.0, 11.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.34814453125, -0.33930397033691406, -0.3304634094238281, -0.3216228485107422, -0.31278228759765625, -0.3039417266845703, -0.2951011657714844, -0.28626060485839844, -0.2774200439453125, -0.26857948303222656, -0.2597389221191406, -0.2508983612060547, -0.24205780029296875, -0.2332172393798828, -0.22437667846679688, -0.21553611755371094, -0.206695556640625, -0.19785499572753906, -0.18901443481445312, -0.1801738739013672, -0.17133331298828125, -0.1624927520751953, -0.15365219116210938, -0.14481163024902344, -0.1359710693359375, -0.12713050842285156, -0.11828994750976562, -0.10944938659667969, -0.10060882568359375, -0.09176826477050781, -0.08292770385742188, -0.07408714294433594, -0.06524658203125, -0.05640602111816406, -0.047565460205078125, -0.03872489929199219, -0.02988433837890625, -0.021043777465820312, -0.012203216552734375, -0.0033626556396484375, 0.0054779052734375, 0.014318466186523438, 0.023159027099609375, 0.03199958801269531, 0.04084014892578125, 0.04968070983886719, 0.058521270751953125, 0.06736183166503906, 0.076202392578125, 0.08504295349121094, 0.09388351440429688, 0.10272407531738281, 0.11156463623046875, 0.12040519714355469, 0.12924575805664062, 0.13808631896972656, 0.1469268798828125, 0.15576744079589844, 0.16460800170898438, 0.1734485626220703, 0.18228912353515625, 0.1911296844482422, 0.19997024536132812, 0.20881080627441406, 0.2176513671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 9.0, 11.0, 30.0, 44.0, 62.0, 64.0, 89.0, 116.0, 130.0, 113.0, 97.0, 56.0, 44.0, 30.0, 20.0, 14.0, 13.0, 11.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.653764724731445e-05, -3.540609031915665e-05, -3.427453339099884e-05, -3.3142976462841034e-05, -3.201141953468323e-05, -3.087986260652542e-05, -2.9748305678367615e-05, -2.861674875020981e-05, -2.7485191822052002e-05, -2.6353634893894196e-05, -2.522207796573639e-05, -2.4090521037578583e-05, -2.2958964109420776e-05, -2.182740718126297e-05, -2.0695850253105164e-05, -1.9564293324947357e-05, -1.843273639678955e-05, -1.7301179468631744e-05, -1.6169622540473938e-05, -1.5038065612316132e-05, -1.3906508684158325e-05, -1.2774951756000519e-05, -1.1643394827842712e-05, -1.0511837899684906e-05, -9.3802809715271e-06, -8.248724043369293e-06, -7.117167115211487e-06, -5.98561018705368e-06, -4.854053258895874e-06, -3.7224963307380676e-06, -2.5909394025802612e-06, -1.4593824744224548e-06, -3.2782554626464844e-07, 8.03731381893158e-07, 1.9352883100509644e-06, 3.0668452382087708e-06, 4.198402166366577e-06, 5.3299590945243835e-06, 6.46151602268219e-06, 7.593072950839996e-06, 8.724629878997803e-06, 9.856186807155609e-06, 1.0987743735313416e-05, 1.2119300663471222e-05, 1.3250857591629028e-05, 1.4382414519786835e-05, 1.551397144794464e-05, 1.6645528376102448e-05, 1.7777085304260254e-05, 1.890864223241806e-05, 2.0040199160575867e-05, 2.1171756088733673e-05, 2.230331301689148e-05, 2.3434869945049286e-05, 2.4566426873207092e-05, 2.56979838013649e-05, 2.6829540729522705e-05, 2.796109765768051e-05, 2.9092654585838318e-05, 3.0224211513996124e-05, 3.135576844215393e-05, 3.248732537031174e-05, 3.3618882298469543e-05, 3.475043922662735e-05, 3.5881996154785156e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 15.0, 28.0, 30.0, 50.0, 66.0, 91.0, 123.0, 219.0, 314.0, 618.0, 1166.0, 2606.0, 6880.0, 25681.0, 762661.0, 219558.0, 18314.0, 5669.0, 2179.0, 1010.0, 487.0, 278.0, 170.0, 111.0, 79.0, 42.0, 29.0, 18.0, 16.0, 8.0, 9.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10711669921875, -0.1034078598022461, -0.09969902038574219, -0.09599018096923828, -0.09228134155273438, -0.08857250213623047, -0.08486366271972656, -0.08115482330322266, -0.07744598388671875, -0.07373714447021484, -0.07002830505371094, -0.06631946563720703, -0.06261062622070312, -0.05890178680419922, -0.05519294738769531, -0.051484107971191406, -0.0477752685546875, -0.044066429138183594, -0.04035758972167969, -0.03664875030517578, -0.032939910888671875, -0.02923107147216797, -0.025522232055664062, -0.021813392639160156, -0.01810455322265625, -0.014395713806152344, -0.010686874389648438, -0.006978034973144531, -0.003269195556640625, 0.00043964385986328125, 0.0041484832763671875, 0.007857322692871094, 0.011566162109375, 0.015275001525878906, 0.018983840942382812, 0.02269268035888672, 0.026401519775390625, 0.03011035919189453, 0.03381919860839844, 0.037528038024902344, 0.04123687744140625, 0.044945716857910156, 0.04865455627441406, 0.05236339569091797, 0.056072235107421875, 0.05978107452392578, 0.06348991394042969, 0.0671987533569336, 0.0709075927734375, 0.0746164321899414, 0.07832527160644531, 0.08203411102294922, 0.08574295043945312, 0.08945178985595703, 0.09316062927246094, 0.09686946868896484, 0.10057830810546875, 0.10428714752197266, 0.10799598693847656, 0.11170482635498047, 0.11541366577148438, 0.11912250518798828, 0.12283134460449219, 0.1265401840209961, 0.1302490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 11.0, 26.0, 47.0, 295.0, 449.0, 78.0, 36.0, 10.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061279296875, -0.05953407287597656, -0.057788848876953125, -0.05604362487792969, -0.05429840087890625, -0.05255317687988281, -0.050807952880859375, -0.04906272888183594, -0.0473175048828125, -0.04557228088378906, -0.043827056884765625, -0.04208183288574219, -0.04033660888671875, -0.03859138488769531, -0.036846160888671875, -0.03510093688964844, -0.033355712890625, -0.03161048889160156, -0.029865264892578125, -0.028120040893554688, -0.02637481689453125, -0.024629592895507812, -0.022884368896484375, -0.021139144897460938, -0.0193939208984375, -0.017648696899414062, -0.015903472900390625, -0.014158248901367188, -0.01241302490234375, -0.010667800903320312, -0.008922576904296875, -0.0071773529052734375, -0.00543212890625, -0.0036869049072265625, -0.001941680908203125, -0.0001964569091796875, 0.00154876708984375, 0.0032939910888671875, 0.005039215087890625, 0.0067844390869140625, 0.0085296630859375, 0.010274887084960938, 0.012020111083984375, 0.013765335083007812, 0.01551055908203125, 0.017255783081054688, 0.019001007080078125, 0.020746231079101562, 0.022491455078125, 0.024236679077148438, 0.025981903076171875, 0.027727127075195312, 0.02947235107421875, 0.031217575073242188, 0.032962799072265625, 0.03470802307128906, 0.0364532470703125, 0.03819847106933594, 0.039943695068359375, 0.04168891906738281, 0.04343414306640625, 0.04517936706542969, 0.046924591064453125, 0.04866981506347656, 0.0504150390625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 5.0, 6.0, 12.0, 21.0, 22.0, 21.0, 24.0, 32.0, 33.0, 30.0, 46.0, 51.0, 50.0, 54.0, 44.0, 60.0, 50.0, 42.0, 45.0, 38.0, 45.0, 33.0, 31.0, 28.0, 25.0, 15.0, 27.0, 16.0, 18.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1751829385757446, -1.1364110708236694, -1.0976390838623047, -1.0588672161102295, -1.0200952291488647, -0.9813233613967896, -0.9425514340400696, -0.9037795066833496, -0.8650075793266296, -0.8262356519699097, -0.7874637246131897, -0.7486917972564697, -0.7099199295043945, -0.6711479425430298, -0.6323760747909546, -0.5936041474342346, -0.5548322200775146, -0.5160602927207947, -0.4772883653640747, -0.4385164678096771, -0.39974454045295715, -0.3609726130962372, -0.3222007155418396, -0.28342878818511963, -0.24465686082839966, -0.2058849334716797, -0.1671130210161209, -0.12834110856056213, -0.08956918120384216, -0.05079725384712219, -0.012025341391563416, 0.02674657106399536, 0.06551837921142578, 0.10429029911756516, 0.14306221902370453, 0.1818341314792633, 0.22060605883598328, 0.25937798619270325, 0.29814988374710083, 0.3369218111038208, 0.37569373846054077, 0.41446566581726074, 0.4532375931739807, 0.4920094907283783, 0.5307813882827759, 0.5695533752441406, 0.6083252429962158, 0.6470971703529358, 0.6858690977096558, 0.7246410250663757, 0.7634129524230957, 0.8021848797798157, 0.8409568071365356, 0.8797286748886108, 0.9185006022453308, 0.9572725296020508, 0.9960444569587708, 1.0348163843154907, 1.073588252067566, 1.1123602390289307, 1.1511321067810059, 1.1899040937423706, 1.2286759614944458, 1.2674479484558105, 1.3062198162078857]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 4.0, 6.0, 7.0, 11.0, 11.0, 10.0, 19.0, 24.0, 26.0, 28.0, 34.0, 29.0, 44.0, 49.0, 54.0, 53.0, 39.0, 70.0, 49.0, 54.0, 44.0, 48.0, 46.0, 42.0, 42.0, 26.0, 28.0, 27.0, 15.0, 17.0, 8.0, 11.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2294435501098633, -1.185463309288025, -1.1414830684661865, -1.0975029468536377, -1.0535227060317993, -1.009542465209961, -0.9655622839927673, -0.9215821027755737, -0.8776018619537354, -0.833621621131897, -0.7896414399147034, -0.7456612586975098, -0.7016810178756714, -0.657700777053833, -0.6137205958366394, -0.5697404146194458, -0.5257601737976074, -0.48177996277809143, -0.43779975175857544, -0.39381954073905945, -0.34983932971954346, -0.30585911870002747, -0.2618789076805115, -0.21789869666099548, -0.1739184856414795, -0.1299382746219635, -0.08595806360244751, -0.04197785258293152, 0.0020023584365844727, 0.045982569456100464, 0.08996278047561646, 0.13394299149513245, 0.1779230833053589, 0.22190329432487488, 0.26588350534439087, 0.30986371636390686, 0.35384392738342285, 0.39782413840293884, 0.44180434942245483, 0.4857845604419708, 0.5297647714614868, 0.5737450122833252, 0.6177251935005188, 0.6617053747177124, 0.7056856155395508, 0.7496658563613892, 0.7936460375785828, 0.8376262187957764, 0.8816064596176147, 0.9255867004394531, 0.9695668816566467, 1.0135470628738403, 1.0575273036956787, 1.101507544517517, 1.1454877853393555, 1.1894679069519043, 1.2334481477737427, 1.277428388595581, 1.3214085102081299, 1.3653887510299683, 1.4093689918518066, 1.453349232673645, 1.4973294734954834, 1.5413095951080322, 1.5852898359298706]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 18.0, 18.0, 11.0, 24.0, 35.0, 42.0, 75.0, 106.0, 149.0, 240.0, 355.0, 598.0, 948.0, 1705.0, 2855.0, 5459.0, 11061.0, 25231.0, 69582.0, 221988.0, 419815.0, 185975.0, 58595.0, 22240.0, 9772.0, 5060.0, 2603.0, 1502.0, 890.0, 548.0, 309.0, 215.0, 153.0, 96.0, 70.0, 58.0, 27.0, 24.0, 29.0, 8.0, 14.0, 13.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5902099609375, -1.530029296875, -1.4698486328125, -1.40966796875, -1.3494873046875, -1.289306640625, -1.2291259765625, -1.1689453125, -1.1087646484375, -1.048583984375, -0.9884033203125, -0.92822265625, -0.8680419921875, -0.807861328125, -0.7476806640625, -0.6875, -0.6273193359375, -0.567138671875, -0.5069580078125, -0.44677734375, -0.3865966796875, -0.326416015625, -0.2662353515625, -0.2060546875, -0.1458740234375, -0.085693359375, -0.0255126953125, 0.03466796875, 0.0948486328125, 0.155029296875, 0.2152099609375, 0.275390625, 0.3355712890625, 0.395751953125, 0.4559326171875, 0.51611328125, 0.5762939453125, 0.636474609375, 0.6966552734375, 0.7568359375, 0.8170166015625, 0.877197265625, 0.9373779296875, 0.99755859375, 1.0577392578125, 1.117919921875, 1.1781005859375, 1.23828125, 1.2984619140625, 1.358642578125, 1.4188232421875, 1.47900390625, 1.5391845703125, 1.599365234375, 1.6595458984375, 1.7197265625, 1.7799072265625, 1.840087890625, 1.9002685546875, 1.96044921875, 2.0206298828125, 2.080810546875, 2.1409912109375, 2.201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 5.0, 2.0, 2.0, 4.0, 13.0, 21.0, 17.0, 22.0, 22.0, 24.0, 31.0, 43.0, 47.0, 49.0, 49.0, 56.0, 60.0, 49.0, 72.0, 60.0, 62.0, 40.0, 39.0, 31.0, 45.0, 33.0, 27.0, 17.0, 12.0, 11.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.655426025390625, -2.57061767578125, -2.485809326171875, -2.4010009765625, -2.316192626953125, -2.23138427734375, -2.146575927734375, -2.061767578125, -1.976959228515625, -1.89215087890625, -1.807342529296875, -1.7225341796875, -1.637725830078125, -1.55291748046875, -1.468109130859375, -1.38330078125, -1.298492431640625, -1.21368408203125, -1.128875732421875, -1.0440673828125, -0.959259033203125, -0.87445068359375, -0.789642333984375, -0.704833984375, -0.620025634765625, -0.53521728515625, -0.450408935546875, -0.3656005859375, -0.280792236328125, -0.19598388671875, -0.111175537109375, -0.0263671875, 0.058441162109375, 0.14324951171875, 0.228057861328125, 0.3128662109375, 0.397674560546875, 0.48248291015625, 0.567291259765625, 0.652099609375, 0.736907958984375, 0.82171630859375, 0.906524658203125, 0.9913330078125, 1.076141357421875, 1.16094970703125, 1.245758056640625, 1.33056640625, 1.415374755859375, 1.50018310546875, 1.584991455078125, 1.6697998046875, 1.754608154296875, 1.83941650390625, 1.924224853515625, 2.009033203125, 2.093841552734375, 2.17864990234375, 2.263458251953125, 2.3482666015625, 2.433074951171875, 2.51788330078125, 2.602691650390625, 2.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 4.0, 13.0, 23.0, 12.0, 22.0, 41.0, 61.0, 81.0, 112.0, 163.0, 237.0, 462.0, 718.0, 1213.0, 2235.0, 4181.0, 9062.0, 22308.0, 73534.0, 328652.0, 445536.0, 108160.0, 29237.0, 11194.0, 5033.0, 2606.0, 1420.0, 796.0, 472.0, 292.0, 206.0, 128.0, 102.0, 79.0, 43.0, 44.0, 16.0, 16.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.274139404296875, -2.19866943359375, -2.123199462890625, -2.0477294921875, -1.972259521484375, -1.89678955078125, -1.821319580078125, -1.745849609375, -1.670379638671875, -1.59490966796875, -1.519439697265625, -1.4439697265625, -1.368499755859375, -1.29302978515625, -1.217559814453125, -1.14208984375, -1.066619873046875, -0.99114990234375, -0.915679931640625, -0.8402099609375, -0.764739990234375, -0.68927001953125, -0.613800048828125, -0.538330078125, -0.462860107421875, -0.38739013671875, -0.311920166015625, -0.2364501953125, -0.160980224609375, -0.08551025390625, -0.010040283203125, 0.0654296875, 0.140899658203125, 0.21636962890625, 0.291839599609375, 0.3673095703125, 0.442779541015625, 0.51824951171875, 0.593719482421875, 0.669189453125, 0.744659423828125, 0.82012939453125, 0.895599365234375, 0.9710693359375, 1.046539306640625, 1.12200927734375, 1.197479248046875, 1.27294921875, 1.348419189453125, 1.42388916015625, 1.499359130859375, 1.5748291015625, 1.650299072265625, 1.72576904296875, 1.801239013671875, 1.876708984375, 1.952178955078125, 2.02764892578125, 2.103118896484375, 2.1785888671875, 2.254058837890625, 2.32952880859375, 2.404998779296875, 2.48046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 13.0, 10.0, 8.0, 20.0, 18.0, 22.0, 31.0, 38.0, 38.0, 37.0, 44.0, 40.0, 34.0, 47.0, 53.0, 49.0, 47.0, 56.0, 43.0, 47.0, 47.0, 42.0, 30.0, 35.0, 20.0, 16.0, 18.0, 20.0, 16.0, 10.0, 8.0, 9.0, 6.0, 4.0, 0.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.998046875, -2.896484375, -2.794921875, -2.693359375, -2.591796875, -2.490234375, -2.388671875, -2.287109375, -2.185546875, -2.083984375, -1.982421875, -1.880859375, -1.779296875, -1.677734375, -1.576171875, -1.474609375, -1.373046875, -1.271484375, -1.169921875, -1.068359375, -0.966796875, -0.865234375, -0.763671875, -0.662109375, -0.560546875, -0.458984375, -0.357421875, -0.255859375, -0.154296875, -0.052734375, 0.048828125, 0.150390625, 0.251953125, 0.353515625, 0.455078125, 0.556640625, 0.658203125, 0.759765625, 0.861328125, 0.962890625, 1.064453125, 1.166015625, 1.267578125, 1.369140625, 1.470703125, 1.572265625, 1.673828125, 1.775390625, 1.876953125, 1.978515625, 2.080078125, 2.181640625, 2.283203125, 2.384765625, 2.486328125, 2.587890625, 2.689453125, 2.791015625, 2.892578125, 2.994140625, 3.095703125, 3.197265625, 3.298828125, 3.400390625, 3.501953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 15.0, 19.0, 14.0, 36.0, 55.0, 65.0, 70.0, 111.0, 156.0, 195.0, 300.0, 407.0, 587.0, 833.0, 1342.0, 2218.0, 4032.0, 8866.0, 23084.0, 70107.0, 239180.0, 467579.0, 152590.0, 45207.0, 16063.0, 6743.0, 3220.0, 1844.0, 1089.0, 688.0, 487.0, 342.0, 254.0, 190.0, 133.0, 106.0, 81.0, 64.0, 49.0, 35.0, 24.0, 19.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6267852783203125, -0.606109619140625, -0.5854339599609375, -0.56475830078125, -0.5440826416015625, -0.523406982421875, -0.5027313232421875, -0.4820556640625, -0.4613800048828125, -0.440704345703125, -0.4200286865234375, -0.39935302734375, -0.3786773681640625, -0.358001708984375, -0.3373260498046875, -0.316650390625, -0.2959747314453125, -0.275299072265625, -0.2546234130859375, -0.23394775390625, -0.2132720947265625, -0.192596435546875, -0.1719207763671875, -0.1512451171875, -0.1305694580078125, -0.109893798828125, -0.0892181396484375, -0.06854248046875, -0.0478668212890625, -0.027191162109375, -0.0065155029296875, 0.01416015625, 0.0348358154296875, 0.055511474609375, 0.0761871337890625, 0.09686279296875, 0.1175384521484375, 0.138214111328125, 0.1588897705078125, 0.1795654296875, 0.2002410888671875, 0.220916748046875, 0.2415924072265625, 0.26226806640625, 0.2829437255859375, 0.303619384765625, 0.3242950439453125, 0.344970703125, 0.3656463623046875, 0.386322021484375, 0.4069976806640625, 0.42767333984375, 0.4483489990234375, 0.469024658203125, 0.4897003173828125, 0.5103759765625, 0.5310516357421875, 0.551727294921875, 0.5724029541015625, 0.59307861328125, 0.6137542724609375, 0.634429931640625, 0.6551055908203125, 0.67578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 5.0, 7.0, 13.0, 13.0, 33.0, 51.0, 58.0, 83.0, 105.0, 171.0, 118.0, 85.0, 67.0, 59.0, 35.0, 26.0, 20.0, 14.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014925003051757812, -0.00014317035675048828, -0.00013709068298339844, -0.0001310110092163086, -0.00012493133544921875, -0.0001188516616821289, -0.00011277198791503906, -0.00010669231414794922, -0.00010061264038085938, -9.453296661376953e-05, -8.845329284667969e-05, -8.237361907958984e-05, -7.62939453125e-05, -7.021427154541016e-05, -6.413459777832031e-05, -5.805492401123047e-05, -5.1975250244140625e-05, -4.589557647705078e-05, -3.981590270996094e-05, -3.3736228942871094e-05, -2.765655517578125e-05, -2.1576881408691406e-05, -1.5497207641601562e-05, -9.417533874511719e-06, -3.337860107421875e-06, 2.7418136596679688e-06, 8.821487426757812e-06, 1.4901161193847656e-05, 2.09808349609375e-05, 2.7060508728027344e-05, 3.314018249511719e-05, 3.921985626220703e-05, 4.5299530029296875e-05, 5.137920379638672e-05, 5.745887756347656e-05, 6.35385513305664e-05, 6.961822509765625e-05, 7.56978988647461e-05, 8.177757263183594e-05, 8.785724639892578e-05, 9.393692016601562e-05, 0.00010001659393310547, 0.00010609626770019531, 0.00011217594146728516, 0.000118255615234375, 0.00012433528900146484, 0.0001304149627685547, 0.00013649463653564453, 0.00014257431030273438, 0.00014865398406982422, 0.00015473365783691406, 0.0001608133316040039, 0.00016689300537109375, 0.0001729726791381836, 0.00017905235290527344, 0.00018513202667236328, 0.00019121170043945312, 0.00019729137420654297, 0.0002033710479736328, 0.00020945072174072266, 0.0002155303955078125, 0.00022161006927490234, 0.0002276897430419922, 0.00023376941680908203, 0.00023984909057617188]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 8.0, 10.0, 11.0, 11.0, 23.0, 31.0, 31.0, 30.0, 40.0, 75.0, 89.0, 116.0, 165.0, 260.0, 389.0, 574.0, 1020.0, 1894.0, 4426.0, 12209.0, 45568.0, 229892.0, 574124.0, 132804.0, 28826.0, 8575.0, 3328.0, 1557.0, 821.0, 478.0, 339.0, 233.0, 136.0, 120.0, 72.0, 65.0, 48.0, 32.0, 32.0, 22.0, 17.0, 15.0, 15.0, 6.0, 4.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9093170166015625, -0.877227783203125, -0.8451385498046875, -0.81304931640625, -0.7809600830078125, -0.748870849609375, -0.7167816162109375, -0.6846923828125, -0.6526031494140625, -0.620513916015625, -0.5884246826171875, -0.55633544921875, -0.5242462158203125, -0.492156982421875, -0.4600677490234375, -0.427978515625, -0.3958892822265625, -0.363800048828125, -0.3317108154296875, -0.29962158203125, -0.2675323486328125, -0.235443115234375, -0.2033538818359375, -0.1712646484375, -0.1391754150390625, -0.107086181640625, -0.0749969482421875, -0.04290771484375, -0.0108184814453125, 0.021270751953125, 0.0533599853515625, 0.08544921875, 0.1175384521484375, 0.149627685546875, 0.1817169189453125, 0.21380615234375, 0.2458953857421875, 0.277984619140625, 0.3100738525390625, 0.3421630859375, 0.3742523193359375, 0.406341552734375, 0.4384307861328125, 0.47052001953125, 0.5026092529296875, 0.534698486328125, 0.5667877197265625, 0.598876953125, 0.6309661865234375, 0.663055419921875, 0.6951446533203125, 0.72723388671875, 0.7593231201171875, 0.791412353515625, 0.8235015869140625, 0.8555908203125, 0.8876800537109375, 0.919769287109375, 0.9518585205078125, 0.98394775390625, 1.0160369873046875, 1.048126220703125, 1.0802154541015625, 1.1123046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 24.0, 35.0, 63.0, 78.0, 104.0, 189.0, 149.0, 97.0, 75.0, 44.0, 39.0, 25.0, 15.0, 13.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8505859375, -0.8261947631835938, -0.8018035888671875, -0.7774124145507812, -0.753021240234375, -0.7286300659179688, -0.7042388916015625, -0.6798477172851562, -0.65545654296875, -0.6310653686523438, -0.6066741943359375, -0.5822830200195312, -0.557891845703125, -0.5335006713867188, -0.5091094970703125, -0.48471832275390625, -0.4603271484375, -0.43593597412109375, -0.4115447998046875, -0.38715362548828125, -0.362762451171875, -0.33837127685546875, -0.3139801025390625, -0.28958892822265625, -0.26519775390625, -0.24080657958984375, -0.2164154052734375, -0.19202423095703125, -0.167633056640625, -0.14324188232421875, -0.1188507080078125, -0.09445953369140625, -0.070068359375, -0.04567718505859375, -0.0212860107421875, 0.00310516357421875, 0.027496337890625, 0.05188751220703125, 0.0762786865234375, 0.10066986083984375, 0.12506103515625, 0.14945220947265625, 0.1738433837890625, 0.19823455810546875, 0.222625732421875, 0.24701690673828125, 0.2714080810546875, 0.29579925537109375, 0.3201904296875, 0.34458160400390625, 0.3689727783203125, 0.39336395263671875, 0.417755126953125, 0.44214630126953125, 0.4665374755859375, 0.49092864990234375, 0.51531982421875, 0.5397109985351562, 0.5641021728515625, 0.5884933471679688, 0.612884521484375, 0.6372756958007812, 0.6616668701171875, 0.6860580444335938, 0.71044921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 12.0, 27.0, 45.0, 93.0, 143.0, 180.0, 164.0, 126.0, 93.0, 51.0, 29.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.819700002670288, -2.505915641784668, -2.192131280899048, -1.8783470392227173, -1.5645626783370972, -1.250778317451477, -0.9369940757751465, -0.6232097148895264, -0.30942535400390625, 0.0043589770793914795, 0.3181433081626892, 0.6319276094436646, 0.9457119703292847, 1.2594963312149048, 1.5732805728912354, 1.8870649337768555, 2.2008492946624756, 2.5146336555480957, 2.828418016433716, 3.142202377319336, 3.455986499786377, 3.769771099090576, 4.083555221557617, 4.397339820861816, 4.711123943328857, 5.024908065795898, 5.338692665100098, 5.652476787567139, 5.966261386871338, 6.280045509338379, 6.593830108642578, 6.907614231109619, 7.22139835357666, 7.535182476043701, 7.8489670753479, 8.162751197814941, 8.47653579711914, 8.79032039642334, 9.104104042053223, 9.417888641357422, 9.731673240661621, 10.04545783996582, 10.359241485595703, 10.673026084899902, 10.986810684204102, 11.3005952835083, 11.614378929138184, 11.928163528442383, 12.241947174072266, 12.555731773376465, 12.869515419006348, 13.183300018310547, 13.497084617614746, 13.810869216918945, 14.124652862548828, 14.438437461853027, 14.752222061157227, 15.066006660461426, 15.379790306091309, 15.693574905395508, 16.00735855102539, 16.321144104003906, 16.63492774963379, 16.948711395263672, 17.262496948242188]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 10.0, 11.0, 10.0, 27.0, 18.0, 17.0, 20.0, 35.0, 34.0, 30.0, 43.0, 46.0, 37.0, 36.0, 35.0, 42.0, 48.0, 42.0, 46.0, 40.0, 36.0, 44.0, 30.0, 46.0, 31.0, 32.0, 30.0, 18.0, 20.0, 21.0, 9.0, 15.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.205555438995361, -5.030652046203613, -4.855748176574707, -4.680844783782959, -4.505941390991211, -4.331037521362305, -4.156134128570557, -3.9812304973602295, -3.8063268661499023, -3.631423234939575, -3.456519603729248, -3.2816162109375, -3.106712579727173, -2.9318089485168457, -2.7569055557250977, -2.5820019245147705, -2.4070982933044434, -2.232194662094116, -2.057291030883789, -1.882387638092041, -1.7074840068817139, -1.5325803756713867, -1.3576768636703491, -1.1827733516693115, -1.0078697204589844, -0.832966148853302, -0.6580625772476196, -0.48315900564193726, -0.3082554340362549, -0.1333518624305725, 0.04155170917510986, 0.21645522117614746, 0.3913588523864746, 0.566262423992157, 0.7411659955978394, 0.9160695672035217, 1.090973138809204, 1.2658767700195312, 1.4407802820205688, 1.6156837940216064, 1.7905874252319336, 1.9654910564422607, 2.140394687652588, 2.315298080444336, 2.490201711654663, 2.6651053428649902, 2.8400087356567383, 3.0149123668670654, 3.1898159980773926, 3.3647196292877197, 3.539623260498047, 3.714526653289795, 3.889430284500122, 4.064333915710449, 4.239237308502197, 4.414140701293945, 4.589044570922852, 4.7639479637146, 4.938851833343506, 5.113755226135254, 5.28865909576416, 5.463562488555908, 5.638465881347656, 5.8133697509765625, 5.9882731437683105]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 2.0, 9.0, 8.0, 12.0, 20.0, 27.0, 23.0, 39.0, 49.0, 57.0, 92.0, 107.0, 140.0, 203.0, 307.0, 440.0, 714.0, 956.0, 1323.0, 1691.0, 2826.0, 1034716.0, 1906.0, 1400.0, 1047.0, 743.0, 482.0, 353.0, 239.0, 167.0, 122.0, 102.0, 58.0, 44.0, 43.0, 27.0, 26.0, 17.0, 23.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.112381935119629, -5.909613609313965, -5.706845283508301, -5.504076957702637, -5.301308631896973, -5.098540306091309, -4.895771503448486, -4.693003177642822, -4.490234851837158, -4.287466526031494, -4.08469820022583, -3.881929636001587, -3.679161310195923, -3.476392984390259, -3.2736244201660156, -3.0708560943603516, -2.8680877685546875, -2.6653194427490234, -2.4625511169433594, -2.259782552719116, -2.057014226913452, -1.854245901107788, -1.6514774560928345, -1.4487090110778809, -1.2459406852722168, -1.0431723594665527, -0.8404039144515991, -0.6376355290412903, -0.43486714363098145, -0.23209881782531738, -0.02933037281036377, 0.17343807220458984, 0.3762059211730957, 0.5789743065834045, 0.7817426919937134, 0.9845110774040222, 1.187279462814331, 1.3900477886199951, 1.5928162336349487, 1.7955846786499023, 1.9983530044555664, 2.2011213302612305, 2.4038896560668945, 2.6066582202911377, 2.8094265460968018, 3.012194871902466, 3.214963436126709, 3.417731761932373, 3.620500087738037, 3.823268413543701, 4.026036739349365, 4.228805065155029, 4.431573867797852, 4.634342193603516, 4.83711051940918, 5.039878845214844, 5.242647171020508, 5.445415496826172, 5.648183822631836, 5.8509521484375, 6.053720474243164, 6.256488800048828, 6.45925760269165, 6.6620259284973145, 6.8647942543029785]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 15.0, 21.0, 51.0, 96.0, 137.0, 312.0, 749.0, 2594.0, 12733.0, 51424808.0, 23009.0, 4648.0, 1268.0, 455.0, 209.0, 103.0, 50.0, 26.0, 17.0, 11.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.0030460357666, -19.40827178955078, -18.81349754333496, -18.21872329711914, -17.62394905090332, -17.0291748046875, -16.43440055847168, -15.839627265930176, -15.244853019714355, -14.650078773498535, -14.055304527282715, -13.460530281066895, -12.86575698852539, -12.27098274230957, -11.67620849609375, -11.08143424987793, -10.48666000366211, -9.891885757446289, -9.297111511230469, -8.702337265014648, -8.107563018798828, -7.512789249420166, -6.918015480041504, -6.323241233825684, -5.728466987609863, -5.133692741394043, -4.538918495178223, -3.9441447257995605, -3.3493704795837402, -2.75459623336792, -2.1598222255706787, -1.5650482177734375, -0.9702720642089844, -0.3754979372024536, 0.21927618980407715, 0.8140503168106079, 1.4088244438171387, 2.003598690032959, 2.5983726978302, 3.1931467056274414, 3.7879209518432617, 4.382695198059082, 4.977469444274902, 5.5722432136535645, 6.167017459869385, 6.761791706085205, 7.356565475463867, 7.9513397216796875, 8.546113967895508, 9.140888214111328, 9.735662460327148, 10.330436706542969, 10.925210952758789, 11.51998519897461, 12.114758491516113, 12.709532737731934, 13.304306983947754, 13.899081230163574, 14.493855476379395, 15.088629722595215, 15.683403015136719, 16.27817726135254, 16.87295150756836, 17.46772575378418, 18.0625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 30.0, 35.0, 39.0, 42.0, 72.0, 150.0, 237.0, 401.0, 665.0, 1323.0, 3118.0, 8415.0, 30780.0, 151851.0, 872771.0, 4738461.0, 388199.0, 69309.0, 16079.0, 4999.0, 2093.0, 987.0, 544.0, 324.0, 156.0, 115.0, 85.0, 34.0, 22.0, 19.0, 14.0, 13.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.39990234375, -0.3875083923339844, -0.37511444091796875, -0.3627204895019531, -0.3503265380859375, -0.3379325866699219, -0.32553863525390625, -0.3131446838378906, -0.300750732421875, -0.2883567810058594, -0.27596282958984375, -0.2635688781738281, -0.2511749267578125, -0.23878097534179688, -0.22638702392578125, -0.21399307250976562, -0.20159912109375, -0.18920516967773438, -0.17681121826171875, -0.16441726684570312, -0.1520233154296875, -0.13962936401367188, -0.12723541259765625, -0.11484146118164062, -0.102447509765625, -0.09005355834960938, -0.07765960693359375, -0.06526565551757812, -0.0528717041015625, -0.040477752685546875, -0.02808380126953125, -0.015689849853515625, -0.0032958984375, 0.009098052978515625, 0.02149200439453125, 0.033885955810546875, 0.0462799072265625, 0.058673858642578125, 0.07106781005859375, 0.08346176147460938, 0.095855712890625, 0.10824966430664062, 0.12064361572265625, 0.13303756713867188, 0.1454315185546875, 0.15782546997070312, 0.17021942138671875, 0.18261337280273438, 0.19500732421875, 0.20740127563476562, 0.21979522705078125, 0.23218917846679688, 0.2445831298828125, 0.2569770812988281, 0.26937103271484375, 0.2817649841308594, 0.294158935546875, 0.3065528869628906, 0.31894683837890625, 0.3313407897949219, 0.3437347412109375, 0.3561286926269531, 0.36852264404296875, 0.3809165954589844, 0.393310546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 20.0, 17.0, 19.0, 24.0, 29.0, 43.0, 40.0, 39.0, 45.0, 44.0, 61.0, 77.0, 1080.0, 45.0, 45.0, 52.0, 52.0, 48.0, 36.0, 27.0, 21.0, 25.0, 28.0, 25.0, 7.0, 14.0, 12.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.46728515625, -9.1064453125, -8.74560546875, -8.384765625, -8.02392578125, -7.6630859375, -7.30224609375, -6.94140625, -6.58056640625, -6.2197265625, -5.85888671875, -5.498046875, -5.13720703125, -4.7763671875, -4.41552734375, -4.0546875, -3.69384765625, -3.3330078125, -2.97216796875, -2.611328125, -2.25048828125, -1.8896484375, -1.52880859375, -1.16796875, -0.80712890625, -0.4462890625, -0.08544921875, 0.275390625, 0.63623046875, 0.9970703125, 1.35791015625, 1.71875, 2.07958984375, 2.4404296875, 2.80126953125, 3.162109375, 3.52294921875, 3.8837890625, 4.24462890625, 4.60546875, 4.96630859375, 5.3271484375, 5.68798828125, 6.048828125, 6.40966796875, 6.7705078125, 7.13134765625, 7.4921875, 7.85302734375, 8.2138671875, 8.57470703125, 8.935546875, 9.29638671875, 9.6572265625, 10.01806640625, 10.37890625, 10.73974609375, 11.1005859375, 11.46142578125, 11.822265625, 12.18310546875, 12.5439453125, 12.90478515625, 13.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 19.0, 14.0, 29.0, 59.0, 120.0, 176.0, 258.0, 512.0, 905.0, 1967.0, 6335.0, 34194.0, 280182.0, 4873824.0, 957666.0, 112277.0, 16057.0, 3769.0, 1378.0, 682.0, 398.0, 193.0, 127.0, 103.0, 45.0, 32.0, 19.0, 24.0, 5.0, 5.0, 5.0, 7.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30517578125, -0.29334259033203125, -0.2815093994140625, -0.26967620849609375, -0.257843017578125, -0.24600982666015625, -0.2341766357421875, -0.22234344482421875, -0.21051025390625, -0.19867706298828125, -0.1868438720703125, -0.17501068115234375, -0.163177490234375, -0.15134429931640625, -0.1395111083984375, -0.12767791748046875, -0.1158447265625, -0.10401153564453125, -0.0921783447265625, -0.08034515380859375, -0.068511962890625, -0.05667877197265625, -0.0448455810546875, -0.03301239013671875, -0.02117919921875, -0.00934600830078125, 0.0024871826171875, 0.01432037353515625, 0.026153564453125, 0.03798675537109375, 0.0498199462890625, 0.06165313720703125, 0.073486328125, 0.08531951904296875, 0.0971527099609375, 0.10898590087890625, 0.120819091796875, 0.13265228271484375, 0.1444854736328125, 0.15631866455078125, 0.16815185546875, 0.17998504638671875, 0.1918182373046875, 0.20365142822265625, 0.215484619140625, 0.22731781005859375, 0.2391510009765625, 0.25098419189453125, 0.2628173828125, 0.27465057373046875, 0.2864837646484375, 0.29831695556640625, 0.310150146484375, 0.32198333740234375, 0.3338165283203125, 0.34564971923828125, 0.35748291015625, 0.36931610107421875, 0.3811492919921875, 0.39298248291015625, 0.404815673828125, 0.41664886474609375, 0.4284820556640625, 0.44031524658203125, 0.4521484375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 10.0, 13.0, 14.0, 12.0, 9.0, 24.0, 24.0, 29.0, 28.0, 34.0, 35.0, 37.0, 51.0, 34.0, 45.0, 27.0, 610.0, 489.0, 42.0, 43.0, 41.0, 38.0, 35.0, 36.0, 41.0, 27.0, 26.0, 29.0, 24.0, 22.0, 12.0, 15.0, 6.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.25, -8.01422119140625, -7.7784423828125, -7.54266357421875, -7.306884765625, -7.07110595703125, -6.8353271484375, -6.59954833984375, -6.36376953125, -6.12799072265625, -5.8922119140625, -5.65643310546875, -5.420654296875, -5.18487548828125, -4.9490966796875, -4.71331787109375, -4.4775390625, -4.24176025390625, -4.0059814453125, -3.77020263671875, -3.534423828125, -3.29864501953125, -3.0628662109375, -2.82708740234375, -2.59130859375, -2.35552978515625, -2.1197509765625, -1.88397216796875, -1.648193359375, -1.41241455078125, -1.1766357421875, -0.94085693359375, -0.705078125, -0.46929931640625, -0.2335205078125, 0.00225830078125, 0.238037109375, 0.47381591796875, 0.7095947265625, 0.94537353515625, 1.18115234375, 1.41693115234375, 1.6527099609375, 1.88848876953125, 2.124267578125, 2.36004638671875, 2.5958251953125, 2.83160400390625, 3.0673828125, 3.30316162109375, 3.5389404296875, 3.77471923828125, 4.010498046875, 4.24627685546875, 4.4820556640625, 4.71783447265625, 4.95361328125, 5.18939208984375, 5.4251708984375, 5.66094970703125, 5.896728515625, 6.13250732421875, 6.3682861328125, 6.60406494140625, 6.83984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 3.0, 2.0, 1.0, 6.0, 8.0, 5.0, 4.0, 6.0, 13.0, 32.0, 42.0, 67.0, 183.0, 400.0, 1054.0, 3202.0, 17198.0, 6162274.0, 98199.0, 5709.0, 1623.0, 677.0, 286.0, 145.0, 84.0, 68.0, 40.0, 36.0, 21.0, 16.0, 6.0, 7.0, 6.0, 4.0, 2.0], "bins": [-1.9306640625, -1.8893356323242188, -1.8480072021484375, -1.8066787719726562, -1.765350341796875, -1.7240219116210938, -1.6826934814453125, -1.6413650512695312, -1.60003662109375, -1.5587081909179688, -1.5173797607421875, -1.4760513305664062, -1.434722900390625, -1.3933944702148438, -1.3520660400390625, -1.3107376098632812, -1.2694091796875, -1.2280807495117188, -1.1867523193359375, -1.1454238891601562, -1.104095458984375, -1.0627670288085938, -1.0214385986328125, -0.9801101684570312, -0.93878173828125, -0.8974533081054688, -0.8561248779296875, -0.8147964477539062, -0.773468017578125, -0.7321395874023438, -0.6908111572265625, -0.6494827270507812, -0.608154296875, -0.5668258666992188, -0.5254974365234375, -0.48416900634765625, -0.442840576171875, -0.40151214599609375, -0.3601837158203125, -0.31885528564453125, -0.27752685546875, -0.23619842529296875, -0.1948699951171875, -0.15354156494140625, -0.112213134765625, -0.07088470458984375, -0.0295562744140625, 0.01177215576171875, 0.0531005859375, 0.09442901611328125, 0.1357574462890625, 0.17708587646484375, 0.218414306640625, 0.25974273681640625, 0.3010711669921875, 0.34239959716796875, 0.38372802734375, 0.42505645751953125, 0.4663848876953125, 0.5077133178710938, 0.549041748046875, 0.5903701782226562, 0.6316986083984375, 0.6730270385742188, 0.71435546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 17.0, 39.0, 57.0, 81.0, 80.0, 125.0, 1163.0, 135.0, 93.0, 83.0, 58.0, 44.0, 25.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.86328125, -7.39080810546875, -6.9183349609375, -6.44586181640625, -5.973388671875, -5.50091552734375, -5.0284423828125, -4.55596923828125, -4.08349609375, -3.61102294921875, -3.1385498046875, -2.66607666015625, -2.193603515625, -1.72113037109375, -1.2486572265625, -0.77618408203125, -0.3037109375, 0.16876220703125, 0.6412353515625, 1.11370849609375, 1.586181640625, 2.05865478515625, 2.5311279296875, 3.00360107421875, 3.47607421875, 3.94854736328125, 4.4210205078125, 4.89349365234375, 5.365966796875, 5.83843994140625, 6.3109130859375, 6.78338623046875, 7.255859375, 7.72833251953125, 8.2008056640625, 8.67327880859375, 9.145751953125, 9.61822509765625, 10.0906982421875, 10.56317138671875, 11.03564453125, 11.50811767578125, 11.9805908203125, 12.45306396484375, 12.925537109375, 13.39801025390625, 13.8704833984375, 14.34295654296875, 14.8154296875, 15.28790283203125, 15.7603759765625, 16.23284912109375, 16.705322265625, 17.17779541015625, 17.6502685546875, 18.12274169921875, 18.59521484375, 19.06768798828125, 19.5401611328125, 20.01263427734375, 20.485107421875, 20.95758056640625, 21.4300537109375, 21.90252685546875, 22.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 13.0, 672.0, 307.0, 13.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.86222839355469, -50.89992141723633, -49.937618255615234, -48.975311279296875, -48.013004302978516, -47.050697326660156, -46.08839416503906, -45.1260871887207, -44.163780212402344, -43.201473236083984, -42.23917007446289, -41.27686309814453, -40.31455612182617, -39.35224914550781, -38.38994598388672, -37.42763900756836, -36.465335845947266, -35.503028869628906, -34.54072570800781, -33.57841873168945, -32.616111755371094, -31.653806686401367, -30.69150161743164, -29.72919464111328, -28.766887664794922, -27.804582595825195, -26.842275619506836, -25.87997055053711, -24.91766357421875, -23.955358505249023, -22.993053436279297, -22.030746459960938, -21.068439483642578, -20.10613441467285, -19.143827438354492, -18.181522369384766, -17.219215393066406, -16.25691032409668, -15.294604301452637, -14.332298278808594, -13.369993209838867, -12.407687187194824, -11.445381164550781, -10.483076095581055, -9.520770072937012, -8.558464050292969, -7.596158027648926, -6.633852481842041, -5.671546936035156, -4.709240913391113, -3.7469353675842285, -2.7846293449401855, -1.8223235607147217, -0.8600177764892578, 0.10228824615478516, 1.06459379196167, 2.026899814605713, 2.9892055988311768, 3.9515113830566406, 4.913817405700684, 5.876123428344727, 6.838428974151611, 7.800734996795654, 8.763040542602539, 9.725346565246582]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 14.0, 27.0, 65.0, 83.0, 117.0, 144.0, 152.0, 145.0, 105.0, 75.0, 31.0, 21.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.46249771118164, -30.51834487915039, -29.57419204711914, -28.630041122436523, -27.685888290405273, -26.741735458374023, -25.797584533691406, -24.853431701660156, -23.909278869628906, -22.965126037597656, -22.020973205566406, -21.07682228088379, -20.13266944885254, -19.18851661682129, -18.244365692138672, -17.300212860107422, -16.356060028076172, -15.411907196044922, -14.467755317687988, -13.523603439331055, -12.579450607299805, -11.635297775268555, -10.691145896911621, -9.746994018554688, -8.802841186523438, -7.858688831329346, -6.914536476135254, -5.970384120941162, -5.02623176574707, -4.0820794105529785, -3.1379270553588867, -2.193774700164795, -1.249624252319336, -0.30547189712524414, 0.6386804580688477, 1.5828328132629395, 2.5269851684570312, 3.471137523651123, 4.415289878845215, 5.359442234039307, 6.303594589233398, 7.24774694442749, 8.191899299621582, 9.136051177978516, 10.080204010009766, 11.024356842041016, 11.96850872039795, 12.912660598754883, 13.856813430786133, 14.800966262817383, 15.745118141174316, 16.68927001953125, 17.6334228515625, 18.57757568359375, 19.521728515625, 20.465879440307617, 21.410032272338867, 22.354185104370117, 23.298336029052734, 24.242488861083984, 25.186641693115234, 26.130794525146484, 27.074947357177734, 28.01909828186035, 28.9632511138916]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 9.0, 15.0, 30.0, 68.0, 5306.0, 3721.0, 12511.0, 4113097.0, 52116.0, 6381.0, 849.0, 73.0, 42.0, 16.0, 15.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0312042236328125, -0.03007340431213379, -0.028942584991455078, -0.027811765670776367, -0.026680946350097656, -0.025550127029418945, -0.024419307708740234, -0.023288488388061523, -0.022157669067382812, -0.0210268497467041, -0.01989603042602539, -0.01876521110534668, -0.01763439178466797, -0.016503572463989258, -0.015372753143310547, -0.014241933822631836, -0.013111114501953125, -0.011980295181274414, -0.010849475860595703, -0.009718656539916992, -0.008587837219238281, -0.00745701789855957, -0.006326198577880859, -0.0051953792572021484, -0.0040645599365234375, -0.0029337406158447266, -0.0018029212951660156, -0.0006721019744873047, 0.00045871734619140625, 0.0015895366668701172, 0.002720355987548828, 0.003851175308227539, 0.00498199462890625, 0.006112813949584961, 0.007243633270263672, 0.008374452590942383, 0.009505271911621094, 0.010636091232299805, 0.011766910552978516, 0.012897729873657227, 0.014028549194335938, 0.015159368515014648, 0.01629018783569336, 0.01742100715637207, 0.01855182647705078, 0.019682645797729492, 0.020813465118408203, 0.021944284439086914, 0.023075103759765625, 0.024205923080444336, 0.025336742401123047, 0.026467561721801758, 0.02759838104248047, 0.02872920036315918, 0.02986001968383789, 0.0309908390045166, 0.03212165832519531, 0.03325247764587402, 0.034383296966552734, 0.035514116287231445, 0.036644935607910156, 0.03777575492858887, 0.03890657424926758, 0.04003739356994629, 0.041168212890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 12.0, 14.0, 29.0, 92.0, 242.0, 409.0, 106.0, 45.0, 23.0, 10.0, 11.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0162811279296875, -0.015659809112548828, -0.015038490295410156, -0.014417171478271484, -0.013795852661132812, -0.01317453384399414, -0.012553215026855469, -0.011931896209716797, -0.011310577392578125, -0.010689258575439453, -0.010067939758300781, -0.00944662094116211, -0.008825302124023438, -0.008203983306884766, -0.007582664489746094, -0.006961345672607422, -0.00634002685546875, -0.005718708038330078, -0.005097389221191406, -0.004476070404052734, -0.0038547515869140625, -0.0032334327697753906, -0.0026121139526367188, -0.001990795135498047, -0.001369476318359375, -0.0007481575012207031, -0.00012683868408203125, 0.0004944801330566406, 0.0011157989501953125, 0.0017371177673339844, 0.0023584365844726562, 0.002979755401611328, 0.00360107421875, 0.004222393035888672, 0.004843711853027344, 0.005465030670166016, 0.0060863494873046875, 0.006707668304443359, 0.007328987121582031, 0.007950305938720703, 0.008571624755859375, 0.009192943572998047, 0.009814262390136719, 0.01043558120727539, 0.011056900024414062, 0.011678218841552734, 0.012299537658691406, 0.012920856475830078, 0.01354217529296875, 0.014163494110107422, 0.014784812927246094, 0.015406131744384766, 0.016027450561523438, 0.01664876937866211, 0.01727008819580078, 0.017891407012939453, 0.018512725830078125, 0.019134044647216797, 0.01975536346435547, 0.02037668228149414, 0.020998001098632812, 0.021619319915771484, 0.022240638732910156, 0.022861957550048828, 0.0234832763671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 3.0, 2.0, 6.0, 8.0, 21.0, 10.0, 25.0, 28.0, 38.0, 48.0, 92.0, 176.0, 405.0, 1525.0, 4181691.0, 9140.0, 524.0, 218.0, 109.0, 71.0, 35.0, 29.0, 19.0, 10.0, 6.0, 5.0, 8.0, 6.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033721923828125, -0.03272056579589844, -0.031719207763671875, -0.030717849731445312, -0.02971649169921875, -0.028715133666992188, -0.027713775634765625, -0.026712417602539062, -0.0257110595703125, -0.024709701538085938, -0.023708343505859375, -0.022706985473632812, -0.02170562744140625, -0.020704269409179688, -0.019702911376953125, -0.018701553344726562, -0.0177001953125, -0.016698837280273438, -0.015697479248046875, -0.014696121215820312, -0.01369476318359375, -0.012693405151367188, -0.011692047119140625, -0.010690689086914062, -0.0096893310546875, -0.008687973022460938, -0.007686614990234375, -0.0066852569580078125, -0.00568389892578125, -0.0046825408935546875, -0.003681182861328125, -0.0026798248291015625, -0.001678466796875, -0.0006771087646484375, 0.000324249267578125, 0.0013256072998046875, 0.00232696533203125, 0.0033283233642578125, 0.004329681396484375, 0.0053310394287109375, 0.0063323974609375, 0.0073337554931640625, 0.008335113525390625, 0.009336471557617188, 0.01033782958984375, 0.011339187622070312, 0.012340545654296875, 0.013341903686523438, 0.01434326171875, 0.015344619750976562, 0.016345977783203125, 0.017347335815429688, 0.01834869384765625, 0.019350051879882812, 0.020351409912109375, 0.021352767944335938, 0.0223541259765625, 0.023355484008789062, 0.024356842041015625, 0.025358200073242188, 0.02635955810546875, 0.027360916137695312, 0.028362274169921875, 0.029363632202148438, 0.030364990234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 8.0, 16.0, 12.0, 21.0, 29.0, 32.0, 48.0, 62.0, 137.0, 269.0, 513.0, 925.0, 900.0, 502.0, 234.0, 120.0, 74.0, 45.0, 33.0, 20.0, 12.0, 7.0, 5.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007175445556640625, -0.006964385509490967, -0.006753325462341309, -0.00654226541519165, -0.006331205368041992, -0.006120145320892334, -0.005909085273742676, -0.005698025226593018, -0.005486965179443359, -0.005275905132293701, -0.005064845085144043, -0.004853785037994385, -0.0046427249908447266, -0.004431664943695068, -0.00422060489654541, -0.004009544849395752, -0.0037984848022460938, -0.0035874247550964355, -0.0033763647079467773, -0.003165304660797119, -0.002954244613647461, -0.0027431845664978027, -0.0025321245193481445, -0.0023210644721984863, -0.002110004425048828, -0.00189894437789917, -0.0016878843307495117, -0.0014768242835998535, -0.0012657642364501953, -0.0010547041893005371, -0.0008436441421508789, -0.0006325840950012207, -0.0004215240478515625, -0.0002104640007019043, 5.960464477539062e-07, 0.0002116560935974121, 0.0004227161407470703, 0.0006337761878967285, 0.0008448362350463867, 0.001055896282196045, 0.0012669563293457031, 0.0014780163764953613, 0.0016890764236450195, 0.0019001364707946777, 0.002111196517944336, 0.002322256565093994, 0.0025333166122436523, 0.0027443766593933105, 0.0029554367065429688, 0.003166496753692627, 0.003377556800842285, 0.0035886168479919434, 0.0037996768951416016, 0.00401073694229126, 0.004221796989440918, 0.004432857036590576, 0.004643917083740234, 0.004854977130889893, 0.005066037178039551, 0.005277097225189209, 0.005488157272338867, 0.005699217319488525, 0.005910277366638184, 0.006121337413787842, 0.0063323974609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 58.0, 756.0, 186.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016395432874560356, -0.01527087390422821, -0.014146314933896065, -0.013021755032241344, -0.011897196061909199, -0.010772637091577053, -0.009648077189922333, -0.008523518219590187, -0.007398959249258041, -0.006274400278925896, -0.005149840842932463, -0.00402528140693903, -0.002900722436606884, -0.0017761634662747383, -0.0006516040302813053, 0.0004729554057121277, 0.0015975143760442734, 0.0027220735792070627, 0.003846632782369852, 0.004971192218363285, 0.006095751188695431, 0.0072203101590275764, 0.008344870060682297, 0.009469429031014442, 0.010593988001346588, 0.011718546971678734, 0.01284310594201088, 0.0139676658436656, 0.015092224813997746, 0.016216784715652466, 0.01734134368598461, 0.018465902656316757, 0.019590459764003754, 0.0207150187343359, 0.021839577704668045, 0.02296413667500019, 0.024088695645332336, 0.02521325647830963, 0.026337815448641777, 0.027462374418973923, 0.02858693338930607, 0.029711492359638214, 0.03083605132997036, 0.031960610300302505, 0.0330851711332798, 0.0342097282409668, 0.03533428907394409, 0.03645884990692139, 0.03758340701460838, 0.03870796784758568, 0.039832524955272675, 0.04095708578824997, 0.042081642895936966, 0.04320620372891426, 0.04433076083660126, 0.04545532166957855, 0.04657988250255585, 0.04770444333553314, 0.04882900044322014, 0.049953561276197433, 0.05107811838388443, 0.052202679216861725, 0.05332723632454872, 0.054451797157526016, 0.05557635426521301]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 9.0, 12.0, 14.0, 16.0, 16.0, 26.0, 24.0, 33.0, 24.0, 37.0, 30.0, 33.0, 40.0, 47.0, 49.0, 49.0, 27.0, 73.0, 58.0, 48.0, 44.0, 41.0, 44.0, 27.0, 28.0, 28.0, 21.0, 13.0, 14.0, 20.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.016760945320129395, -0.016301672905683517, -0.01584239862859249, -0.01538312528282404, -0.014923851937055588, -0.014464578591287136, -0.014005305245518684, -0.013546031899750233, -0.013086758553981781, -0.01262748520821333, -0.012168211862444878, -0.011708938516676426, -0.011249665170907974, -0.010790391825139523, -0.01033111847937107, -0.00987184513360262, -0.009412571787834167, -0.008953298442065716, -0.008494025096297264, -0.008034751750528812, -0.007575478404760361, -0.007116205058991909, -0.006656931713223457, -0.006197658367455006, -0.005738385021686554, -0.005279111675918102, -0.004819838330149651, -0.004360564984381199, -0.003901291638612747, -0.0034420182928442955, -0.002982744947075844, -0.002523471601307392, -0.0020641982555389404, -0.0016049249097704887, -0.001145651564002037, -0.0006863782182335854, -0.00022710487246513367, 0.00023216847330331802, 0.0006914418190717697, 0.0011507151648402214, 0.001609988510608673, 0.002069261856377125, 0.0025285352021455765, 0.002987808547914028, 0.00344708189368248, 0.0039063552394509315, 0.004365628585219383, 0.004824901930987835, 0.005284175276756287, 0.005743448622524738, 0.00620272196829319, 0.006661995314061642, 0.007121268659830093, 0.007580542005598545, 0.008039815351366997, 0.008499088697135448, 0.0089583620429039, 0.009417635388672352, 0.009876908734440804, 0.010336182080209255, 0.010795455425977707, 0.011254728771746159, 0.01171400211751461, 0.012173275463283062, 0.012632548809051514]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 10.0, 10.0, 11.0, 8.0, 21.0, 36.0, 25.0, 39.0, 46.0, 75.0, 75.0, 130.0, 206.0, 356.0, 674.0, 1903.0, 10407.0, 956799.0, 70603.0, 4468.0, 1176.0, 558.0, 296.0, 180.0, 132.0, 67.0, 77.0, 35.0, 19.0, 16.0, 12.0, 14.0, 7.0, 4.0, 8.0, 8.0, 2.0, 0.0, 2.0, 3.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.88818359375, -0.8550338745117188, -0.8218841552734375, -0.7887344360351562, -0.755584716796875, -0.7224349975585938, -0.6892852783203125, -0.6561355590820312, -0.62298583984375, -0.5898361206054688, -0.5566864013671875, -0.5235366821289062, -0.490386962890625, -0.45723724365234375, -0.4240875244140625, -0.39093780517578125, -0.3577880859375, -0.32463836669921875, -0.2914886474609375, -0.25833892822265625, -0.225189208984375, -0.19203948974609375, -0.1588897705078125, -0.12574005126953125, -0.09259033203125, -0.05944061279296875, -0.0262908935546875, 0.00685882568359375, 0.040008544921875, 0.07315826416015625, 0.1063079833984375, 0.13945770263671875, 0.172607421875, 0.20575714111328125, 0.2389068603515625, 0.27205657958984375, 0.305206298828125, 0.33835601806640625, 0.3715057373046875, 0.40465545654296875, 0.43780517578125, 0.47095489501953125, 0.5041046142578125, 0.5372543334960938, 0.570404052734375, 0.6035537719726562, 0.6367034912109375, 0.6698532104492188, 0.7030029296875, 0.7361526489257812, 0.7693023681640625, 0.8024520874023438, 0.835601806640625, 0.8687515258789062, 0.9019012451171875, 0.9350509643554688, 0.96820068359375, 1.0013504028320312, 1.0345001220703125, 1.0676498413085938, 1.100799560546875, 1.1339492797851562, 1.1670989990234375, 1.2002487182617188, 1.2333984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 12.0, 12.0, 25.0, 72.0, 214.0, 410.0, 143.0, 58.0, 25.0, 9.0, 14.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01611328125, -0.015502691268920898, -0.014892101287841797, -0.014281511306762695, -0.013670921325683594, -0.013060331344604492, -0.01244974136352539, -0.011839151382446289, -0.011228561401367188, -0.010617971420288086, -0.010007381439208984, -0.009396791458129883, -0.008786201477050781, -0.00817561149597168, -0.007565021514892578, -0.0069544315338134766, -0.006343841552734375, -0.0057332515716552734, -0.005122661590576172, -0.00451207160949707, -0.0039014816284179688, -0.003290891647338867, -0.0026803016662597656, -0.002069711685180664, -0.0014591217041015625, -0.0008485317230224609, -0.00023794174194335938, 0.0003726482391357422, 0.0009832382202148438, 0.0015938282012939453, 0.002204418182373047, 0.0028150081634521484, 0.00342559814453125, 0.0040361881256103516, 0.004646778106689453, 0.005257368087768555, 0.005867958068847656, 0.006478548049926758, 0.007089138031005859, 0.007699728012084961, 0.008310317993164062, 0.008920907974243164, 0.009531497955322266, 0.010142087936401367, 0.010752677917480469, 0.01136326789855957, 0.011973857879638672, 0.012584447860717773, 0.013195037841796875, 0.013805627822875977, 0.014416217803955078, 0.01502680778503418, 0.01563739776611328, 0.016247987747192383, 0.016858577728271484, 0.017469167709350586, 0.018079757690429688, 0.01869034767150879, 0.01930093765258789, 0.019911527633666992, 0.020522117614746094, 0.021132707595825195, 0.021743297576904297, 0.0223538875579834, 0.0229644775390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 2.0, 4.0, 9.0, 14.0, 18.0, 24.0, 33.0, 60.0, 88.0, 116.0, 181.0, 268.0, 440.0, 634.0, 996.0, 1512.0, 2510.0, 3882.0, 6336.0, 10179.0, 16757.0, 30673.0, 60794.0, 144917.0, 434088.0, 180159.0, 70329.0, 34581.0, 19091.0, 11203.0, 6798.0, 4311.0, 2732.0, 1703.0, 1106.0, 674.0, 421.0, 291.0, 209.0, 127.0, 80.0, 60.0, 45.0, 32.0, 17.0, 6.0, 15.0, 9.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0223388671875, -0.021673917770385742, -0.021008968353271484, -0.020344018936157227, -0.01967906951904297, -0.01901412010192871, -0.018349170684814453, -0.017684221267700195, -0.017019271850585938, -0.01635432243347168, -0.015689373016357422, -0.015024423599243164, -0.014359474182128906, -0.013694524765014648, -0.01302957534790039, -0.012364625930786133, -0.011699676513671875, -0.011034727096557617, -0.01036977767944336, -0.009704828262329102, -0.009039878845214844, -0.008374929428100586, -0.007709980010986328, -0.00704503059387207, -0.0063800811767578125, -0.005715131759643555, -0.005050182342529297, -0.004385232925415039, -0.0037202835083007812, -0.0030553340911865234, -0.0023903846740722656, -0.0017254352569580078, -0.00106048583984375, -0.0003955364227294922, 0.0002694129943847656, 0.0009343624114990234, 0.0015993118286132812, 0.002264261245727539, 0.002929210662841797, 0.0035941600799560547, 0.0042591094970703125, 0.00492405891418457, 0.005589008331298828, 0.006253957748413086, 0.006918907165527344, 0.0075838565826416016, 0.00824880599975586, 0.008913755416870117, 0.009578704833984375, 0.010243654251098633, 0.01090860366821289, 0.011573553085327148, 0.012238502502441406, 0.012903451919555664, 0.013568401336669922, 0.01423335075378418, 0.014898300170898438, 0.015563249588012695, 0.016228199005126953, 0.01689314842224121, 0.01755809783935547, 0.018223047256469727, 0.018887996673583984, 0.019552946090698242, 0.0202178955078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 4.0, 5.0, 13.0, 9.0, 10.0, 17.0, 10.0, 23.0, 9.0, 15.0, 11.0, 21.0, 35.0, 44.0, 32.0, 29.0, 38.0, 39.0, 34.0, 37.0, 29.0, 40.0, 42.0, 38.0, 33.0, 30.0, 43.0, 26.0, 33.0, 20.0, 38.0, 23.0, 14.0, 22.0, 19.0, 16.0, 11.0, 11.0, 9.0, 10.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01287841796875, -0.012460589408874512, -0.012042760848999023, -0.011624932289123535, -0.011207103729248047, -0.010789275169372559, -0.01037144660949707, -0.009953618049621582, -0.009535789489746094, -0.009117960929870605, -0.008700132369995117, -0.008282303810119629, -0.00786447525024414, -0.007446646690368652, -0.007028818130493164, -0.006610989570617676, -0.0061931610107421875, -0.005775332450866699, -0.005357503890991211, -0.004939675331115723, -0.004521846771240234, -0.004104018211364746, -0.003686189651489258, -0.0032683610916137695, -0.0028505325317382812, -0.002432703971862793, -0.0020148754119873047, -0.0015970468521118164, -0.0011792182922363281, -0.0007613897323608398, -0.00034356117248535156, 7.426738739013672e-05, 0.000492095947265625, 0.0009099245071411133, 0.0013277530670166016, 0.0017455816268920898, 0.002163410186767578, 0.0025812387466430664, 0.0029990673065185547, 0.003416895866394043, 0.0038347244262695312, 0.0042525529861450195, 0.004670381546020508, 0.005088210105895996, 0.005506038665771484, 0.005923867225646973, 0.006341695785522461, 0.006759524345397949, 0.0071773529052734375, 0.007595181465148926, 0.008013010025024414, 0.008430838584899902, 0.00884866714477539, 0.009266495704650879, 0.009684324264526367, 0.010102152824401855, 0.010519981384277344, 0.010937809944152832, 0.01135563850402832, 0.011773467063903809, 0.012191295623779297, 0.012609124183654785, 0.013026952743530273, 0.013444781303405762, 0.01386260986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 14.0, 9.0, 30.0, 38.0, 78.0, 175.0, 266.0, 710.0, 1957.0, 6265.0, 30284.0, 636974.0, 339980.0, 23584.0, 5311.0, 1656.0, 640.0, 290.0, 127.0, 59.0, 34.0, 25.0, 10.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0146026611328125, -0.014097929000854492, -0.013593196868896484, -0.013088464736938477, -0.012583732604980469, -0.012079000473022461, -0.011574268341064453, -0.011069536209106445, -0.010564804077148438, -0.01006007194519043, -0.009555339813232422, -0.009050607681274414, -0.008545875549316406, -0.008041143417358398, -0.007536411285400391, -0.007031679153442383, -0.006526947021484375, -0.006022214889526367, -0.005517482757568359, -0.0050127506256103516, -0.004508018493652344, -0.004003286361694336, -0.003498554229736328, -0.0029938220977783203, -0.0024890899658203125, -0.0019843578338623047, -0.0014796257019042969, -0.0009748935699462891, -0.00047016143798828125, 3.457069396972656e-05, 0.0005393028259277344, 0.0010440349578857422, 0.00154876708984375, 0.002053499221801758, 0.0025582313537597656, 0.0030629634857177734, 0.0035676956176757812, 0.004072427749633789, 0.004577159881591797, 0.005081892013549805, 0.0055866241455078125, 0.00609135627746582, 0.006596088409423828, 0.007100820541381836, 0.007605552673339844, 0.008110284805297852, 0.00861501693725586, 0.009119749069213867, 0.009624481201171875, 0.010129213333129883, 0.01063394546508789, 0.011138677597045898, 0.011643409729003906, 0.012148141860961914, 0.012652873992919922, 0.01315760612487793, 0.013662338256835938, 0.014167070388793945, 0.014671802520751953, 0.015176534652709961, 0.01568126678466797, 0.016185998916625977, 0.016690731048583984, 0.017195463180541992, 0.0177001953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 6.0, 13.0, 18.0, 24.0, 20.0, 25.0, 53.0, 82.0, 197.0, 257.0, 114.0, 61.0, 24.0, 27.0, 22.0, 8.0, 12.0, 5.0, 5.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011116266250610352, -0.00010690558701753616, -0.00010264851152896881, -9.839143604040146e-05, -9.41343605518341e-05, -8.987728506326675e-05, -8.56202095746994e-05, -8.136313408613205e-05, -7.71060585975647e-05, -7.284898310899734e-05, -6.859190762042999e-05, -6.433483213186264e-05, -6.007775664329529e-05, -5.5820681154727936e-05, -5.1563605666160583e-05, -4.730653017759323e-05, -4.304945468902588e-05, -3.8792379200458527e-05, -3.4535303711891174e-05, -3.0278228223323822e-05, -2.602115273475647e-05, -2.1764077246189117e-05, -1.7507001757621765e-05, -1.3249926269054413e-05, -8.99285078048706e-06, -4.735775291919708e-06, -4.78699803352356e-07, 3.7783756852149963e-06, 8.035451173782349e-06, 1.2292526662349701e-05, 1.6549602150917053e-05, 2.0806677639484406e-05, 2.5063753128051758e-05, 2.932082861661911e-05, 3.357790410518646e-05, 3.7834979593753815e-05, 4.209205508232117e-05, 4.634913057088852e-05, 5.060620605945587e-05, 5.4863281548023224e-05, 5.9120357036590576e-05, 6.337743252515793e-05, 6.763450801372528e-05, 7.189158350229263e-05, 7.614865899085999e-05, 8.040573447942734e-05, 8.466280996799469e-05, 8.891988545656204e-05, 9.31769609451294e-05, 9.743403643369675e-05, 0.0001016911119222641, 0.00010594818741083145, 0.0001102052628993988, 0.00011446233838796616, 0.00011871941387653351, 0.00012297648936510086, 0.0001272335648536682, 0.00013149064034223557, 0.00013574771583080292, 0.00014000479131937027, 0.00014426186680793762, 0.00014851894229650497, 0.00015277601778507233, 0.00015703309327363968, 0.00016129016876220703]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 1.0, 5.0, 6.0, 6.0, 4.0, 9.0, 21.0, 20.0, 43.0, 78.0, 163.0, 393.0, 1652.0, 17862.0, 1000452.0, 24913.0, 2101.0, 441.0, 168.0, 72.0, 41.0, 29.0, 14.0, 11.0, 14.0, 10.0, 9.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046966552734375, -0.045523643493652344, -0.04408073425292969, -0.04263782501220703, -0.041194915771484375, -0.03975200653076172, -0.03830909729003906, -0.036866188049316406, -0.03542327880859375, -0.033980369567871094, -0.03253746032714844, -0.03109455108642578, -0.029651641845703125, -0.02820873260498047, -0.026765823364257812, -0.025322914123535156, -0.0238800048828125, -0.022437095642089844, -0.020994186401367188, -0.01955127716064453, -0.018108367919921875, -0.01666545867919922, -0.015222549438476562, -0.013779640197753906, -0.01233673095703125, -0.010893821716308594, -0.009450912475585938, -0.008008003234863281, -0.006565093994140625, -0.005122184753417969, -0.0036792755126953125, -0.0022363662719726562, -0.00079345703125, 0.0006494522094726562, 0.0020923614501953125, 0.0035352706909179688, 0.004978179931640625, 0.006421089172363281, 0.007863998413085938, 0.009306907653808594, 0.01074981689453125, 0.012192726135253906, 0.013635635375976562, 0.015078544616699219, 0.016521453857421875, 0.01796436309814453, 0.019407272338867188, 0.020850181579589844, 0.0222930908203125, 0.023736000061035156, 0.025178909301757812, 0.02662181854248047, 0.028064727783203125, 0.02950763702392578, 0.030950546264648438, 0.032393455505371094, 0.03383636474609375, 0.035279273986816406, 0.03672218322753906, 0.03816509246826172, 0.039608001708984375, 0.04105091094970703, 0.04249382019042969, 0.043936729431152344, 0.045379638671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 9.0, 5.0, 6.0, 10.0, 10.0, 14.0, 15.0, 34.0, 50.0, 60.0, 132.0, 225.0, 178.0, 76.0, 43.0, 30.0, 32.0, 11.0, 14.0, 8.0, 10.0, 5.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00982666015625, -0.009516716003417969, -0.009206771850585938, -0.008896827697753906, -0.008586883544921875, -0.008276939392089844, -0.007966995239257812, -0.007657051086425781, -0.00734710693359375, -0.007037162780761719, -0.0067272186279296875, -0.006417274475097656, -0.006107330322265625, -0.005797386169433594, -0.0054874420166015625, -0.005177497863769531, -0.0048675537109375, -0.004557609558105469, -0.0042476654052734375, -0.003937721252441406, -0.003627777099609375, -0.0033178329467773438, -0.0030078887939453125, -0.0026979446411132812, -0.00238800048828125, -0.0020780563354492188, -0.0017681121826171875, -0.0014581680297851562, -0.001148223876953125, -0.0008382797241210938, -0.0005283355712890625, -0.00021839141845703125, 9.1552734375e-05, 0.00040149688720703125, 0.0007114410400390625, 0.0010213851928710938, 0.001331329345703125, 0.0016412734985351562, 0.0019512176513671875, 0.0022611618041992188, 0.00257110595703125, 0.0028810501098632812, 0.0031909942626953125, 0.0035009384155273438, 0.003810882568359375, 0.004120826721191406, 0.0044307708740234375, 0.004740715026855469, 0.0050506591796875, 0.005360603332519531, 0.0056705474853515625, 0.005980491638183594, 0.006290435791015625, 0.006600379943847656, 0.0069103240966796875, 0.007220268249511719, 0.00753021240234375, 0.007840156555175781, 0.008150100708007812, 0.008460044860839844, 0.008769989013671875, 0.009079933166503906, 0.009389877319335938, 0.009699821472167969, 0.010009765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 93.0, 613.0, 228.0, 49.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773010611534119, -0.9563300609588623, -0.9353590607643127, -0.9143880605697632, -0.8934170007705688, -0.8724460005760193, -0.8514750003814697, -0.8305040001869202, -0.8095329999923706, -0.788561999797821, -0.7675909996032715, -0.7466199398040771, -0.7256489396095276, -0.704677939414978, -0.6837069392204285, -0.6627359390258789, -0.6417648792266846, -0.620793879032135, -0.5998228788375854, -0.5788518190383911, -0.5578808188438416, -0.536909818649292, -0.5159388184547424, -0.49496781826019287, -0.4739967882633209, -0.45302578806877136, -0.4320547580718994, -0.41108375787734985, -0.3901127576828003, -0.36914172768592834, -0.3481707274913788, -0.32719969749450684, -0.3062286972999573, -0.2852576971054077, -0.26428666710853577, -0.2433156669139862, -0.22234465181827545, -0.2013736367225647, -0.18040263652801514, -0.15943162143230438, -0.13846060633659363, -0.11748959124088287, -0.09651858359575272, -0.07554757595062256, -0.054576560854911804, -0.03360554575920105, -0.01263454556465149, 0.008336469531059265, 0.02930748462677002, 0.050278495997190475, 0.07124950736761093, 0.09222051501274109, 0.11319153010845184, 0.1341625452041626, 0.15513354539871216, 0.1761045604944229, 0.19707557559013367, 0.21804659068584442, 0.23901760578155518, 0.25998860597610474, 0.2809596061706543, 0.30193063616752625, 0.3229016363620758, 0.34387266635894775, 0.3648436665534973]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 12.0, 14.0, 16.0, 16.0, 20.0, 25.0, 28.0, 38.0, 56.0, 37.0, 51.0, 56.0, 69.0, 81.0, 60.0, 61.0, 44.0, 46.0, 58.0, 38.0, 36.0, 35.0, 17.0, 23.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11985033750534058, -0.11644826084375381, -0.11304618418216705, -0.10964410752058029, -0.10624203085899353, -0.10283994674682617, -0.09943787008523941, -0.09603579342365265, -0.09263371676206589, -0.08923164010047913, -0.08582956343889236, -0.0824274867773056, -0.07902540266513824, -0.07562333345413208, -0.07222124934196472, -0.06881917268037796, -0.0654170960187912, -0.06201501935720444, -0.058612942695617676, -0.055210862308740616, -0.051808785647153854, -0.04840670898556709, -0.04500462859869003, -0.04160255193710327, -0.03820047527551651, -0.03479839861392975, -0.03139632195234299, -0.027994241565465927, -0.024592164903879166, -0.021190088242292404, -0.017788009718060493, -0.014385931193828583, -0.010983854532241821, -0.007581776939332485, -0.004179699346423149, -0.000777621753513813, 0.002624455839395523, 0.0060265325009822845, 0.009428611025214195, 0.012830689549446106, 0.016232766211032867, 0.01963484287261963, 0.02303692139685154, 0.02643899992108345, 0.029841076582670212, 0.03324315324425697, 0.03664523363113403, 0.040047310292720795, 0.043449386954307556, 0.04685146361589432, 0.05025354027748108, 0.05365562066435814, 0.0570576973259449, 0.06045977398753166, 0.06386185437440872, 0.06726393103599548, 0.07066600769758224, 0.074068084359169, 0.07747016102075577, 0.08087223768234253, 0.08427432179450989, 0.08767639100551605, 0.09107847511768341, 0.09448055177927017, 0.09788262844085693]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 10.0, 9.0, 7.0, 13.0, 19.0, 29.0, 31.0, 40.0, 59.0, 79.0, 100.0, 166.0, 270.0, 672.0, 3148.0, 50067.0, 4128339.0, 8895.0, 1291.0, 337.0, 184.0, 99.0, 91.0, 74.0, 55.0, 39.0, 41.0, 24.0, 19.0, 17.0, 19.0, 9.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1401195526123047, -0.13497543334960938, -0.12983131408691406, -0.12468719482421875, -0.11954307556152344, -0.11439895629882812, -0.10925483703613281, -0.1041107177734375, -0.09896659851074219, -0.09382247924804688, -0.08867835998535156, -0.08353424072265625, -0.07839012145996094, -0.07324600219726562, -0.06810188293457031, -0.062957763671875, -0.05781364440917969, -0.052669525146484375, -0.04752540588378906, -0.04238128662109375, -0.03723716735839844, -0.032093048095703125, -0.026948928833007812, -0.0218048095703125, -0.016660690307617188, -0.011516571044921875, -0.0063724517822265625, -0.00122833251953125, 0.0039157867431640625, 0.009059906005859375, 0.014204025268554688, 0.01934814453125, 0.024492263793945312, 0.029636383056640625, 0.03478050231933594, 0.03992462158203125, 0.04506874084472656, 0.050212860107421875, 0.05535697937011719, 0.0605010986328125, 0.06564521789550781, 0.07078933715820312, 0.07593345642089844, 0.08107757568359375, 0.08622169494628906, 0.09136581420898438, 0.09650993347167969, 0.101654052734375, 0.10679817199707031, 0.11194229125976562, 0.11708641052246094, 0.12223052978515625, 0.12737464904785156, 0.13251876831054688, 0.1376628875732422, 0.1428070068359375, 0.1479511260986328, 0.15309524536132812, 0.15823936462402344, 0.16338348388671875, 0.16852760314941406, 0.17367172241210938, 0.1788158416748047, 0.1839599609375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 21.0, 56.0, 147.0, 314.0, 268.0, 100.0, 36.0, 21.0, 9.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0161895751953125, -0.01560831069946289, -0.015027046203613281, -0.014445781707763672, -0.013864517211914062, -0.013283252716064453, -0.012701988220214844, -0.012120723724365234, -0.011539459228515625, -0.010958194732666016, -0.010376930236816406, -0.009795665740966797, -0.009214401245117188, -0.008633136749267578, -0.008051872253417969, -0.007470607757568359, -0.00688934326171875, -0.006308078765869141, -0.005726814270019531, -0.005145549774169922, -0.0045642852783203125, -0.003983020782470703, -0.0034017562866210938, -0.0028204917907714844, -0.002239227294921875, -0.0016579627990722656, -0.0010766983032226562, -0.0004954338073730469, 8.58306884765625e-05, 0.0006670951843261719, 0.0012483596801757812, 0.0018296241760253906, 0.002410888671875, 0.0029921531677246094, 0.0035734176635742188, 0.004154682159423828, 0.0047359466552734375, 0.005317211151123047, 0.005898475646972656, 0.006479740142822266, 0.007061004638671875, 0.007642269134521484, 0.008223533630371094, 0.008804798126220703, 0.009386062622070312, 0.009967327117919922, 0.010548591613769531, 0.01112985610961914, 0.01171112060546875, 0.01229238510131836, 0.012873649597167969, 0.013454914093017578, 0.014036178588867188, 0.014617443084716797, 0.015198707580566406, 0.015779972076416016, 0.016361236572265625, 0.016942501068115234, 0.017523765563964844, 0.018105030059814453, 0.018686294555664062, 0.019267559051513672, 0.01984882354736328, 0.02043008804321289, 0.0210113525390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 14.0, 26.0, 52.0, 57.0, 156.0, 293.0, 695.0, 2492.0, 28258.0, 4023157.0, 132016.0, 5308.0, 1020.0, 379.0, 158.0, 96.0, 41.0, 25.0, 17.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.0817418098449707, -0.0796823501586914, -0.07762289047241211, -0.07556343078613281, -0.07350397109985352, -0.07144451141357422, -0.06938505172729492, -0.06732559204101562, -0.06526613235473633, -0.06320667266845703, -0.061147212982177734, -0.05908775329589844, -0.05702829360961914, -0.054968833923339844, -0.05290937423706055, -0.05084991455078125, -0.04879045486450195, -0.046730995178222656, -0.04467153549194336, -0.04261207580566406, -0.040552616119384766, -0.03849315643310547, -0.03643369674682617, -0.034374237060546875, -0.03231477737426758, -0.03025531768798828, -0.028195858001708984, -0.026136398315429688, -0.02407693862915039, -0.022017478942871094, -0.019958019256591797, -0.0178985595703125, -0.015839099884033203, -0.013779640197753906, -0.01172018051147461, -0.009660720825195312, -0.007601261138916016, -0.005541801452636719, -0.003482341766357422, -0.001422882080078125, 0.0006365776062011719, 0.0026960372924804688, 0.004755496978759766, 0.0068149566650390625, 0.00887441635131836, 0.010933876037597656, 0.012993335723876953, 0.01505279541015625, 0.017112255096435547, 0.019171714782714844, 0.02123117446899414, 0.023290634155273438, 0.025350093841552734, 0.02740955352783203, 0.029469013214111328, 0.031528472900390625, 0.03358793258666992, 0.03564739227294922, 0.037706851959228516, 0.03976631164550781, 0.04182577133178711, 0.043885231018066406, 0.0459446907043457, 0.048004150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 11.0, 19.0, 18.0, 24.0, 34.0, 83.0, 119.0, 215.0, 537.0, 1919.0, 573.0, 232.0, 110.0, 70.0, 36.0, 24.0, 19.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0299224853515625, -0.029292821884155273, -0.028663158416748047, -0.02803349494934082, -0.027403831481933594, -0.026774168014526367, -0.02614450454711914, -0.025514841079711914, -0.024885177612304688, -0.02425551414489746, -0.023625850677490234, -0.022996187210083008, -0.02236652374267578, -0.021736860275268555, -0.021107196807861328, -0.0204775333404541, -0.019847869873046875, -0.01921820640563965, -0.018588542938232422, -0.017958879470825195, -0.01732921600341797, -0.016699552536010742, -0.016069889068603516, -0.015440225601196289, -0.014810562133789062, -0.014180898666381836, -0.01355123519897461, -0.012921571731567383, -0.012291908264160156, -0.01166224479675293, -0.011032581329345703, -0.010402917861938477, -0.00977325439453125, -0.009143590927124023, -0.008513927459716797, -0.00788426399230957, -0.007254600524902344, -0.006624937057495117, -0.005995273590087891, -0.005365610122680664, -0.0047359466552734375, -0.004106283187866211, -0.0034766197204589844, -0.002846956253051758, -0.0022172927856445312, -0.0015876293182373047, -0.0009579658508300781, -0.00032830238342285156, 0.000301361083984375, 0.0009310245513916016, 0.0015606880187988281, 0.0021903514862060547, 0.0028200149536132812, 0.003449678421020508, 0.004079341888427734, 0.004709005355834961, 0.0053386688232421875, 0.005968332290649414, 0.006597995758056641, 0.007227659225463867, 0.007857322692871094, 0.00848698616027832, 0.009116649627685547, 0.009746313095092773, 0.0103759765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 16.0, 42.0, 136.0, 384.0, 317.0, 84.0, 19.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1301613450050354, -0.12550246715545654, -0.12084360420703888, -0.11618472635746002, -0.11152585595846176, -0.1068669855594635, -0.10220810770988464, -0.09754923731088638, -0.09289036691188812, -0.08823149651288986, -0.0835726261138916, -0.07891374826431274, -0.07425487786531448, -0.06959600746631622, -0.06493712961673737, -0.060278259217739105, -0.055619388818740845, -0.050960518419742584, -0.046301644295454025, -0.041642770171165466, -0.036983899772167206, -0.032325029373168945, -0.027666155248880386, -0.023007281124591827, -0.018348410725593567, -0.013689538463950157, -0.009030666202306747, -0.004371793940663338, 0.000287078320980072, 0.004945950582623482, 0.009604822844266891, 0.01426369696855545, 0.01892256736755371, 0.02358143962919712, 0.02824031189084053, 0.03289918601512909, 0.03755805641412735, 0.04221692681312561, 0.04687580093741417, 0.05153467506170273, 0.05619354546070099, 0.06085241585969925, 0.06551128625869751, 0.07017016410827637, 0.07482903450727463, 0.07948790490627289, 0.08414678275585175, 0.08880565315485, 0.09346452355384827, 0.09812339395284653, 0.10278226435184479, 0.10744114220142365, 0.1121000126004219, 0.11675888299942017, 0.12141776084899902, 0.12607663869857788, 0.13073550164699554, 0.1353943794965744, 0.14005324244499207, 0.14471212029457092, 0.14937099814414978, 0.15402986109256744, 0.1586887389421463, 0.16334760189056396, 0.16800647974014282]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 13.0, 13.0, 14.0, 18.0, 29.0, 33.0, 41.0, 37.0, 43.0, 27.0, 35.0, 37.0, 43.0, 47.0, 52.0, 46.0, 52.0, 51.0, 44.0, 46.0, 32.0, 39.0, 28.0, 21.0, 26.0, 23.0, 21.0, 16.0, 11.0, 14.0, 12.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.049556076526641846, -0.04827851057052612, -0.0470009446144104, -0.04572337493300438, -0.04444580897688866, -0.043168243020772934, -0.04189067333936691, -0.04061310738325119, -0.03933554142713547, -0.038057975471019745, -0.03678040951490402, -0.035502839833498, -0.03422527387738228, -0.032947707921266556, -0.031670138239860535, -0.030392572283744812, -0.02911500632762909, -0.027837440371513367, -0.026559872552752495, -0.025282304733991623, -0.0240047387778759, -0.022727172821760178, -0.021449605002999306, -0.020172037184238434, -0.01889447122812271, -0.01761690527200699, -0.016339337453246117, -0.01506177056580782, -0.013784203678369522, -0.012506636790931225, -0.011229069903492928, -0.00995150301605463, -0.008673936128616333, -0.007396369241178036, -0.0061188023537397385, -0.004841235466301441, -0.003563668578863144, -0.0022861016914248466, -0.0010085348039865494, 0.0002690320834517479, 0.0015465989708900452, 0.0028241658583283424, 0.00410173274576664, 0.005379299633204937, 0.006656866520643234, 0.007934433408081532, 0.009212000295519829, 0.010489567182958126, 0.011767134070396423, 0.01304470095783472, 0.014322267845273018, 0.015599834732711315, 0.016877401620149612, 0.018154967576265335, 0.019432535395026207, 0.02071010321378708, 0.0219876691699028, 0.023265235126018524, 0.024542802944779396, 0.025820370763540268, 0.02709793671965599, 0.028375502675771713, 0.029653070494532585, 0.030930638313293457, 0.03220820426940918]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 6.0, 10.0, 26.0, 13.0, 21.0, 43.0, 40.0, 52.0, 78.0, 87.0, 123.0, 167.0, 264.0, 366.0, 619.0, 1465.0, 7212.0, 299703.0, 723420.0, 10980.0, 1772.0, 722.0, 398.0, 255.0, 191.0, 117.0, 110.0, 67.0, 33.0, 49.0, 32.0, 27.0, 22.0, 18.0, 8.0, 10.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0693359375, -0.06710529327392578, -0.06487464904785156, -0.06264400482177734, -0.060413360595703125, -0.058182716369628906, -0.05595207214355469, -0.05372142791748047, -0.05149078369140625, -0.04926013946533203, -0.04702949523925781, -0.044798851013183594, -0.042568206787109375, -0.040337562561035156, -0.03810691833496094, -0.03587627410888672, -0.0336456298828125, -0.03141498565673828, -0.029184341430664062, -0.026953697204589844, -0.024723052978515625, -0.022492408752441406, -0.020261764526367188, -0.01803112030029297, -0.01580047607421875, -0.013569831848144531, -0.011339187622070312, -0.009108543395996094, -0.006877899169921875, -0.004647254943847656, -0.0024166107177734375, -0.00018596649169921875, 0.002044677734375, 0.004275321960449219, 0.0065059661865234375, 0.008736610412597656, 0.010967254638671875, 0.013197898864746094, 0.015428543090820312, 0.01765918731689453, 0.01988983154296875, 0.02212047576904297, 0.024351119995117188, 0.026581764221191406, 0.028812408447265625, 0.031043052673339844, 0.03327369689941406, 0.03550434112548828, 0.0377349853515625, 0.03996562957763672, 0.04219627380371094, 0.044426918029785156, 0.046657562255859375, 0.048888206481933594, 0.05111885070800781, 0.05334949493408203, 0.05558013916015625, 0.05781078338623047, 0.06004142761230469, 0.062272071838378906, 0.06450271606445312, 0.06673336029052734, 0.06896400451660156, 0.07119464874267578, 0.07342529296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 12.0, 12.0, 26.0, 82.0, 180.0, 360.0, 192.0, 70.0, 38.0, 11.0, 12.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0154266357421875, -0.01484537124633789, -0.014264106750488281, -0.013682842254638672, -0.013101577758789062, -0.012520313262939453, -0.011939048767089844, -0.011357784271240234, -0.010776519775390625, -0.010195255279541016, -0.009613990783691406, -0.009032726287841797, -0.008451461791992188, -0.007870197296142578, -0.007288932800292969, -0.006707668304443359, -0.00612640380859375, -0.005545139312744141, -0.004963874816894531, -0.004382610321044922, -0.0038013458251953125, -0.003220081329345703, -0.0026388168334960938, -0.0020575523376464844, -0.001476287841796875, -0.0008950233459472656, -0.00031375885009765625, 0.0002675056457519531, 0.0008487701416015625, 0.0014300346374511719, 0.0020112991333007812, 0.0025925636291503906, 0.003173828125, 0.0037550926208496094, 0.004336357116699219, 0.004917621612548828, 0.0054988861083984375, 0.006080150604248047, 0.006661415100097656, 0.007242679595947266, 0.007823944091796875, 0.008405208587646484, 0.008986473083496094, 0.009567737579345703, 0.010149002075195312, 0.010730266571044922, 0.011311531066894531, 0.01189279556274414, 0.01247406005859375, 0.01305532455444336, 0.013636589050292969, 0.014217853546142578, 0.014799118041992188, 0.015380382537841797, 0.015961647033691406, 0.016542911529541016, 0.017124176025390625, 0.017705440521240234, 0.018286705017089844, 0.018867969512939453, 0.019449234008789062, 0.020030498504638672, 0.02061176300048828, 0.02119302749633789, 0.0217742919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 13.0, 13.0, 17.0, 21.0, 32.0, 38.0, 47.0, 54.0, 99.0, 112.0, 181.0, 322.0, 837.0, 16906.0, 1009734.0, 18283.0, 929.0, 296.0, 173.0, 127.0, 78.0, 43.0, 56.0, 36.0, 20.0, 20.0, 15.0, 15.0, 10.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.08580875396728516, -0.08268928527832031, -0.07956981658935547, -0.07645034790039062, -0.07333087921142578, -0.07021141052246094, -0.0670919418334961, -0.06397247314453125, -0.060853004455566406, -0.05773353576660156, -0.05461406707763672, -0.051494598388671875, -0.04837512969970703, -0.04525566101074219, -0.042136192321777344, -0.0390167236328125, -0.035897254943847656, -0.03277778625488281, -0.02965831756591797, -0.026538848876953125, -0.02341938018798828, -0.020299911499023438, -0.017180442810058594, -0.01406097412109375, -0.010941505432128906, -0.007822036743164062, -0.004702568054199219, -0.001583099365234375, 0.0015363693237304688, 0.0046558380126953125, 0.007775306701660156, 0.010894775390625, 0.014014244079589844, 0.017133712768554688, 0.02025318145751953, 0.023372650146484375, 0.02649211883544922, 0.029611587524414062, 0.032731056213378906, 0.03585052490234375, 0.038969993591308594, 0.04208946228027344, 0.04520893096923828, 0.048328399658203125, 0.05144786834716797, 0.05456733703613281, 0.057686805725097656, 0.0608062744140625, 0.06392574310302734, 0.06704521179199219, 0.07016468048095703, 0.07328414916992188, 0.07640361785888672, 0.07952308654785156, 0.0826425552368164, 0.08576202392578125, 0.0888814926147461, 0.09200096130371094, 0.09512042999267578, 0.09823989868164062, 0.10135936737060547, 0.10447883605957031, 0.10759830474853516, 0.1107177734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 6.0, 14.0, 12.0, 13.0, 23.0, 24.0, 27.0, 31.0, 41.0, 41.0, 41.0, 56.0, 55.0, 61.0, 63.0, 51.0, 49.0, 70.0, 45.0, 51.0, 46.0, 23.0, 28.0, 31.0, 20.0, 16.0, 11.0, 11.0, 13.0, 6.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01403045654296875, -0.013530611991882324, -0.013030767440795898, -0.012530922889709473, -0.012031078338623047, -0.011531233787536621, -0.011031389236450195, -0.01053154468536377, -0.010031700134277344, -0.009531855583190918, -0.009032011032104492, -0.008532166481018066, -0.00803232192993164, -0.007532477378845215, -0.007032632827758789, -0.006532788276672363, -0.0060329437255859375, -0.005533099174499512, -0.005033254623413086, -0.00453341007232666, -0.004033565521240234, -0.0035337209701538086, -0.003033876419067383, -0.002534031867980957, -0.0020341873168945312, -0.0015343427658081055, -0.0010344982147216797, -0.0005346536636352539, -3.4809112548828125e-05, 0.00046503543853759766, 0.0009648799896240234, 0.0014647245407104492, 0.001964569091796875, 0.0024644136428833008, 0.0029642581939697266, 0.0034641027450561523, 0.003963947296142578, 0.004463791847229004, 0.00496363639831543, 0.0054634809494018555, 0.005963325500488281, 0.006463170051574707, 0.006963014602661133, 0.007462859153747559, 0.007962703704833984, 0.00846254825592041, 0.008962392807006836, 0.009462237358093262, 0.009962081909179688, 0.010461926460266113, 0.010961771011352539, 0.011461615562438965, 0.01196146011352539, 0.012461304664611816, 0.012961149215698242, 0.013460993766784668, 0.013960838317871094, 0.01446068286895752, 0.014960527420043945, 0.015460371971130371, 0.015960216522216797, 0.016460061073303223, 0.01695990562438965, 0.017459750175476074, 0.0179595947265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 7.0, 9.0, 15.0, 17.0, 37.0, 51.0, 106.0, 283.0, 932.0, 4851.0, 89068.0, 938777.0, 11754.0, 1777.0, 447.0, 153.0, 84.0, 40.0, 33.0, 31.0, 20.0, 13.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03436279296875, -0.03318643569946289, -0.03201007843017578, -0.030833721160888672, -0.029657363891601562, -0.028481006622314453, -0.027304649353027344, -0.026128292083740234, -0.024951934814453125, -0.023775577545166016, -0.022599220275878906, -0.021422863006591797, -0.020246505737304688, -0.019070148468017578, -0.01789379119873047, -0.01671743392944336, -0.01554107666015625, -0.01436471939086914, -0.013188362121582031, -0.012012004852294922, -0.010835647583007812, -0.009659290313720703, -0.008482933044433594, -0.007306575775146484, -0.006130218505859375, -0.004953861236572266, -0.0037775039672851562, -0.002601146697998047, -0.0014247894287109375, -0.0002484321594238281, 0.0009279251098632812, 0.0021042823791503906, 0.0032806396484375, 0.004456996917724609, 0.005633354187011719, 0.006809711456298828, 0.007986068725585938, 0.009162425994873047, 0.010338783264160156, 0.011515140533447266, 0.012691497802734375, 0.013867855072021484, 0.015044212341308594, 0.016220569610595703, 0.017396926879882812, 0.018573284149169922, 0.01974964141845703, 0.02092599868774414, 0.02210235595703125, 0.02327871322631836, 0.02445507049560547, 0.025631427764892578, 0.026807785034179688, 0.027984142303466797, 0.029160499572753906, 0.030336856842041016, 0.031513214111328125, 0.032689571380615234, 0.033865928649902344, 0.03504228591918945, 0.03621864318847656, 0.03739500045776367, 0.03857135772705078, 0.03974771499633789, 0.040924072265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 14.0, 21.0, 22.0, 33.0, 45.0, 66.0, 98.0, 138.0, 132.0, 115.0, 90.0, 55.0, 51.0, 30.0, 25.0, 14.0, 18.0, 8.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000148773193359375, -0.00014458410441875458, -0.00014039501547813416, -0.00013620592653751373, -0.0001320168375968933, -0.0001278277486562729, -0.00012363865971565247, -0.00011944957077503204, -0.00011526048183441162, -0.0001110713928937912, -0.00010688230395317078, -0.00010269321501255035, -9.850412607192993e-05, -9.431503713130951e-05, -9.012594819068909e-05, -8.593685925006866e-05, -8.174777030944824e-05, -7.755868136882782e-05, -7.33695924282074e-05, -6.918050348758698e-05, -6.499141454696655e-05, -6.080232560634613e-05, -5.661323666572571e-05, -5.2424147725105286e-05, -4.823505878448486e-05, -4.404596984386444e-05, -3.985688090324402e-05, -3.5667791962623596e-05, -3.1478703022003174e-05, -2.728961408138275e-05, -2.310052514076233e-05, -1.8911436200141907e-05, -1.4722347259521484e-05, -1.0533258318901062e-05, -6.34416937828064e-06, -2.1550804376602173e-06, 2.034008502960205e-06, 6.2230974435806274e-06, 1.041218638420105e-05, 1.4601275324821472e-05, 1.8790364265441895e-05, 2.2979453206062317e-05, 2.716854214668274e-05, 3.135763108730316e-05, 3.5546720027923584e-05, 3.9735808968544006e-05, 4.392489790916443e-05, 4.811398684978485e-05, 5.2303075790405273e-05, 5.6492164731025696e-05, 6.068125367164612e-05, 6.487034261226654e-05, 6.905943155288696e-05, 7.324852049350739e-05, 7.743760943412781e-05, 8.162669837474823e-05, 8.581578731536865e-05, 9.000487625598907e-05, 9.41939651966095e-05, 9.838305413722992e-05, 0.00010257214307785034, 0.00010676123201847076, 0.00011095032095909119, 0.00011513940989971161, 0.00011932849884033203]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 10.0, 7.0, 17.0, 11.0, 20.0, 29.0, 19.0, 47.0, 50.0, 82.0, 147.0, 393.0, 5009.0, 1010823.0, 30473.0, 842.0, 184.0, 107.0, 67.0, 49.0, 31.0, 28.0, 22.0, 9.0, 14.0, 22.0, 8.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0235748291015625, -0.02269148826599121, -0.021808147430419922, -0.020924806594848633, -0.020041465759277344, -0.019158124923706055, -0.018274784088134766, -0.017391443252563477, -0.016508102416992188, -0.015624761581420898, -0.01474142074584961, -0.01385807991027832, -0.012974739074707031, -0.012091398239135742, -0.011208057403564453, -0.010324716567993164, -0.009441375732421875, -0.008558034896850586, -0.007674694061279297, -0.006791353225708008, -0.005908012390136719, -0.00502467155456543, -0.004141330718994141, -0.0032579898834228516, -0.0023746490478515625, -0.0014913082122802734, -0.0006079673767089844, 0.0002753734588623047, 0.0011587142944335938, 0.002042055130004883, 0.002925395965576172, 0.003808736801147461, 0.00469207763671875, 0.005575418472290039, 0.006458759307861328, 0.007342100143432617, 0.008225440979003906, 0.009108781814575195, 0.009992122650146484, 0.010875463485717773, 0.011758804321289062, 0.012642145156860352, 0.01352548599243164, 0.01440882682800293, 0.015292167663574219, 0.016175508499145508, 0.017058849334716797, 0.017942190170288086, 0.018825531005859375, 0.019708871841430664, 0.020592212677001953, 0.021475553512573242, 0.02235889434814453, 0.02324223518371582, 0.02412557601928711, 0.0250089168548584, 0.025892257690429688, 0.026775598526000977, 0.027658939361572266, 0.028542280197143555, 0.029425621032714844, 0.030308961868286133, 0.031192302703857422, 0.03207564353942871, 0.032958984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 7.0, 15.0, 9.0, 17.0, 23.0, 14.0, 35.0, 24.0, 41.0, 44.0, 54.0, 92.0, 120.0, 113.0, 83.0, 48.0, 54.0, 35.0, 37.0, 27.0, 11.0, 19.0, 11.0, 7.0, 16.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003673553466796875, -0.0035366415977478027, -0.0033997297286987305, -0.003262817859649658, -0.003125905990600586, -0.0029889941215515137, -0.0028520822525024414, -0.002715170383453369, -0.002578258514404297, -0.0024413466453552246, -0.0023044347763061523, -0.00216752290725708, -0.002030611038208008, -0.0018936991691589355, -0.0017567873001098633, -0.001619875431060791, -0.0014829635620117188, -0.0013460516929626465, -0.0012091398239135742, -0.001072227954864502, -0.0009353160858154297, -0.0007984042167663574, -0.0006614923477172852, -0.0005245804786682129, -0.0003876686096191406, -0.00025075674057006836, -0.0001138448715209961, 2.3066997528076172e-05, 0.00015997886657714844, 0.0002968907356262207, 0.00043380260467529297, 0.0005707144737243652, 0.0007076263427734375, 0.0008445382118225098, 0.000981450080871582, 0.0011183619499206543, 0.0012552738189697266, 0.0013921856880187988, 0.001529097557067871, 0.0016660094261169434, 0.0018029212951660156, 0.0019398331642150879, 0.00207674503326416, 0.0022136569023132324, 0.0023505687713623047, 0.002487480640411377, 0.0026243925094604492, 0.0027613043785095215, 0.0028982162475585938, 0.003035128116607666, 0.0031720399856567383, 0.0033089518547058105, 0.003445863723754883, 0.003582775592803955, 0.0037196874618530273, 0.0038565993309020996, 0.003993511199951172, 0.004130423069000244, 0.004267334938049316, 0.004404246807098389, 0.004541158676147461, 0.004678070545196533, 0.0048149824142456055, 0.004951894283294678, 0.00508880615234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 57.0, 345.0, 495.0, 82.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2985553741455078, -0.29031455516815186, -0.2820737659931183, -0.27383294701576233, -0.26559212803840637, -0.2573513388633728, -0.24911051988601685, -0.2408697009086609, -0.23262889683246613, -0.22438809275627136, -0.2161472737789154, -0.20790646970272064, -0.19966566562652588, -0.19142484664916992, -0.18318404257297516, -0.1749432384967804, -0.16670241951942444, -0.15846161544322968, -0.15022079646587372, -0.14197999238967896, -0.133739173412323, -0.12549836933612823, -0.11725756525993347, -0.10901675373315811, -0.10077594220638275, -0.09253513067960739, -0.08429431915283203, -0.07605351507663727, -0.06781270354986191, -0.05957189202308655, -0.051331084221601486, -0.043090276420116425, -0.03484943509101868, -0.026608625426888466, -0.018367815762758255, -0.010127006098628044, -0.0018861964344978333, 0.006354615092277527, 0.014595422893762589, 0.02283623069524765, 0.03107704222202301, 0.03931785374879837, 0.04755866155028343, 0.055799469351768494, 0.06404028087854385, 0.07228109240531921, 0.08052189648151398, 0.08876270800828934, 0.0970035195350647, 0.10524433106184006, 0.11348514258861542, 0.12172594666481018, 0.12996676564216614, 0.1382075697183609, 0.14644837379455566, 0.15468919277191162, 0.16292999684810638, 0.17117080092430115, 0.1794116199016571, 0.18765242397785187, 0.19589322805404663, 0.2041340470314026, 0.21237485110759735, 0.22061565518379211, 0.22885647416114807]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 9.0, 6.0, 2.0, 15.0, 11.0, 14.0, 21.0, 19.0, 24.0, 23.0, 39.0, 37.0, 47.0, 36.0, 55.0, 44.0, 49.0, 44.0, 56.0, 52.0, 40.0, 48.0, 49.0, 42.0, 28.0, 25.0, 23.0, 25.0, 21.0, 20.0, 14.0, 12.0, 13.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055844008922576904, -0.05409380793571472, -0.05234360694885254, -0.05059340223670006, -0.048843201249837875, -0.04709300026297569, -0.04534279555082321, -0.04359259456396103, -0.041842393577098846, -0.040092192590236664, -0.03834199160337448, -0.036591786891222, -0.03484158590435982, -0.033091384917497635, -0.031341180205345154, -0.02959097921848297, -0.02784077823162079, -0.026090577244758606, -0.024340374395251274, -0.022590171545743942, -0.02083997055888176, -0.019089769572019577, -0.017339566722512245, -0.015589364804327488, -0.01383916288614273, -0.012088960967957973, -0.010338759049773216, -0.008588557131588459, -0.006838355213403702, -0.0050881532952189445, -0.0033379513770341873, -0.00158774945884943, 0.00016245245933532715, 0.0019126543775200844, 0.0036628562957048416, 0.005413058213889599, 0.007163260132074356, 0.008913462050259113, 0.01066366396844387, 0.012413865886628628, 0.014164067804813385, 0.015914268791675568, 0.0176644716411829, 0.01941467449069023, 0.021164875477552414, 0.022915076464414597, 0.02466527931392193, 0.02641548216342926, 0.028165683150291443, 0.029915884137153625, 0.03166608512401581, 0.03341628983616829, 0.03516649082303047, 0.036916691809892654, 0.038666896522045135, 0.04041709750890732, 0.0421672984957695, 0.04391749948263168, 0.045667700469493866, 0.04741790518164635, 0.04916810616850853, 0.05091830715537071, 0.05266851186752319, 0.054418712854385376, 0.05616891384124756]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 10.0, 15.0, 48.0, 104.0, 362.0, 3037.0, 4155366.0, 33491.0, 1346.0, 292.0, 99.0, 39.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11883544921875, -0.11440372467041016, -0.10997200012207031, -0.10554027557373047, -0.10110855102539062, -0.09667682647705078, -0.09224510192871094, -0.0878133773803711, -0.08338165283203125, -0.0789499282836914, -0.07451820373535156, -0.07008647918701172, -0.06565475463867188, -0.06122303009033203, -0.05679130554199219, -0.052359580993652344, -0.0479278564453125, -0.043496131896972656, -0.03906440734863281, -0.03463268280029297, -0.030200958251953125, -0.02576923370361328, -0.021337509155273438, -0.016905784606933594, -0.01247406005859375, -0.008042335510253906, -0.0036106109619140625, 0.0008211135864257812, 0.005252838134765625, 0.009684562683105469, 0.014116287231445312, 0.018548011779785156, 0.022979736328125, 0.027411460876464844, 0.03184318542480469, 0.03627490997314453, 0.040706634521484375, 0.04513835906982422, 0.04957008361816406, 0.054001808166503906, 0.05843353271484375, 0.0628652572631836, 0.06729698181152344, 0.07172870635986328, 0.07616043090820312, 0.08059215545654297, 0.08502388000488281, 0.08945560455322266, 0.0938873291015625, 0.09831905364990234, 0.10275077819824219, 0.10718250274658203, 0.11161422729492188, 0.11604595184326172, 0.12047767639160156, 0.1249094009399414, 0.12934112548828125, 0.1337728500366211, 0.13820457458496094, 0.14263629913330078, 0.14706802368164062, 0.15149974822998047, 0.1559314727783203, 0.16036319732666016, 0.164794921875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 9.0, 22.0, 54.0, 139.0, 305.0, 272.0, 109.0, 47.0, 18.0, 13.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0160369873046875, -0.015441656112670898, -0.014846324920654297, -0.014250993728637695, -0.013655662536621094, -0.013060331344604492, -0.01246500015258789, -0.011869668960571289, -0.011274337768554688, -0.010679006576538086, -0.010083675384521484, -0.009488344192504883, -0.008893013000488281, -0.00829768180847168, -0.007702350616455078, -0.0071070194244384766, -0.006511688232421875, -0.0059163570404052734, -0.005321025848388672, -0.00472569465637207, -0.004130363464355469, -0.003535032272338867, -0.0029397010803222656, -0.002344369888305664, -0.0017490386962890625, -0.001153707504272461, -0.0005583763122558594, 3.695487976074219e-05, 0.0006322860717773438, 0.0012276172637939453, 0.0018229484558105469, 0.0024182796478271484, 0.00301361083984375, 0.0036089420318603516, 0.004204273223876953, 0.004799604415893555, 0.005394935607910156, 0.005990266799926758, 0.006585597991943359, 0.007180929183959961, 0.0077762603759765625, 0.008371591567993164, 0.008966922760009766, 0.009562253952026367, 0.010157585144042969, 0.01075291633605957, 0.011348247528076172, 0.011943578720092773, 0.012538909912109375, 0.013134241104125977, 0.013729572296142578, 0.01432490348815918, 0.014920234680175781, 0.015515565872192383, 0.016110897064208984, 0.016706228256225586, 0.017301559448242188, 0.01789689064025879, 0.01849222183227539, 0.019087553024291992, 0.019682884216308594, 0.020278215408325195, 0.020873546600341797, 0.0214688777923584, 0.022064208984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 13.0, 11.0, 19.0, 34.0, 69.0, 110.0, 317.0, 620.0, 1597.0, 6343.0, 136290.0, 3988130.0, 54024.0, 4246.0, 1287.0, 552.0, 251.0, 146.0, 86.0, 39.0, 33.0, 17.0, 11.0, 13.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.048415184020996094, -0.04687309265136719, -0.04533100128173828, -0.043788909912109375, -0.04224681854248047, -0.04070472717285156, -0.039162635803222656, -0.03762054443359375, -0.036078453063964844, -0.03453636169433594, -0.03299427032470703, -0.031452178955078125, -0.02991008758544922, -0.028367996215820312, -0.026825904846191406, -0.0252838134765625, -0.023741722106933594, -0.022199630737304688, -0.02065753936767578, -0.019115447998046875, -0.01757335662841797, -0.016031265258789062, -0.014489173889160156, -0.01294708251953125, -0.011404991149902344, -0.009862899780273438, -0.008320808410644531, -0.006778717041015625, -0.005236625671386719, -0.0036945343017578125, -0.0021524429321289062, -0.0006103515625, 0.0009317398071289062, 0.0024738311767578125, 0.004015922546386719, 0.005558013916015625, 0.007100105285644531, 0.008642196655273438, 0.010184288024902344, 0.01172637939453125, 0.013268470764160156, 0.014810562133789062, 0.01635265350341797, 0.017894744873046875, 0.01943683624267578, 0.020978927612304688, 0.022521018981933594, 0.0240631103515625, 0.025605201721191406, 0.027147293090820312, 0.02868938446044922, 0.030231475830078125, 0.03177356719970703, 0.03331565856933594, 0.034857749938964844, 0.03639984130859375, 0.037941932678222656, 0.03948402404785156, 0.04102611541748047, 0.042568206787109375, 0.04411029815673828, 0.04565238952636719, 0.047194480895996094, 0.048736572265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 9.0, 7.0, 15.0, 21.0, 53.0, 63.0, 100.0, 170.0, 233.0, 442.0, 809.0, 750.0, 486.0, 336.0, 210.0, 116.0, 76.0, 52.0, 50.0, 26.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012743949890136719, -0.012304306030273438, -0.011864662170410156, -0.011425018310546875, -0.010985374450683594, -0.010545730590820312, -0.010106086730957031, -0.00966644287109375, -0.009226799011230469, -0.008787155151367188, -0.008347511291503906, -0.007907867431640625, -0.007468223571777344, -0.0070285797119140625, -0.006588935852050781, -0.0061492919921875, -0.005709648132324219, -0.0052700042724609375, -0.004830360412597656, -0.004390716552734375, -0.003951072692871094, -0.0035114288330078125, -0.0030717849731445312, -0.00263214111328125, -0.0021924972534179688, -0.0017528533935546875, -0.0013132095336914062, -0.000873565673828125, -0.00043392181396484375, 5.7220458984375e-06, 0.00044536590576171875, 0.000885009765625, 0.0013246536254882812, 0.0017642974853515625, 0.0022039413452148438, 0.002643585205078125, 0.0030832290649414062, 0.0035228729248046875, 0.003962516784667969, 0.00440216064453125, 0.004841804504394531, 0.0052814483642578125, 0.005721092224121094, 0.006160736083984375, 0.006600379943847656, 0.0070400238037109375, 0.007479667663574219, 0.0079193115234375, 0.008358955383300781, 0.008798599243164062, 0.009238243103027344, 0.009677886962890625, 0.010117530822753906, 0.010557174682617188, 0.010996818542480469, 0.01143646240234375, 0.011876106262207031, 0.012315750122070312, 0.012755393981933594, 0.013195037841796875, 0.013634681701660156, 0.014074325561523438, 0.014513969421386719, 0.01495361328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 29.0, 647.0, 309.0, 22.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4934025704860687, -0.4796161949634552, -0.4658298194408417, -0.45204344391822815, -0.43825703859329224, -0.4244706630706787, -0.4106842875480652, -0.39689791202545166, -0.38311153650283813, -0.3693251609802246, -0.3555387854576111, -0.34175240993499756, -0.32796603441238403, -0.3141796588897705, -0.3003932535648346, -0.28660687804222107, -0.27282050251960754, -0.259034126996994, -0.2452477514743805, -0.23146136105060577, -0.21767498552799225, -0.20388861000537872, -0.190102219581604, -0.17631584405899048, -0.16252946853637695, -0.14874309301376343, -0.1349567174911499, -0.12117032706737518, -0.10738395154476166, -0.09359757602214813, -0.07981119304895401, -0.06602481007575989, -0.052238404750823975, -0.03845202550292015, -0.024665646255016327, -0.010879267007112503, 0.002907112240791321, 0.016693487763404846, 0.03047987073659897, 0.04426625370979309, 0.058052629232406616, 0.07183900475502014, 0.08562538772821426, 0.09941177070140839, 0.11319814622402191, 0.12698452174663544, 0.14077091217041016, 0.15455728769302368, 0.1683436632156372, 0.18213003873825073, 0.19591641426086426, 0.20970280468463898, 0.2234891802072525, 0.23727555572986603, 0.25106194615364075, 0.2648483216762543, 0.2786346971988678, 0.2924210727214813, 0.30620744824409485, 0.3199938237667084, 0.3337802290916443, 0.3475666046142578, 0.36135298013687134, 0.37513935565948486, 0.3889257311820984]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 10.0, 13.0, 11.0, 14.0, 21.0, 16.0, 17.0, 22.0, 29.0, 30.0, 30.0, 28.0, 45.0, 37.0, 57.0, 51.0, 43.0, 39.0, 41.0, 33.0, 41.0, 36.0, 31.0, 48.0, 27.0, 30.0, 25.0, 19.0, 18.0, 21.0, 17.0, 14.0, 12.0, 9.0, 12.0, 13.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.04567974805831909, -0.04443579912185669, -0.043191853910684586, -0.04194790869951248, -0.04070395976305008, -0.03946001082658768, -0.03821606561541557, -0.03697212040424347, -0.03572817146778107, -0.034484222531318665, -0.03324027732014656, -0.03199633210897446, -0.030752383172512054, -0.0295084360986948, -0.028264489024877548, -0.027020541951060295, -0.025776594877243042, -0.02453264780342579, -0.023288700729608536, -0.022044753655791283, -0.02080080658197403, -0.019556859508156776, -0.018312912434339523, -0.01706896536052227, -0.015825018286705017, -0.014581071212887764, -0.01333712413907051, -0.012093177065253258, -0.010849229991436005, -0.009605282917618752, -0.008361335843801498, -0.007117388769984245, -0.005873441696166992, -0.004629494622349739, -0.003385547548532486, -0.002141600474715233, -0.0008976534008979797, 0.0003462936729192734, 0.0015902407467365265, 0.0028341878205537796, 0.004078134894371033, 0.005322081968188286, 0.006566029042005539, 0.007809976115822792, 0.009053923189640045, 0.010297870263457298, 0.011541817337274551, 0.012785764411091805, 0.014029711484909058, 0.01527365855872631, 0.016517605632543564, 0.017761552706360817, 0.01900549978017807, 0.020249446853995323, 0.021493393927812576, 0.02273734100162983, 0.023981288075447083, 0.025225235149264336, 0.02646918222308159, 0.027713129296898842, 0.028957076370716095, 0.030201023444533348, 0.0314449705183506, 0.032688915729522705, 0.03393286466598511]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 8.0, 28.0, 13.0, 36.0, 26.0, 45.0, 53.0, 75.0, 94.0, 128.0, 202.0, 328.0, 585.0, 1344.0, 6036.0, 94454.0, 913329.0, 26274.0, 3150.0, 934.0, 442.0, 257.0, 179.0, 133.0, 103.0, 63.0, 48.0, 32.0, 28.0, 24.0, 17.0, 14.0, 8.0, 14.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.10711669921875, -0.10416698455810547, -0.10121726989746094, -0.0982675552368164, -0.09531784057617188, -0.09236812591552734, -0.08941841125488281, -0.08646869659423828, -0.08351898193359375, -0.08056926727294922, -0.07761955261230469, -0.07466983795166016, -0.07172012329101562, -0.0687704086303711, -0.06582069396972656, -0.06287097930908203, -0.0599212646484375, -0.05697154998779297, -0.05402183532714844, -0.051072120666503906, -0.048122406005859375, -0.045172691345214844, -0.04222297668457031, -0.03927326202392578, -0.03632354736328125, -0.03337383270263672, -0.030424118041992188, -0.027474403381347656, -0.024524688720703125, -0.021574974060058594, -0.018625259399414062, -0.01567554473876953, -0.012725830078125, -0.009776115417480469, -0.0068264007568359375, -0.0038766860961914062, -0.000926971435546875, 0.0020227432250976562, 0.0049724578857421875, 0.007922172546386719, 0.01087188720703125, 0.013821601867675781, 0.016771316528320312, 0.019721031188964844, 0.022670745849609375, 0.025620460510253906, 0.028570175170898438, 0.03151988983154297, 0.0344696044921875, 0.03741931915283203, 0.04036903381347656, 0.043318748474121094, 0.046268463134765625, 0.049218177795410156, 0.05216789245605469, 0.05511760711669922, 0.05806732177734375, 0.06101703643798828, 0.06396675109863281, 0.06691646575927734, 0.06986618041992188, 0.0728158950805664, 0.07576560974121094, 0.07871532440185547, 0.0816650390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 12.0, 36.0, 101.0, 195.0, 330.0, 174.0, 83.0, 31.0, 15.0, 13.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016021728515625, -0.015438556671142578, -0.014855384826660156, -0.014272212982177734, -0.013689041137695312, -0.01310586929321289, -0.012522697448730469, -0.011939525604248047, -0.011356353759765625, -0.010773181915283203, -0.010190010070800781, -0.00960683822631836, -0.009023666381835938, -0.008440494537353516, -0.007857322692871094, -0.007274150848388672, -0.00669097900390625, -0.006107807159423828, -0.005524635314941406, -0.004941463470458984, -0.0043582916259765625, -0.0037751197814941406, -0.0031919479370117188, -0.002608776092529297, -0.002025604248046875, -0.0014424324035644531, -0.0008592605590820312, -0.0002760887145996094, 0.0003070831298828125, 0.0008902549743652344, 0.0014734268188476562, 0.002056598663330078, 0.0026397705078125, 0.003222942352294922, 0.0038061141967773438, 0.004389286041259766, 0.0049724578857421875, 0.005555629730224609, 0.006138801574707031, 0.006721973419189453, 0.007305145263671875, 0.007888317108154297, 0.008471488952636719, 0.00905466079711914, 0.009637832641601562, 0.010221004486083984, 0.010804176330566406, 0.011387348175048828, 0.01197052001953125, 0.012553691864013672, 0.013136863708496094, 0.013720035552978516, 0.014303207397460938, 0.01488637924194336, 0.015469551086425781, 0.016052722930908203, 0.016635894775390625, 0.017219066619873047, 0.01780223846435547, 0.01838541030883789, 0.018968582153320312, 0.019551753997802734, 0.020134925842285156, 0.020718097686767578, 0.02130126953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 4.0, 6.0, 7.0, 12.0, 12.0, 19.0, 16.0, 24.0, 38.0, 46.0, 73.0, 84.0, 116.0, 140.0, 167.0, 263.0, 393.0, 662.0, 1551.0, 5427.0, 34319.0, 512909.0, 452682.0, 31023.0, 5035.0, 1453.0, 620.0, 381.0, 251.0, 217.0, 140.0, 104.0, 93.0, 64.0, 46.0, 36.0, 25.0, 25.0, 17.0, 13.0, 11.0, 7.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443115234375, -0.04278230667114258, -0.041253089904785156, -0.039723873138427734, -0.03819465637207031, -0.03666543960571289, -0.03513622283935547, -0.03360700607299805, -0.032077789306640625, -0.030548572540283203, -0.02901935577392578, -0.02749013900756836, -0.025960922241210938, -0.024431705474853516, -0.022902488708496094, -0.021373271942138672, -0.01984405517578125, -0.018314838409423828, -0.016785621643066406, -0.015256404876708984, -0.013727188110351562, -0.01219797134399414, -0.010668754577636719, -0.009139537811279297, -0.007610321044921875, -0.006081104278564453, -0.004551887512207031, -0.0030226707458496094, -0.0014934539794921875, 3.5762786865234375e-05, 0.0015649795532226562, 0.003094196319580078, 0.0046234130859375, 0.006152629852294922, 0.007681846618652344, 0.009211063385009766, 0.010740280151367188, 0.01226949691772461, 0.013798713684082031, 0.015327930450439453, 0.016857147216796875, 0.018386363983154297, 0.01991558074951172, 0.02144479751586914, 0.022974014282226562, 0.024503231048583984, 0.026032447814941406, 0.027561664581298828, 0.02909088134765625, 0.030620098114013672, 0.032149314880371094, 0.033678531646728516, 0.03520774841308594, 0.03673696517944336, 0.03826618194580078, 0.0397953987121582, 0.041324615478515625, 0.04285383224487305, 0.04438304901123047, 0.04591226577758789, 0.04744148254394531, 0.048970699310302734, 0.050499916076660156, 0.05202913284301758, 0.053558349609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 9.0, 20.0, 13.0, 18.0, 24.0, 21.0, 23.0, 34.0, 33.0, 43.0, 37.0, 45.0, 50.0, 63.0, 68.0, 49.0, 68.0, 52.0, 49.0, 37.0, 31.0, 31.0, 25.0, 32.0, 23.0, 10.0, 16.0, 11.0, 15.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015838623046875, -0.015334367752075195, -0.01483011245727539, -0.014325857162475586, -0.013821601867675781, -0.013317346572875977, -0.012813091278076172, -0.012308835983276367, -0.011804580688476562, -0.011300325393676758, -0.010796070098876953, -0.010291814804077148, -0.009787559509277344, -0.009283304214477539, -0.008779048919677734, -0.00827479362487793, -0.007770538330078125, -0.00726628303527832, -0.006762027740478516, -0.006257772445678711, -0.005753517150878906, -0.0052492618560791016, -0.004745006561279297, -0.004240751266479492, -0.0037364959716796875, -0.003232240676879883, -0.002727985382080078, -0.0022237300872802734, -0.0017194747924804688, -0.001215219497680664, -0.0007109642028808594, -0.0002067089080810547, 0.00029754638671875, 0.0008018016815185547, 0.0013060569763183594, 0.001810312271118164, 0.0023145675659179688, 0.0028188228607177734, 0.003323078155517578, 0.003827333450317383, 0.0043315887451171875, 0.004835844039916992, 0.005340099334716797, 0.0058443546295166016, 0.006348609924316406, 0.006852865219116211, 0.007357120513916016, 0.00786137580871582, 0.008365631103515625, 0.00886988639831543, 0.009374141693115234, 0.009878396987915039, 0.010382652282714844, 0.010886907577514648, 0.011391162872314453, 0.011895418167114258, 0.012399673461914062, 0.012903928756713867, 0.013408184051513672, 0.013912439346313477, 0.014416694641113281, 0.014920949935913086, 0.01542520523071289, 0.015929460525512695, 0.0164337158203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 17.0, 17.0, 22.0, 43.0, 58.0, 111.0, 178.0, 379.0, 850.0, 2795.0, 14112.0, 218573.0, 777519.0, 27291.0, 4353.0, 1204.0, 427.0, 209.0, 116.0, 73.0, 54.0, 41.0, 21.0, 15.0, 11.0, 8.0, 7.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03778076171875, -0.03656816482543945, -0.035355567932128906, -0.03414297103881836, -0.03293037414550781, -0.031717777252197266, -0.03050518035888672, -0.029292583465576172, -0.028079986572265625, -0.026867389678955078, -0.02565479278564453, -0.024442195892333984, -0.023229598999023438, -0.02201700210571289, -0.020804405212402344, -0.019591808319091797, -0.01837921142578125, -0.017166614532470703, -0.015954017639160156, -0.01474142074584961, -0.013528823852539062, -0.012316226959228516, -0.011103630065917969, -0.009891033172607422, -0.008678436279296875, -0.007465839385986328, -0.006253242492675781, -0.005040645599365234, -0.0038280487060546875, -0.0026154518127441406, -0.0014028549194335938, -0.00019025802612304688, 0.0010223388671875, 0.002234935760498047, 0.0034475326538085938, 0.004660129547119141, 0.0058727264404296875, 0.007085323333740234, 0.008297920227050781, 0.009510517120361328, 0.010723114013671875, 0.011935710906982422, 0.013148307800292969, 0.014360904693603516, 0.015573501586914062, 0.01678609848022461, 0.017998695373535156, 0.019211292266845703, 0.02042388916015625, 0.021636486053466797, 0.022849082946777344, 0.02406167984008789, 0.025274276733398438, 0.026486873626708984, 0.02769947052001953, 0.028912067413330078, 0.030124664306640625, 0.03133726119995117, 0.03254985809326172, 0.033762454986572266, 0.03497505187988281, 0.03618764877319336, 0.037400245666503906, 0.03861284255981445, 0.039825439453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 9.0, 5.0, 11.0, 17.0, 23.0, 32.0, 49.0, 80.0, 108.0, 146.0, 140.0, 99.0, 61.0, 49.0, 44.0, 21.0, 22.0, 7.0, 8.0, 11.0, 11.0, 3.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.565187454223633e-05, -8.17691907286644e-05, -7.788650691509247e-05, -7.400382310152054e-05, -7.012113928794861e-05, -6.623845547437668e-05, -6.235577166080475e-05, -5.847308784723282e-05, -5.459040403366089e-05, -5.070772022008896e-05, -4.682503640651703e-05, -4.29423525929451e-05, -3.905966877937317e-05, -3.517698496580124e-05, -3.129430115222931e-05, -2.741161733865738e-05, -2.352893352508545e-05, -1.964624971151352e-05, -1.576356589794159e-05, -1.188088208436966e-05, -7.99819827079773e-06, -4.1155144572257996e-06, -2.3283064365386963e-07, 3.6498531699180603e-06, 7.53253698348999e-06, 1.141522079706192e-05, 1.529790461063385e-05, 1.918058842420578e-05, 2.306327223777771e-05, 2.694595605134964e-05, 3.082863986492157e-05, 3.47113236784935e-05, 3.859400749206543e-05, 4.247669130563736e-05, 4.635937511920929e-05, 5.024205893278122e-05, 5.412474274635315e-05, 5.800742655992508e-05, 6.189011037349701e-05, 6.577279418706894e-05, 6.965547800064087e-05, 7.35381618142128e-05, 7.742084562778473e-05, 8.130352944135666e-05, 8.518621325492859e-05, 8.906889706850052e-05, 9.295158088207245e-05, 9.683426469564438e-05, 0.00010071694850921631, 0.00010459963232278824, 0.00010848231613636017, 0.0001123649999499321, 0.00011624768376350403, 0.00012013036757707596, 0.0001240130513906479, 0.00012789573520421982, 0.00013177841901779175, 0.00013566110283136368, 0.0001395437866449356, 0.00014342647045850754, 0.00014730915427207947, 0.0001511918380856514, 0.00015507452189922333, 0.00015895720571279526, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 6.0, 5.0, 5.0, 6.0, 9.0, 13.0, 25.0, 29.0, 44.0, 66.0, 98.0, 190.0, 318.0, 732.0, 3193.0, 31776.0, 939788.0, 65757.0, 4624.0, 955.0, 335.0, 201.0, 117.0, 78.0, 54.0, 35.0, 30.0, 19.0, 21.0, 11.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.03274679183959961, -0.03171062469482422, -0.030674457550048828, -0.029638290405273438, -0.028602123260498047, -0.027565956115722656, -0.026529788970947266, -0.025493621826171875, -0.024457454681396484, -0.023421287536621094, -0.022385120391845703, -0.021348953247070312, -0.020312786102294922, -0.01927661895751953, -0.01824045181274414, -0.01720428466796875, -0.01616811752319336, -0.015131950378417969, -0.014095783233642578, -0.013059616088867188, -0.012023448944091797, -0.010987281799316406, -0.009951114654541016, -0.008914947509765625, -0.007878780364990234, -0.006842613220214844, -0.005806446075439453, -0.0047702789306640625, -0.003734111785888672, -0.0026979446411132812, -0.0016617774963378906, -0.0006256103515625, 0.0004105567932128906, 0.0014467239379882812, 0.002482891082763672, 0.0035190582275390625, 0.004555225372314453, 0.005591392517089844, 0.006627559661865234, 0.007663726806640625, 0.008699893951416016, 0.009736061096191406, 0.010772228240966797, 0.011808395385742188, 0.012844562530517578, 0.013880729675292969, 0.01491689682006836, 0.01595306396484375, 0.01698923110961914, 0.01802539825439453, 0.019061565399169922, 0.020097732543945312, 0.021133899688720703, 0.022170066833496094, 0.023206233978271484, 0.024242401123046875, 0.025278568267822266, 0.026314735412597656, 0.027350902557373047, 0.028387069702148438, 0.029423236846923828, 0.03045940399169922, 0.03149557113647461, 0.03253173828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 8.0, 13.0, 9.0, 19.0, 35.0, 43.0, 45.0, 76.0, 94.0, 120.0, 141.0, 90.0, 66.0, 32.0, 31.0, 28.0, 16.0, 12.0, 11.0, 12.0, 11.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00778961181640625, -0.007553398609161377, -0.007317185401916504, -0.007080972194671631, -0.006844758987426758, -0.006608545780181885, -0.006372332572937012, -0.006136119365692139, -0.005899906158447266, -0.005663692951202393, -0.0054274797439575195, -0.0051912665367126465, -0.0049550533294677734, -0.0047188401222229, -0.004482626914978027, -0.004246413707733154, -0.004010200500488281, -0.003773987293243408, -0.003537774085998535, -0.003301560878753662, -0.003065347671508789, -0.002829134464263916, -0.002592921257019043, -0.00235670804977417, -0.002120494842529297, -0.0018842816352844238, -0.0016480684280395508, -0.0014118552207946777, -0.0011756420135498047, -0.0009394288063049316, -0.0007032155990600586, -0.00046700239181518555, -0.0002307891845703125, 5.424022674560547e-06, 0.0002416372299194336, 0.00047785043716430664, 0.0007140636444091797, 0.0009502768516540527, 0.0011864900588989258, 0.0014227032661437988, 0.0016589164733886719, 0.001895129680633545, 0.002131342887878418, 0.002367556095123291, 0.002603769302368164, 0.002839982509613037, 0.00307619571685791, 0.003312408924102783, 0.0035486221313476562, 0.0037848353385925293, 0.004021048545837402, 0.004257261753082275, 0.0044934749603271484, 0.0047296881675720215, 0.0049659013748168945, 0.005202114582061768, 0.005438327789306641, 0.005674540996551514, 0.005910754203796387, 0.00614696741104126, 0.006383180618286133, 0.006619393825531006, 0.006855607032775879, 0.007091820240020752, 0.007328033447265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 14.0, 167.0, 739.0, 80.0, 11.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8121696710586548, -0.7974826693534851, -0.7827956676483154, -0.768108606338501, -0.7534216046333313, -0.7387346029281616, -0.7240476012229919, -0.7093605995178223, -0.6946735382080078, -0.6799865365028381, -0.6652995347976685, -0.650612473487854, -0.6359254717826843, -0.6212384700775146, -0.606551468372345, -0.5918644666671753, -0.5771774649620056, -0.5624904632568359, -0.5478034615516663, -0.5331164002418518, -0.5184293985366821, -0.5037423968315125, -0.4890553951263428, -0.4743683934211731, -0.45968136191368103, -0.44499436020851135, -0.4303073287010193, -0.4156203269958496, -0.40093332529067993, -0.38624629378318787, -0.3715592920780182, -0.3568722605705261, -0.34218522906303406, -0.3274982273578644, -0.3128111958503723, -0.29812419414520264, -0.28343719244003296, -0.2687501609325409, -0.2540631592273712, -0.23937614262104034, -0.22468912601470947, -0.2100021094083786, -0.19531509280204773, -0.18062809109687805, -0.16594107449054718, -0.1512540578842163, -0.13656705617904663, -0.12188003957271576, -0.10719302296638489, -0.09250600636005402, -0.07781899720430374, -0.06313198804855347, -0.048444971442222595, -0.033757954835891724, -0.01907094568014145, -0.004383936524391174, 0.010303080081939697, 0.02499009296298027, 0.039677105844020844, 0.05436411872506142, 0.06905113160610199, 0.08373814821243286, 0.09842515736818314, 0.11311216652393341, 0.12779918313026428]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 9.0, 20.0, 17.0, 27.0, 29.0, 43.0, 43.0, 63.0, 62.0, 63.0, 53.0, 56.0, 73.0, 58.0, 63.0, 58.0, 46.0, 39.0, 42.0, 27.0, 22.0, 24.0, 22.0, 12.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07898873090744019, -0.07669372111558914, -0.0743987038731575, -0.07210369408130646, -0.06980867683887482, -0.06751366704702377, -0.06521865725517273, -0.06292364001274109, -0.060628630220890045, -0.0583336167037487, -0.05603860318660736, -0.05374359339475632, -0.051448579877614975, -0.04915356636047363, -0.04685855656862259, -0.04456354305148125, -0.042268529534339905, -0.03997351601719856, -0.03767850250005722, -0.03538349270820618, -0.033088479191064835, -0.030793465673923492, -0.0284984540194273, -0.026203442364931107, -0.023908428847789764, -0.021613415330648422, -0.01931840367615223, -0.017023392021656036, -0.014728378504514694, -0.012433365918695927, -0.010138353332877159, -0.007843341678380966, -0.005548328161239624, -0.0032533155754208565, -0.0009583029896020889, 0.0013367095962166786, 0.003631722182035446, 0.005926734767854214, 0.008221747353672981, 0.010516759008169174, 0.012811772525310516, 0.015106785111129284, 0.01740179769694805, 0.019696809351444244, 0.021991822868585587, 0.02428683638572693, 0.02658184804022312, 0.028876859694719315, 0.031171873211860657, 0.033466886729002, 0.03576190024614334, 0.038056910037994385, 0.04035192355513573, 0.04264693707227707, 0.04494194686412811, 0.047236960381269455, 0.0495319738984108, 0.05182698741555214, 0.05412200093269348, 0.056417010724544525, 0.05871202424168587, 0.06100703775882721, 0.06330204755067825, 0.0655970573425293, 0.06789207458496094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 17.0, 36.0, 63.0, 187.0, 420.0, 1333.0, 5774.0, 836596.0, 3342253.0, 5120.0, 1349.0, 563.0, 272.0, 123.0, 72.0, 36.0, 17.0, 16.0, 6.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.052211761474609375, -0.05004119873046875, -0.047870635986328125, -0.0457000732421875, -0.043529510498046875, -0.04135894775390625, -0.039188385009765625, -0.037017822265625, -0.034847259521484375, -0.03267669677734375, -0.030506134033203125, -0.0283355712890625, -0.026165008544921875, -0.02399444580078125, -0.021823883056640625, -0.0196533203125, -0.017482757568359375, -0.01531219482421875, -0.013141632080078125, -0.0109710693359375, -0.008800506591796875, -0.00662994384765625, -0.004459381103515625, -0.002288818359375, -0.000118255615234375, 0.00205230712890625, 0.004222869873046875, 0.0063934326171875, 0.008563995361328125, 0.01073455810546875, 0.012905120849609375, 0.01507568359375, 0.017246246337890625, 0.01941680908203125, 0.021587371826171875, 0.0237579345703125, 0.025928497314453125, 0.02809906005859375, 0.030269622802734375, 0.032440185546875, 0.034610748291015625, 0.03678131103515625, 0.038951873779296875, 0.0411224365234375, 0.043292999267578125, 0.04546356201171875, 0.047634124755859375, 0.0498046875, 0.051975250244140625, 0.05414581298828125, 0.056316375732421875, 0.0584869384765625, 0.060657501220703125, 0.06282806396484375, 0.06499862670898438, 0.067169189453125, 0.06933975219726562, 0.07151031494140625, 0.07368087768554688, 0.0758514404296875, 0.07802200317382812, 0.08019256591796875, 0.08236312866210938, 0.08453369140625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 15.0, 38.0, 102.0, 178.0, 276.0, 203.0, 105.0, 40.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.014312744140625, -0.01377415657043457, -0.01323556900024414, -0.012696981430053711, -0.012158393859863281, -0.011619806289672852, -0.011081218719482422, -0.010542631149291992, -0.010004043579101562, -0.009465456008911133, -0.008926868438720703, -0.008388280868530273, -0.007849693298339844, -0.007311105728149414, -0.006772518157958984, -0.006233930587768555, -0.005695343017578125, -0.005156755447387695, -0.004618167877197266, -0.004079580307006836, -0.0035409927368164062, -0.0030024051666259766, -0.002463817596435547, -0.0019252300262451172, -0.0013866424560546875, -0.0008480548858642578, -0.0003094673156738281, 0.00022912025451660156, 0.0007677078247070312, 0.001306295394897461, 0.0018448829650878906, 0.0023834705352783203, 0.00292205810546875, 0.0034606456756591797, 0.003999233245849609, 0.004537820816040039, 0.005076408386230469, 0.0056149959564208984, 0.006153583526611328, 0.006692171096801758, 0.0072307586669921875, 0.007769346237182617, 0.008307933807373047, 0.008846521377563477, 0.009385108947753906, 0.009923696517944336, 0.010462284088134766, 0.011000871658325195, 0.011539459228515625, 0.012078046798706055, 0.012616634368896484, 0.013155221939086914, 0.013693809509277344, 0.014232397079467773, 0.014770984649658203, 0.015309572219848633, 0.015848159790039062, 0.016386747360229492, 0.016925334930419922, 0.01746392250061035, 0.01800251007080078, 0.01854109764099121, 0.01907968521118164, 0.01961827278137207, 0.0201568603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 13.0, 18.0, 30.0, 39.0, 73.0, 102.0, 173.0, 357.0, 578.0, 1280.0, 3354.0, 14962.0, 273142.0, 3718948.0, 163896.0, 11783.0, 3008.0, 1184.0, 550.0, 312.0, 152.0, 97.0, 68.0, 50.0, 18.0, 21.0, 14.0, 13.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.032989501953125, -0.0320584774017334, -0.031127452850341797, -0.030196428298950195, -0.029265403747558594, -0.028334379196166992, -0.02740335464477539, -0.02647233009338379, -0.025541305541992188, -0.024610280990600586, -0.023679256439208984, -0.022748231887817383, -0.02181720733642578, -0.02088618278503418, -0.019955158233642578, -0.019024133682250977, -0.018093109130859375, -0.017162084579467773, -0.016231060028076172, -0.01530003547668457, -0.014369010925292969, -0.013437986373901367, -0.012506961822509766, -0.011575937271118164, -0.010644912719726562, -0.009713888168334961, -0.00878286361694336, -0.007851839065551758, -0.006920814514160156, -0.005989789962768555, -0.005058765411376953, -0.0041277408599853516, -0.00319671630859375, -0.0022656917572021484, -0.0013346672058105469, -0.0004036426544189453, 0.0005273818969726562, 0.0014584064483642578, 0.0023894309997558594, 0.003320455551147461, 0.0042514801025390625, 0.005182504653930664, 0.006113529205322266, 0.007044553756713867, 0.007975578308105469, 0.00890660285949707, 0.009837627410888672, 0.010768651962280273, 0.011699676513671875, 0.012630701065063477, 0.013561725616455078, 0.01449275016784668, 0.015423774719238281, 0.016354799270629883, 0.017285823822021484, 0.018216848373413086, 0.019147872924804688, 0.02007889747619629, 0.02100992202758789, 0.021940946578979492, 0.022871971130371094, 0.023802995681762695, 0.024734020233154297, 0.0256650447845459, 0.0265960693359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 17.0, 25.0, 25.0, 36.0, 72.0, 89.0, 145.0, 188.0, 285.0, 400.0, 578.0, 592.0, 508.0, 323.0, 253.0, 164.0, 111.0, 86.0, 55.0, 33.0, 21.0, 12.0, 9.0, 10.0, 10.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01085662841796875, -0.010440707206726074, -0.010024785995483398, -0.009608864784240723, -0.009192943572998047, -0.008777022361755371, -0.008361101150512695, -0.00794517993927002, -0.007529258728027344, -0.007113337516784668, -0.006697416305541992, -0.006281495094299316, -0.005865573883056641, -0.005449652671813965, -0.005033731460571289, -0.004617810249328613, -0.0042018890380859375, -0.0037859678268432617, -0.003370046615600586, -0.00295412540435791, -0.0025382041931152344, -0.0021222829818725586, -0.0017063617706298828, -0.001290440559387207, -0.0008745193481445312, -0.00045859813690185547, -4.267692565917969e-05, 0.0003732442855834961, 0.0007891654968261719, 0.0012050867080688477, 0.0016210079193115234, 0.0020369291305541992, 0.002452850341796875, 0.0028687715530395508, 0.0032846927642822266, 0.0037006139755249023, 0.004116535186767578, 0.004532456398010254, 0.00494837760925293, 0.0053642988204956055, 0.005780220031738281, 0.006196141242980957, 0.006612062454223633, 0.007027983665466309, 0.007443904876708984, 0.00785982608795166, 0.008275747299194336, 0.008691668510437012, 0.009107589721679688, 0.009523510932922363, 0.009939432144165039, 0.010355353355407715, 0.01077127456665039, 0.011187195777893066, 0.011603116989135742, 0.012019038200378418, 0.012434959411621094, 0.01285088062286377, 0.013266801834106445, 0.013682723045349121, 0.014098644256591797, 0.014514565467834473, 0.014930486679077148, 0.015346407890319824, 0.0157623291015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 13.0, 71.0, 535.0, 329.0, 45.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3723847568035126, -0.3638807535171509, -0.3553767800331116, -0.3468727767467499, -0.3383687734603882, -0.3298647999763489, -0.3213607966899872, -0.3128568232059479, -0.3043528199195862, -0.2958488166332245, -0.2873448431491852, -0.2788408398628235, -0.2703368663787842, -0.2618328630924225, -0.2533288598060608, -0.2448248714208603, -0.2363208830356598, -0.2278168946504593, -0.2193129062652588, -0.2108089029788971, -0.2023049145936966, -0.1938009262084961, -0.1852969229221344, -0.1767929345369339, -0.1682889461517334, -0.1597849577665329, -0.1512809693813324, -0.1427769660949707, -0.1342729777097702, -0.1257689893245697, -0.1172649934887886, -0.10876099765300751, -0.100257009267807, -0.0917530208826065, -0.08324902504682541, -0.07474502921104431, -0.06624104082584381, -0.05773704871535301, -0.04923305660486221, -0.040729064494371414, -0.032225072383880615, -0.023721080273389816, -0.015217088162899017, -0.006713096052408218, 0.0017908960580825806, 0.01029488816857338, 0.01879888027906418, 0.027302872389554977, 0.035806864500045776, 0.044310856610536575, 0.052814848721027374, 0.06131884083151817, 0.06982283294200897, 0.07832682132720947, 0.08683081716299057, 0.09533481299877167, 0.10383880138397217, 0.11234278976917267, 0.12084678560495377, 0.12935078144073486, 0.13785476982593536, 0.14635875821113586, 0.15486276149749756, 0.16336674988269806, 0.17187073826789856]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 9.0, 10.0, 12.0, 13.0, 10.0, 11.0, 34.0, 32.0, 34.0, 32.0, 41.0, 42.0, 46.0, 50.0, 48.0, 55.0, 66.0, 67.0, 39.0, 52.0, 42.0, 47.0, 25.0, 46.0, 31.0, 31.0, 12.0, 17.0, 13.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.06207382678985596, -0.06053691357374191, -0.05900000035762787, -0.057463087141513824, -0.05592617392539978, -0.054389260709285736, -0.05285234749317169, -0.05131543427705765, -0.049778521060943604, -0.04824160784482956, -0.046704694628715515, -0.04516778141260147, -0.04363086819648743, -0.04209395498037338, -0.04055704176425934, -0.039020128548145294, -0.03748321533203125, -0.035946302115917206, -0.03440938889980316, -0.03287247568368912, -0.03133556246757507, -0.02979864925146103, -0.028261736035346985, -0.02672482281923294, -0.025187909603118896, -0.023650996387004852, -0.022114083170890808, -0.020577169954776764, -0.01904025673866272, -0.017503343522548676, -0.01596643030643463, -0.014429517090320587, -0.012892603874206543, -0.011355690658092499, -0.009818777441978455, -0.00828186422586441, -0.006744951009750366, -0.005208037793636322, -0.003671124577522278, -0.0021342113614082336, -0.0005972981452941895, 0.0009396150708198547, 0.002476528286933899, 0.004013441503047943, 0.005550354719161987, 0.0070872679352760315, 0.008624181151390076, 0.01016109436750412, 0.011698007583618164, 0.013234920799732208, 0.014771834015846252, 0.016308747231960297, 0.01784566044807434, 0.019382573664188385, 0.02091948688030243, 0.022456400096416473, 0.023993313312530518, 0.025530226528644562, 0.027067139744758606, 0.02860405296087265, 0.030140966176986694, 0.03167787939310074, 0.03321479260921478, 0.03475170582532883, 0.03628861904144287]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 13.0, 24.0, 27.0, 42.0, 65.0, 69.0, 119.0, 142.0, 222.0, 364.0, 526.0, 1193.0, 6628.0, 277509.0, 745366.0, 12709.0, 1659.0, 645.0, 405.0, 240.0, 153.0, 109.0, 69.0, 69.0, 41.0, 24.0, 24.0, 18.0, 16.0, 10.0, 5.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0806884765625, -0.07845449447631836, -0.07622051239013672, -0.07398653030395508, -0.07175254821777344, -0.0695185661315918, -0.06728458404541016, -0.06505060195922852, -0.06281661987304688, -0.060582637786865234, -0.058348655700683594, -0.05611467361450195, -0.05388069152832031, -0.05164670944213867, -0.04941272735595703, -0.04717874526977539, -0.04494476318359375, -0.04271078109741211, -0.04047679901123047, -0.03824281692504883, -0.03600883483886719, -0.03377485275268555, -0.031540870666503906, -0.029306888580322266, -0.027072906494140625, -0.024838924407958984, -0.022604942321777344, -0.020370960235595703, -0.018136978149414062, -0.015902996063232422, -0.013669013977050781, -0.01143503189086914, -0.0092010498046875, -0.006967067718505859, -0.004733085632324219, -0.002499103546142578, -0.0002651214599609375, 0.001968860626220703, 0.004202842712402344, 0.006436824798583984, 0.008670806884765625, 0.010904788970947266, 0.013138771057128906, 0.015372753143310547, 0.017606735229492188, 0.019840717315673828, 0.02207469940185547, 0.02430868148803711, 0.02654266357421875, 0.02877664566040039, 0.03101062774658203, 0.03324460983276367, 0.03547859191894531, 0.03771257400512695, 0.039946556091308594, 0.042180538177490234, 0.044414520263671875, 0.046648502349853516, 0.048882484436035156, 0.0511164665222168, 0.05335044860839844, 0.05558443069458008, 0.05781841278076172, 0.06005239486694336, 0.062286376953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 17.0, 37.0, 106.0, 186.0, 273.0, 208.0, 95.0, 47.0, 20.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01412200927734375, -0.013590693473815918, -0.013059377670288086, -0.012528061866760254, -0.011996746063232422, -0.01146543025970459, -0.010934114456176758, -0.010402798652648926, -0.009871482849121094, -0.009340167045593262, -0.00880885124206543, -0.008277535438537598, -0.007746219635009766, -0.007214903831481934, -0.0066835880279541016, -0.0061522722244262695, -0.0056209564208984375, -0.0050896406173706055, -0.0045583248138427734, -0.004027009010314941, -0.0034956932067871094, -0.0029643774032592773, -0.0024330615997314453, -0.0019017457962036133, -0.0013704299926757812, -0.0008391141891479492, -0.0003077983856201172, 0.00022351741790771484, 0.0007548332214355469, 0.001286149024963379, 0.001817464828491211, 0.002348780632019043, 0.002880096435546875, 0.003411412239074707, 0.003942728042602539, 0.004474043846130371, 0.005005359649658203, 0.005536675453186035, 0.006067991256713867, 0.006599307060241699, 0.007130622863769531, 0.007661938667297363, 0.008193254470825195, 0.008724570274353027, 0.00925588607788086, 0.009787201881408691, 0.010318517684936523, 0.010849833488464355, 0.011381149291992188, 0.01191246509552002, 0.012443780899047852, 0.012975096702575684, 0.013506412506103516, 0.014037728309631348, 0.01456904411315918, 0.015100359916687012, 0.015631675720214844, 0.016162991523742676, 0.016694307327270508, 0.01722562313079834, 0.017756938934326172, 0.018288254737854004, 0.018819570541381836, 0.019350886344909668, 0.0198822021484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 11.0, 14.0, 27.0, 35.0, 53.0, 77.0, 94.0, 152.0, 199.0, 351.0, 664.0, 1375.0, 5066.0, 37235.0, 546443.0, 420638.0, 28758.0, 4332.0, 1325.0, 640.0, 364.0, 218.0, 140.0, 96.0, 52.0, 49.0, 31.0, 24.0, 12.0, 24.0, 16.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.040737152099609375, -0.03932952880859375, -0.037921905517578125, -0.0365142822265625, -0.035106658935546875, -0.03369903564453125, -0.032291412353515625, -0.0308837890625, -0.029476165771484375, -0.02806854248046875, -0.026660919189453125, -0.0252532958984375, -0.023845672607421875, -0.02243804931640625, -0.021030426025390625, -0.019622802734375, -0.018215179443359375, -0.01680755615234375, -0.015399932861328125, -0.0139923095703125, -0.012584686279296875, -0.01117706298828125, -0.009769439697265625, -0.00836181640625, -0.006954193115234375, -0.00554656982421875, -0.004138946533203125, -0.0027313232421875, -0.001323699951171875, 8.392333984375e-05, 0.001491546630859375, 0.002899169921875, 0.004306793212890625, 0.00571441650390625, 0.007122039794921875, 0.0085296630859375, 0.009937286376953125, 0.01134490966796875, 0.012752532958984375, 0.01416015625, 0.015567779541015625, 0.01697540283203125, 0.018383026123046875, 0.0197906494140625, 0.021198272705078125, 0.02260589599609375, 0.024013519287109375, 0.025421142578125, 0.026828765869140625, 0.02823638916015625, 0.029644012451171875, 0.0310516357421875, 0.032459259033203125, 0.03386688232421875, 0.035274505615234375, 0.03668212890625, 0.038089752197265625, 0.03949737548828125, 0.040904998779296875, 0.0423126220703125, 0.043720245361328125, 0.04512786865234375, 0.046535491943359375, 0.047943115234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 6.0, 11.0, 8.0, 10.0, 11.0, 19.0, 26.0, 27.0, 36.0, 45.0, 31.0, 37.0, 39.0, 46.0, 51.0, 46.0, 37.0, 57.0, 54.0, 44.0, 35.0, 41.0, 31.0, 35.0, 26.0, 27.0, 29.0, 15.0, 17.0, 18.0, 14.0, 7.0, 7.0, 6.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01513671875, -0.014740467071533203, -0.014344215393066406, -0.01394796371459961, -0.013551712036132812, -0.013155460357666016, -0.012759208679199219, -0.012362957000732422, -0.011966705322265625, -0.011570453643798828, -0.011174201965332031, -0.010777950286865234, -0.010381698608398438, -0.00998544692993164, -0.009589195251464844, -0.009192943572998047, -0.00879669189453125, -0.008400440216064453, -0.008004188537597656, -0.007607936859130859, -0.0072116851806640625, -0.006815433502197266, -0.006419181823730469, -0.006022930145263672, -0.005626678466796875, -0.005230426788330078, -0.004834175109863281, -0.004437923431396484, -0.0040416717529296875, -0.0036454200744628906, -0.0032491683959960938, -0.002852916717529297, -0.0024566650390625, -0.002060413360595703, -0.0016641616821289062, -0.0012679100036621094, -0.0008716583251953125, -0.0004754066467285156, -7.915496826171875e-05, 0.0003170967102050781, 0.000713348388671875, 0.0011096000671386719, 0.0015058517456054688, 0.0019021034240722656, 0.0022983551025390625, 0.0026946067810058594, 0.0030908584594726562, 0.003487110137939453, 0.00388336181640625, 0.004279613494873047, 0.004675865173339844, 0.005072116851806641, 0.0054683685302734375, 0.005864620208740234, 0.006260871887207031, 0.006657123565673828, 0.007053375244140625, 0.007449626922607422, 0.007845878601074219, 0.008242130279541016, 0.008638381958007812, 0.00903463363647461, 0.009430885314941406, 0.009827136993408203, 0.010223388671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 13.0, 11.0, 10.0, 26.0, 33.0, 59.0, 96.0, 242.0, 490.0, 1236.0, 3760.0, 16142.0, 260879.0, 730455.0, 26951.0, 5345.0, 1583.0, 642.0, 244.0, 155.0, 59.0, 32.0, 27.0, 18.0, 8.0, 6.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.039337158203125, -0.03835701942443848, -0.03737688064575195, -0.03639674186706543, -0.035416603088378906, -0.03443646430969238, -0.03345632553100586, -0.032476186752319336, -0.03149604797363281, -0.03051590919494629, -0.029535770416259766, -0.028555631637573242, -0.02757549285888672, -0.026595354080200195, -0.025615215301513672, -0.02463507652282715, -0.023654937744140625, -0.0226747989654541, -0.021694660186767578, -0.020714521408081055, -0.01973438262939453, -0.018754243850708008, -0.017774105072021484, -0.01679396629333496, -0.015813827514648438, -0.014833688735961914, -0.01385354995727539, -0.012873411178588867, -0.011893272399902344, -0.01091313362121582, -0.009932994842529297, -0.008952856063842773, -0.00797271728515625, -0.0069925785064697266, -0.006012439727783203, -0.00503230094909668, -0.004052162170410156, -0.003072023391723633, -0.0020918846130371094, -0.001111745834350586, -0.0001316070556640625, 0.0008485317230224609, 0.0018286705017089844, 0.002808809280395508, 0.0037889480590820312, 0.004769086837768555, 0.005749225616455078, 0.0067293643951416016, 0.007709503173828125, 0.008689641952514648, 0.009669780731201172, 0.010649919509887695, 0.011630058288574219, 0.012610197067260742, 0.013590335845947266, 0.014570474624633789, 0.015550613403320312, 0.016530752182006836, 0.01751089096069336, 0.018491029739379883, 0.019471168518066406, 0.02045130729675293, 0.021431446075439453, 0.022411584854125977, 0.0233917236328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 1.0, 7.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 20.0, 18.0, 29.0, 28.0, 30.0, 45.0, 57.0, 46.0, 70.0, 80.0, 84.0, 57.0, 64.0, 42.0, 44.0, 36.0, 34.0, 34.0, 19.0, 15.0, 20.0, 15.0, 11.0, 5.0, 2.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-8.040666580200195e-05, -7.82972201704979e-05, -7.618777453899384e-05, -7.407832890748978e-05, -7.196888327598572e-05, -6.985943764448166e-05, -6.77499920129776e-05, -6.564054638147354e-05, -6.353110074996948e-05, -6.142165511846542e-05, -5.9312209486961365e-05, -5.7202763855457306e-05, -5.509331822395325e-05, -5.298387259244919e-05, -5.087442696094513e-05, -4.876498132944107e-05, -4.665553569793701e-05, -4.454609006643295e-05, -4.2436644434928894e-05, -4.0327198803424835e-05, -3.8217753171920776e-05, -3.610830754041672e-05, -3.399886190891266e-05, -3.18894162774086e-05, -2.977997064590454e-05, -2.7670525014400482e-05, -2.5561079382896423e-05, -2.3451633751392365e-05, -2.1342188119888306e-05, -1.9232742488384247e-05, -1.7123296856880188e-05, -1.5013851225376129e-05, -1.290440559387207e-05, -1.0794959962368011e-05, -8.685514330863953e-06, -6.576068699359894e-06, -4.466623067855835e-06, -2.357177436351776e-06, -2.477318048477173e-07, 1.8617138266563416e-06, 3.9711594581604e-06, 6.080605089664459e-06, 8.190050721168518e-06, 1.0299496352672577e-05, 1.2408941984176636e-05, 1.4518387615680695e-05, 1.6627833247184753e-05, 1.8737278878688812e-05, 2.084672451019287e-05, 2.295617014169693e-05, 2.506561577320099e-05, 2.7175061404705048e-05, 2.9284507036209106e-05, 3.1393952667713165e-05, 3.3503398299217224e-05, 3.561284393072128e-05, 3.772228956222534e-05, 3.98317351937294e-05, 4.194118082523346e-05, 4.405062645673752e-05, 4.616007208824158e-05, 4.8269517719745636e-05, 5.0378963351249695e-05, 5.2488408982753754e-05, 5.459785461425781e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 5.0, 9.0, 12.0, 10.0, 19.0, 18.0, 20.0, 21.0, 36.0, 61.0, 96.0, 143.0, 233.0, 474.0, 1418.0, 6795.0, 74150.0, 927509.0, 31772.0, 3879.0, 956.0, 355.0, 172.0, 106.0, 72.0, 53.0, 32.0, 27.0, 24.0, 15.0, 12.0, 5.0, 10.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034576416015625, -0.03354024887084961, -0.03250408172607422, -0.03146791458129883, -0.030431747436523438, -0.029395580291748047, -0.028359413146972656, -0.027323246002197266, -0.026287078857421875, -0.025250911712646484, -0.024214744567871094, -0.023178577423095703, -0.022142410278320312, -0.021106243133544922, -0.02007007598876953, -0.01903390884399414, -0.01799774169921875, -0.01696157455444336, -0.01592540740966797, -0.014889240264892578, -0.013853073120117188, -0.012816905975341797, -0.011780738830566406, -0.010744571685791016, -0.009708404541015625, -0.008672237396240234, -0.007636070251464844, -0.006599903106689453, -0.0055637359619140625, -0.004527568817138672, -0.0034914016723632812, -0.0024552345275878906, -0.0014190673828125, -0.0003829002380371094, 0.0006532669067382812, 0.0016894340515136719, 0.0027256011962890625, 0.003761768341064453, 0.004797935485839844, 0.005834102630615234, 0.006870269775390625, 0.007906436920166016, 0.008942604064941406, 0.009978771209716797, 0.011014938354492188, 0.012051105499267578, 0.013087272644042969, 0.01412343978881836, 0.01515960693359375, 0.01619577407836914, 0.01723194122314453, 0.018268108367919922, 0.019304275512695312, 0.020340442657470703, 0.021376609802246094, 0.022412776947021484, 0.023448944091796875, 0.024485111236572266, 0.025521278381347656, 0.026557445526123047, 0.027593612670898438, 0.028629779815673828, 0.02966594696044922, 0.03070211410522461, 0.03173828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 8.0, 3.0, 7.0, 6.0, 7.0, 10.0, 12.0, 10.0, 26.0, 40.0, 69.0, 97.0, 128.0, 148.0, 125.0, 81.0, 52.0, 44.0, 20.0, 20.0, 12.0, 14.0, 10.0, 7.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007503509521484375, -0.007229030132293701, -0.006954550743103027, -0.0066800713539123535, -0.00640559196472168, -0.006131112575531006, -0.005856633186340332, -0.005582153797149658, -0.005307674407958984, -0.0050331950187683105, -0.004758715629577637, -0.004484236240386963, -0.004209756851196289, -0.003935277462005615, -0.0036607980728149414, -0.0033863186836242676, -0.0031118392944335938, -0.00283735990524292, -0.002562880516052246, -0.0022884011268615723, -0.0020139217376708984, -0.0017394423484802246, -0.0014649629592895508, -0.001190483570098877, -0.0009160041809082031, -0.0006415247917175293, -0.00036704540252685547, -9.256601333618164e-05, 0.0001819133758544922, 0.000456392765045166, 0.0007308721542358398, 0.0010053515434265137, 0.0012798309326171875, 0.0015543103218078613, 0.0018287897109985352, 0.002103269100189209, 0.002377748489379883, 0.0026522278785705566, 0.0029267072677612305, 0.0032011866569519043, 0.003475666046142578, 0.003750145435333252, 0.004024624824523926, 0.0042991042137146, 0.0045735836029052734, 0.004848062992095947, 0.005122542381286621, 0.005397021770477295, 0.005671501159667969, 0.005945980548858643, 0.006220459938049316, 0.00649493932723999, 0.006769418716430664, 0.007043898105621338, 0.007318377494812012, 0.0075928568840026855, 0.00786733627319336, 0.008141815662384033, 0.008416295051574707, 0.00869077444076538, 0.008965253829956055, 0.009239733219146729, 0.009514212608337402, 0.009788691997528076, 0.01006317138671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 37.0, 97.0, 251.0, 250.0, 172.0, 95.0, 43.0, 18.0, 16.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1545153558254242, -0.15064574778079987, -0.14677613973617554, -0.1429065465927124, -0.13903693854808807, -0.13516733050346375, -0.13129772245883942, -0.1274281144142151, -0.12355852127075195, -0.11968891322612762, -0.11581931263208389, -0.11194970458745956, -0.10808010399341583, -0.1042104959487915, -0.10034088790416718, -0.09647128731012344, -0.09260167926549911, -0.08873207122087479, -0.08486247062683105, -0.08099286258220673, -0.077123261988163, -0.07325365394353867, -0.06938405334949493, -0.0655144453048706, -0.061644840985536575, -0.057775236666202545, -0.053905632346868515, -0.050036028027534485, -0.046166419982910156, -0.042296819388866425, -0.038427211344242096, -0.034557607024908066, -0.030688010156154633, -0.026818405836820602, -0.022948801517486572, -0.019079195335507393, -0.015209591016173363, -0.011339986696839333, -0.007470380514860153, -0.003600776195526123, 0.0002688281238079071, 0.0041384329088032246, 0.008008037693798542, 0.011877642944455147, 0.015747247263789177, 0.019616851583123207, 0.023486457765102386, 0.027356062084436417, 0.031225666403770447, 0.03509527072310448, 0.03896487504243851, 0.042834483087062836, 0.04670408368110657, 0.050573691725730896, 0.054443296045064926, 0.058312900364398956, 0.062182504683732986, 0.06605210900306702, 0.06992171704769135, 0.07379131764173508, 0.0776609256863594, 0.08153052628040314, 0.08540013432502747, 0.0892697423696518, 0.09313934296369553]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 15.0, 18.0, 27.0, 28.0, 40.0, 65.0, 57.0, 64.0, 92.0, 71.0, 70.0, 77.0, 61.0, 72.0, 57.0, 48.0, 36.0, 28.0, 16.0, 17.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.087941013276577, -0.08554999530315399, -0.08315898478031158, -0.08076796680688858, -0.07837694883346558, -0.07598593831062317, -0.07359492033720016, -0.07120390236377716, -0.06881288439035416, -0.06642186641693115, -0.06403085589408875, -0.06163983792066574, -0.05924881994724274, -0.05685780569911003, -0.054466791450977325, -0.05207577347755432, -0.04968475550413132, -0.04729374125599861, -0.044902727007865906, -0.0425117090344429, -0.0401206910610199, -0.03772967681288719, -0.035338662564754486, -0.03294764459133148, -0.030556628480553627, -0.028165612369775772, -0.025774596258997917, -0.023383580148220062, -0.020992564037442207, -0.018601547926664352, -0.016210531815886497, -0.013819515705108643, -0.011428499594330788, -0.009037483483552933, -0.006646467372775078, -0.004255451261997223, -0.001864435151219368, 0.0005265809595584869, 0.002917597070336342, 0.005308613181114197, 0.007699629291892052, 0.010090645402669907, 0.012481661513447762, 0.014872677624225616, 0.01726369373500347, 0.019654709845781326, 0.02204572595655918, 0.024436742067337036, 0.02682775817811489, 0.029218774288892746, 0.03160978853702545, 0.034000806510448456, 0.03639182448387146, 0.038782838732004166, 0.04117385298013687, 0.043564870953559875, 0.04595588892698288, 0.048346903175115585, 0.05073791742324829, 0.053128935396671295, 0.0555199533700943, 0.057910967618227005, 0.06030198186635971, 0.06269299983978271]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 14.0, 7.0, 12.0, 21.0, 62.0, 74.0, 142.0, 271.0, 461.0, 993.0, 2541.0, 8302.0, 461607.0, 3698512.0, 16264.0, 2544.0, 975.0, 571.0, 330.0, 217.0, 129.0, 80.0, 51.0, 32.0, 19.0, 13.0, 10.0, 13.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.03617429733276367, -0.034934043884277344, -0.033693790435791016, -0.03245353698730469, -0.03121328353881836, -0.02997303009033203, -0.028732776641845703, -0.027492523193359375, -0.026252269744873047, -0.02501201629638672, -0.02377176284790039, -0.022531509399414062, -0.021291255950927734, -0.020051002502441406, -0.018810749053955078, -0.01757049560546875, -0.016330242156982422, -0.015089988708496094, -0.013849735260009766, -0.012609481811523438, -0.01136922836303711, -0.010128974914550781, -0.008888721466064453, -0.007648468017578125, -0.006408214569091797, -0.005167961120605469, -0.003927707672119141, -0.0026874542236328125, -0.0014472007751464844, -0.00020694732666015625, 0.0010333061218261719, 0.0022735595703125, 0.003513813018798828, 0.004754066467285156, 0.005994319915771484, 0.0072345733642578125, 0.00847482681274414, 0.009715080261230469, 0.010955333709716797, 0.012195587158203125, 0.013435840606689453, 0.014676094055175781, 0.01591634750366211, 0.017156600952148438, 0.018396854400634766, 0.019637107849121094, 0.020877361297607422, 0.02211761474609375, 0.023357868194580078, 0.024598121643066406, 0.025838375091552734, 0.027078628540039062, 0.02831888198852539, 0.02955913543701172, 0.030799388885498047, 0.032039642333984375, 0.0332798957824707, 0.03452014923095703, 0.03576040267944336, 0.03700065612792969, 0.038240909576416016, 0.039481163024902344, 0.04072141647338867, 0.041961669921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 13.0, 44.0, 105.0, 196.0, 247.0, 207.0, 111.0, 40.0, 23.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01549530029296875, -0.01495349407196045, -0.014411687850952148, -0.013869881629943848, -0.013328075408935547, -0.012786269187927246, -0.012244462966918945, -0.011702656745910645, -0.011160850524902344, -0.010619044303894043, -0.010077238082885742, -0.009535431861877441, -0.00899362564086914, -0.00845181941986084, -0.007910013198852539, -0.007368206977844238, -0.0068264007568359375, -0.006284594535827637, -0.005742788314819336, -0.005200982093811035, -0.004659175872802734, -0.004117369651794434, -0.003575563430786133, -0.003033757209777832, -0.0024919509887695312, -0.0019501447677612305, -0.0014083385467529297, -0.0008665323257446289, -0.0003247261047363281, 0.00021708011627197266, 0.0007588863372802734, 0.0013006925582885742, 0.001842498779296875, 0.0023843050003051758, 0.0029261112213134766, 0.0034679174423217773, 0.004009723663330078, 0.004551529884338379, 0.00509333610534668, 0.0056351423263549805, 0.006176948547363281, 0.006718754768371582, 0.007260560989379883, 0.007802367210388184, 0.008344173431396484, 0.008885979652404785, 0.009427785873413086, 0.009969592094421387, 0.010511398315429688, 0.011053204536437988, 0.011595010757446289, 0.01213681697845459, 0.01267862319946289, 0.013220429420471191, 0.013762235641479492, 0.014304041862487793, 0.014845848083496094, 0.015387654304504395, 0.015929460525512695, 0.016471266746520996, 0.017013072967529297, 0.017554879188537598, 0.0180966854095459, 0.0186384916305542, 0.0191802978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 23.0, 20.0, 23.0, 37.0, 82.0, 137.0, 234.0, 470.0, 1080.0, 2765.0, 11995.0, 230289.0, 3790630.0, 142427.0, 9636.0, 2359.0, 919.0, 484.0, 244.0, 131.0, 82.0, 63.0, 48.0, 33.0, 24.0, 9.0, 10.0, 7.0, 0.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028007030487060547, -0.027022361755371094, -0.02603769302368164, -0.025053024291992188, -0.024068355560302734, -0.02308368682861328, -0.022099018096923828, -0.021114349365234375, -0.020129680633544922, -0.01914501190185547, -0.018160343170166016, -0.017175674438476562, -0.01619100570678711, -0.015206336975097656, -0.014221668243408203, -0.01323699951171875, -0.012252330780029297, -0.011267662048339844, -0.01028299331665039, -0.009298324584960938, -0.008313655853271484, -0.007328987121582031, -0.006344318389892578, -0.005359649658203125, -0.004374980926513672, -0.0033903121948242188, -0.0024056434631347656, -0.0014209747314453125, -0.0004363059997558594, 0.0005483627319335938, 0.0015330314636230469, 0.0025177001953125, 0.003502368927001953, 0.004487037658691406, 0.005471706390380859, 0.0064563751220703125, 0.007441043853759766, 0.008425712585449219, 0.009410381317138672, 0.010395050048828125, 0.011379718780517578, 0.012364387512207031, 0.013349056243896484, 0.014333724975585938, 0.01531839370727539, 0.016303062438964844, 0.017287731170654297, 0.01827239990234375, 0.019257068634033203, 0.020241737365722656, 0.02122640609741211, 0.022211074829101562, 0.023195743560791016, 0.02418041229248047, 0.025165081024169922, 0.026149749755859375, 0.027134418487548828, 0.02811908721923828, 0.029103755950927734, 0.030088424682617188, 0.03107309341430664, 0.032057762145996094, 0.03304243087768555, 0.034027099609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 12.0, 14.0, 24.0, 30.0, 35.0, 57.0, 81.0, 127.0, 176.0, 214.0, 288.0, 396.0, 441.0, 550.0, 385.0, 347.0, 313.0, 204.0, 108.0, 89.0, 62.0, 45.0, 21.0, 19.0, 12.0, 6.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0149688720703125, -0.014580845832824707, -0.014192819595336914, -0.013804793357849121, -0.013416767120361328, -0.013028740882873535, -0.012640714645385742, -0.01225268840789795, -0.011864662170410156, -0.011476635932922363, -0.01108860969543457, -0.010700583457946777, -0.010312557220458984, -0.009924530982971191, -0.009536504745483398, -0.009148478507995605, -0.008760452270507812, -0.00837242603302002, -0.007984399795532227, -0.007596373558044434, -0.007208347320556641, -0.006820321083068848, -0.006432294845581055, -0.006044268608093262, -0.005656242370605469, -0.005268216133117676, -0.004880189895629883, -0.00449216365814209, -0.004104137420654297, -0.003716111183166504, -0.003328084945678711, -0.002940058708190918, -0.002552032470703125, -0.002164006233215332, -0.001775979995727539, -0.001387953758239746, -0.0009999275207519531, -0.0006119012832641602, -0.0002238750457763672, 0.00016415119171142578, 0.0005521774291992188, 0.0009402036666870117, 0.0013282299041748047, 0.0017162561416625977, 0.0021042823791503906, 0.0024923086166381836, 0.0028803348541259766, 0.0032683610916137695, 0.0036563873291015625, 0.0040444135665893555, 0.0044324398040771484, 0.004820466041564941, 0.005208492279052734, 0.005596518516540527, 0.00598454475402832, 0.006372570991516113, 0.006760597229003906, 0.007148623466491699, 0.007536649703979492, 0.007924675941467285, 0.008312702178955078, 0.008700728416442871, 0.009088754653930664, 0.009476780891418457, 0.00986480712890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 38.0, 218.0, 505.0, 203.0, 28.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18809863924980164, -0.1812610775232315, -0.17442351579666138, -0.16758596897125244, -0.1607484072446823, -0.15391084551811218, -0.14707328379154205, -0.14023572206497192, -0.1333981603384018, -0.12656059861183167, -0.11972304433584213, -0.112885482609272, -0.10604792088270187, -0.09921036660671234, -0.09237280488014221, -0.08553524315357208, -0.07869768887758255, -0.07186012715101242, -0.06502257287502289, -0.05818501114845276, -0.05134744942188263, -0.0445098914206028, -0.03767233341932297, -0.030834771692752838, -0.023997213691473007, -0.017159653827548027, -0.010322094894945621, -0.003484535962343216, 0.0033530239015817642, 0.010190583765506744, 0.017028141766786575, 0.023865703493356705, 0.030703261494636536, 0.03754081949591637, 0.044378381222486496, 0.05121593922376633, 0.058053500950336456, 0.06489105522632599, 0.07172861695289612, 0.07856617867946625, 0.08540374040603638, 0.0922413021326065, 0.09907885640859604, 0.10591641813516617, 0.1127539798617363, 0.11959153413772583, 0.12642909586429596, 0.1332666575908661, 0.14010420441627502, 0.14694176614284515, 0.15377932786941528, 0.16061687469482422, 0.16745443642139435, 0.17429199814796448, 0.1811295598745346, 0.18796712160110474, 0.19480468332767487, 0.201642245054245, 0.20847980678081512, 0.21531736850738525, 0.2221549153327942, 0.22899247705936432, 0.23583003878593445, 0.24266760051250458, 0.2495051622390747]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 22.0, 26.0, 31.0, 51.0, 54.0, 67.0, 87.0, 87.0, 66.0, 70.0, 72.0, 72.0, 82.0, 48.0, 49.0, 33.0, 23.0, 17.0, 14.0, 6.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07989686727523804, -0.07736919075250626, -0.07484152168035507, -0.07231384515762329, -0.0697861760854721, -0.06725849956274033, -0.06473082304000854, -0.06220315024256706, -0.05967547744512558, -0.0571478046476841, -0.054620131850242615, -0.052092455327510834, -0.04956478253006935, -0.04703710973262787, -0.04450943320989609, -0.041981760412454605, -0.03945408761501312, -0.03692641481757164, -0.03439874202013016, -0.031871065497398376, -0.029343392699956894, -0.02681571990251541, -0.02428804524242878, -0.021760370582342148, -0.019232697784900665, -0.016705024987459183, -0.014177350327372551, -0.011649676598608494, -0.009122002869844437, -0.0065943291410803795, -0.004066655412316322, -0.0015389807522296906, 0.000988692045211792, 0.003516365773975849, 0.006044039502739906, 0.008571713231503963, 0.01109938696026802, 0.013627060689032078, 0.016154734417796135, 0.018682409077882767, 0.02121008187532425, 0.023737754672765732, 0.026265429332852364, 0.028793103992938995, 0.03132077679038048, 0.03384844958782196, 0.03637612611055374, 0.038903798907995224, 0.04143147170543671, 0.04395914450287819, 0.04648681730031967, 0.04901449382305145, 0.051542166620492935, 0.05406983941793442, 0.0565975159406662, 0.05912518873810768, 0.061652861535549164, 0.06418053805828094, 0.06670820713043213, 0.06923588365316391, 0.07176356017589569, 0.07429122924804688, 0.07681890577077866, 0.07934658229351044, 0.08187425136566162]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 14.0, 6.0, 8.0, 8.0, 15.0, 19.0, 21.0, 35.0, 44.0, 54.0, 73.0, 98.0, 115.0, 145.0, 233.0, 290.0, 419.0, 634.0, 1153.0, 4126.0, 42407.0, 811131.0, 173731.0, 9189.0, 1941.0, 851.0, 451.0, 363.0, 230.0, 170.0, 122.0, 101.0, 80.0, 60.0, 47.0, 35.0, 36.0, 21.0, 11.0, 18.0, 11.0, 9.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04902172088623047, -0.04756736755371094, -0.046113014221191406, -0.044658660888671875, -0.043204307556152344, -0.04174995422363281, -0.04029560089111328, -0.03884124755859375, -0.03738689422607422, -0.03593254089355469, -0.034478187561035156, -0.033023834228515625, -0.031569480895996094, -0.030115127563476562, -0.02866077423095703, -0.0272064208984375, -0.02575206756591797, -0.024297714233398438, -0.022843360900878906, -0.021389007568359375, -0.019934654235839844, -0.018480300903320312, -0.01702594757080078, -0.01557159423828125, -0.014117240905761719, -0.012662887573242188, -0.011208534240722656, -0.009754180908203125, -0.008299827575683594, -0.0068454742431640625, -0.005391120910644531, -0.003936767578125, -0.0024824142456054688, -0.0010280609130859375, 0.00042629241943359375, 0.001880645751953125, 0.0033349990844726562, 0.0047893524169921875, 0.006243705749511719, 0.00769805908203125, 0.009152412414550781, 0.010606765747070312, 0.012061119079589844, 0.013515472412109375, 0.014969825744628906, 0.016424179077148438, 0.01787853240966797, 0.0193328857421875, 0.02078723907470703, 0.022241592407226562, 0.023695945739746094, 0.025150299072265625, 0.026604652404785156, 0.028059005737304688, 0.02951335906982422, 0.03096771240234375, 0.03242206573486328, 0.03387641906738281, 0.035330772399902344, 0.036785125732421875, 0.038239479064941406, 0.03969383239746094, 0.04114818572998047, 0.0426025390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 16.0, 44.0, 108.0, 188.0, 251.0, 191.0, 133.0, 46.0, 16.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01554107666015625, -0.014997124671936035, -0.01445317268371582, -0.013909220695495605, -0.01336526870727539, -0.012821316719055176, -0.012277364730834961, -0.011733412742614746, -0.011189460754394531, -0.010645508766174316, -0.010101556777954102, -0.009557604789733887, -0.009013652801513672, -0.008469700813293457, -0.007925748825073242, -0.007381796836853027, -0.0068378448486328125, -0.006293892860412598, -0.005749940872192383, -0.005205988883972168, -0.004662036895751953, -0.004118084907531738, -0.0035741329193115234, -0.0030301809310913086, -0.0024862289428710938, -0.001942276954650879, -0.001398324966430664, -0.0008543729782104492, -0.0003104209899902344, 0.00023353099822998047, 0.0007774829864501953, 0.0013214349746704102, 0.001865386962890625, 0.00240933895111084, 0.0029532909393310547, 0.0034972429275512695, 0.004041194915771484, 0.004585146903991699, 0.005129098892211914, 0.005673050880432129, 0.006217002868652344, 0.006760954856872559, 0.0073049068450927734, 0.007848858833312988, 0.008392810821533203, 0.008936762809753418, 0.009480714797973633, 0.010024666786193848, 0.010568618774414062, 0.011112570762634277, 0.011656522750854492, 0.012200474739074707, 0.012744426727294922, 0.013288378715515137, 0.013832330703735352, 0.014376282691955566, 0.014920234680175781, 0.015464186668395996, 0.01600813865661621, 0.016552090644836426, 0.01709604263305664, 0.017639994621276855, 0.01818394660949707, 0.018727898597717285, 0.0192718505859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 14.0, 28.0, 25.0, 38.0, 40.0, 87.0, 139.0, 236.0, 430.0, 786.0, 1911.0, 8974.0, 218744.0, 780884.0, 30422.0, 3298.0, 1147.0, 522.0, 292.0, 162.0, 107.0, 76.0, 43.0, 41.0, 18.0, 21.0, 8.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044525146484375, -0.04294776916503906, -0.041370391845703125, -0.03979301452636719, -0.03821563720703125, -0.03663825988769531, -0.035060882568359375, -0.03348350524902344, -0.0319061279296875, -0.030328750610351562, -0.028751373291015625, -0.027173995971679688, -0.02559661865234375, -0.024019241333007812, -0.022441864013671875, -0.020864486694335938, -0.019287109375, -0.017709732055664062, -0.016132354736328125, -0.014554977416992188, -0.01297760009765625, -0.011400222778320312, -0.009822845458984375, -0.008245468139648438, -0.0066680908203125, -0.0050907135009765625, -0.003513336181640625, -0.0019359588623046875, -0.00035858154296875, 0.0012187957763671875, 0.002796173095703125, 0.0043735504150390625, 0.005950927734375, 0.0075283050537109375, 0.009105682373046875, 0.010683059692382812, 0.01226043701171875, 0.013837814331054688, 0.015415191650390625, 0.016992568969726562, 0.0185699462890625, 0.020147323608398438, 0.021724700927734375, 0.023302078247070312, 0.02487945556640625, 0.026456832885742188, 0.028034210205078125, 0.029611587524414062, 0.03118896484375, 0.03276634216308594, 0.034343719482421875, 0.03592109680175781, 0.03749847412109375, 0.03907585144042969, 0.040653228759765625, 0.04223060607910156, 0.0438079833984375, 0.04538536071777344, 0.046962738037109375, 0.04854011535644531, 0.05011749267578125, 0.05169486999511719, 0.053272247314453125, 0.05484962463378906, 0.056427001953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 4.0, 15.0, 11.0, 22.0, 20.0, 21.0, 25.0, 28.0, 30.0, 26.0, 37.0, 40.0, 27.0, 35.0, 43.0, 46.0, 40.0, 48.0, 29.0, 32.0, 31.0, 36.0, 44.0, 38.0, 33.0, 36.0, 35.0, 23.0, 15.0, 18.0, 12.0, 16.0, 9.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01213836669921875, -0.011754989624023438, -0.011371612548828125, -0.010988235473632812, -0.0106048583984375, -0.010221481323242188, -0.009838104248046875, -0.009454727172851562, -0.00907135009765625, -0.008687973022460938, -0.008304595947265625, -0.007921218872070312, -0.007537841796875, -0.0071544647216796875, -0.006771087646484375, -0.0063877105712890625, -0.00600433349609375, -0.0056209564208984375, -0.005237579345703125, -0.0048542022705078125, -0.0044708251953125, -0.0040874481201171875, -0.003704071044921875, -0.0033206939697265625, -0.00293731689453125, -0.0025539398193359375, -0.002170562744140625, -0.0017871856689453125, -0.00140380859375, -0.0010204315185546875, -0.000637054443359375, -0.0002536773681640625, 0.00012969970703125, 0.0005130767822265625, 0.000896453857421875, 0.0012798309326171875, 0.0016632080078125, 0.0020465850830078125, 0.002429962158203125, 0.0028133392333984375, 0.00319671630859375, 0.0035800933837890625, 0.003963470458984375, 0.0043468475341796875, 0.004730224609375, 0.0051136016845703125, 0.005496978759765625, 0.0058803558349609375, 0.00626373291015625, 0.0066471099853515625, 0.007030487060546875, 0.0074138641357421875, 0.0077972412109375, 0.008180618286132812, 0.008563995361328125, 0.008947372436523438, 0.00933074951171875, 0.009714126586914062, 0.010097503662109375, 0.010480880737304688, 0.0108642578125, 0.011247634887695312, 0.011631011962890625, 0.012014389038085938, 0.01239776611328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 6.0, 6.0, 12.0, 18.0, 28.0, 44.0, 65.0, 98.0, 181.0, 374.0, 874.0, 2171.0, 6945.0, 38067.0, 560182.0, 401083.0, 29071.0, 5882.0, 1890.0, 753.0, 331.0, 172.0, 99.0, 62.0, 35.0, 23.0, 15.0, 16.0, 9.0, 5.0, 4.0, 4.0, 3.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.014801025390625, -0.014377355575561523, -0.013953685760498047, -0.01353001594543457, -0.013106346130371094, -0.012682676315307617, -0.01225900650024414, -0.011835336685180664, -0.011411666870117188, -0.010987997055053711, -0.010564327239990234, -0.010140657424926758, -0.009716987609863281, -0.009293317794799805, -0.008869647979736328, -0.008445978164672852, -0.008022308349609375, -0.0075986385345458984, -0.007174968719482422, -0.006751298904418945, -0.006327629089355469, -0.005903959274291992, -0.005480289459228516, -0.005056619644165039, -0.0046329498291015625, -0.004209280014038086, -0.0037856101989746094, -0.003361940383911133, -0.0029382705688476562, -0.0025146007537841797, -0.002090930938720703, -0.0016672611236572266, -0.00124359130859375, -0.0008199214935302734, -0.0003962516784667969, 2.7418136596679688e-05, 0.00045108795166015625, 0.0008747577667236328, 0.0012984275817871094, 0.001722097396850586, 0.0021457672119140625, 0.002569437026977539, 0.0029931068420410156, 0.003416776657104492, 0.0038404464721679688, 0.004264116287231445, 0.004687786102294922, 0.0051114559173583984, 0.005535125732421875, 0.0059587955474853516, 0.006382465362548828, 0.006806135177612305, 0.007229804992675781, 0.007653474807739258, 0.008077144622802734, 0.008500814437866211, 0.008924484252929688, 0.009348154067993164, 0.00977182388305664, 0.010195493698120117, 0.010619163513183594, 0.01104283332824707, 0.011466503143310547, 0.011890172958374023, 0.0123138427734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 15.0, 13.0, 24.0, 33.0, 26.0, 44.0, 44.0, 64.0, 83.0, 83.0, 81.0, 95.0, 71.0, 70.0, 41.0, 41.0, 41.0, 19.0, 17.0, 21.0, 14.0, 5.0, 12.0, 9.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.967782974243164e-05, -6.712786853313446e-05, -6.457790732383728e-05, -6.20279461145401e-05, -5.947798490524292e-05, -5.692802369594574e-05, -5.437806248664856e-05, -5.182810127735138e-05, -4.92781400680542e-05, -4.672817885875702e-05, -4.417821764945984e-05, -4.162825644016266e-05, -3.907829523086548e-05, -3.65283340215683e-05, -3.397837281227112e-05, -3.142841160297394e-05, -2.8878450393676758e-05, -2.6328489184379578e-05, -2.3778527975082397e-05, -2.1228566765785217e-05, -1.8678605556488037e-05, -1.6128644347190857e-05, -1.3578683137893677e-05, -1.1028721928596497e-05, -8.478760719299316e-06, -5.928799510002136e-06, -3.378838300704956e-06, -8.288770914077759e-07, 1.7210841178894043e-06, 4.2710453271865845e-06, 6.821006536483765e-06, 9.370967745780945e-06, 1.1920928955078125e-05, 1.4470890164375305e-05, 1.7020851373672485e-05, 1.9570812582969666e-05, 2.2120773792266846e-05, 2.4670735001564026e-05, 2.7220696210861206e-05, 2.9770657420158386e-05, 3.2320618629455566e-05, 3.4870579838752747e-05, 3.742054104804993e-05, 3.997050225734711e-05, 4.252046346664429e-05, 4.507042467594147e-05, 4.762038588523865e-05, 5.017034709453583e-05, 5.272030830383301e-05, 5.527026951313019e-05, 5.782023072242737e-05, 6.037019193172455e-05, 6.292015314102173e-05, 6.547011435031891e-05, 6.802007555961609e-05, 7.057003676891327e-05, 7.311999797821045e-05, 7.566995918750763e-05, 7.821992039680481e-05, 8.076988160610199e-05, 8.331984281539917e-05, 8.586980402469635e-05, 8.841976523399353e-05, 9.096972644329071e-05, 9.351968765258789e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 20.0, 25.0, 35.0, 45.0, 87.0, 134.0, 297.0, 645.0, 2300.0, 22689.0, 926168.0, 90032.0, 4270.0, 944.0, 362.0, 181.0, 111.0, 53.0, 46.0, 31.0, 24.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.031402587890625, -0.03063058853149414, -0.02985858917236328, -0.029086589813232422, -0.028314590454101562, -0.027542591094970703, -0.026770591735839844, -0.025998592376708984, -0.025226593017578125, -0.024454593658447266, -0.023682594299316406, -0.022910594940185547, -0.022138595581054688, -0.021366596221923828, -0.02059459686279297, -0.01982259750366211, -0.01905059814453125, -0.01827859878540039, -0.01750659942626953, -0.016734600067138672, -0.015962600708007812, -0.015190601348876953, -0.014418601989746094, -0.013646602630615234, -0.012874603271484375, -0.012102603912353516, -0.011330604553222656, -0.010558605194091797, -0.009786605834960938, -0.009014606475830078, -0.008242607116699219, -0.007470607757568359, -0.0066986083984375, -0.005926609039306641, -0.005154609680175781, -0.004382610321044922, -0.0036106109619140625, -0.002838611602783203, -0.0020666122436523438, -0.0012946128845214844, -0.000522613525390625, 0.0002493858337402344, 0.0010213851928710938, 0.0017933845520019531, 0.0025653839111328125, 0.003337383270263672, 0.004109382629394531, 0.004881381988525391, 0.00565338134765625, 0.006425380706787109, 0.007197380065917969, 0.007969379425048828, 0.008741378784179688, 0.009513378143310547, 0.010285377502441406, 0.011057376861572266, 0.011829376220703125, 0.012601375579833984, 0.013373374938964844, 0.014145374298095703, 0.014917373657226562, 0.015689373016357422, 0.01646137237548828, 0.01723337173461914, 0.01800537109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 19.0, 13.0, 23.0, 27.0, 28.0, 56.0, 72.0, 87.0, 125.0, 110.0, 108.0, 100.0, 58.0, 36.0, 25.0, 26.0, 16.0, 16.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005786895751953125, -0.005539357662200928, -0.0052918195724487305, -0.005044281482696533, -0.004796743392944336, -0.004549205303192139, -0.004301667213439941, -0.004054129123687744, -0.003806591033935547, -0.0035590529441833496, -0.0033115148544311523, -0.003063976764678955, -0.002816438674926758, -0.0025689005851745605, -0.0023213624954223633, -0.002073824405670166, -0.0018262863159179688, -0.0015787482261657715, -0.0013312101364135742, -0.001083672046661377, -0.0008361339569091797, -0.0005885958671569824, -0.00034105777740478516, -9.351968765258789e-05, 0.00015401840209960938, 0.00040155649185180664, 0.0006490945816040039, 0.0008966326713562012, 0.0011441707611083984, 0.0013917088508605957, 0.001639246940612793, 0.0018867850303649902, 0.0021343231201171875, 0.0023818612098693848, 0.002629399299621582, 0.0028769373893737793, 0.0031244754791259766, 0.003372013568878174, 0.003619551658630371, 0.0038670897483825684, 0.004114627838134766, 0.004362165927886963, 0.00460970401763916, 0.004857242107391357, 0.005104780197143555, 0.005352318286895752, 0.005599856376647949, 0.0058473944664001465, 0.006094932556152344, 0.006342470645904541, 0.006590008735656738, 0.0068375468254089355, 0.007085084915161133, 0.00733262300491333, 0.007580161094665527, 0.007827699184417725, 0.008075237274169922, 0.00832277536392212, 0.008570313453674316, 0.008817851543426514, 0.009065389633178711, 0.009312927722930908, 0.009560465812683105, 0.009808003902435303, 0.0100555419921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 28.0, 299.0, 516.0, 125.0, 30.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2858009338378906, -0.2782890796661377, -0.2707771956920624, -0.26326534152030945, -0.25575345754623413, -0.2482416033744812, -0.24072974920272827, -0.23321788012981415, -0.22570601105690002, -0.2181941419839859, -0.21068227291107178, -0.20317041873931885, -0.19565854966640472, -0.1881466805934906, -0.18063482642173767, -0.17312295734882355, -0.16561108827590942, -0.1580992192029953, -0.15058735013008118, -0.14307549595832825, -0.13556362688541412, -0.1280517578125, -0.12053989619016647, -0.11302803456783295, -0.10551616549491882, -0.0980042964220047, -0.09049243479967117, -0.08298057317733765, -0.07546870410442352, -0.0679568350315094, -0.06044497340917587, -0.05293310806155205, -0.04542122781276703, -0.037909362465143204, -0.03039749711751938, -0.022885631769895554, -0.015373766422271729, -0.007861901074647903, -0.00035003572702407837, 0.007161829620599747, 0.014673694968223572, 0.022185560315847397, 0.029697425663471222, 0.03720929101109505, 0.04472115635871887, 0.0522330217063427, 0.05974488705396652, 0.06725674867630005, 0.07476861774921417, 0.0822804868221283, 0.08979234844446182, 0.09730421006679535, 0.10481607913970947, 0.1123279482126236, 0.11983980983495712, 0.12735167145729065, 0.13486354053020477, 0.1423754096031189, 0.14988726377487183, 0.15739913284778595, 0.16491100192070007, 0.1724228709936142, 0.17993474006652832, 0.18744659423828125, 0.19495846331119537]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 9.0, 13.0, 13.0, 13.0, 15.0, 22.0, 20.0, 26.0, 34.0, 27.0, 55.0, 36.0, 46.0, 52.0, 63.0, 48.0, 39.0, 58.0, 50.0, 48.0, 46.0, 38.0, 43.0, 39.0, 22.0, 19.0, 13.0, 20.0, 8.0, 16.0, 7.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04639232158660889, -0.044932566583156586, -0.043472807854413986, -0.04201304912567139, -0.040553294122219086, -0.039093539118766785, -0.037633780390024185, -0.036174021661281586, -0.034714266657829285, -0.033254511654376984, -0.031794752925634384, -0.030334996059536934, -0.028875239193439484, -0.027415482327342033, -0.025955725461244583, -0.024495968595147133, -0.023036211729049683, -0.021576454862952232, -0.020116697996854782, -0.018656941130757332, -0.01719718426465988, -0.01573742739856243, -0.014277670532464981, -0.01281791366636753, -0.01135815680027008, -0.00989839993417263, -0.00843864306807518, -0.00697888620197773, -0.0055191293358802795, -0.004059372469782829, -0.002599615603685379, -0.0011398587375879288, 0.0003198981285095215, 0.0017796549946069717, 0.003239411860704422, 0.004699168726801872, 0.0061589255928993225, 0.007618682458996773, 0.009078439325094223, 0.010538196191191673, 0.011997953057289124, 0.013457709923386574, 0.014917466789484024, 0.016377223655581474, 0.017836980521678925, 0.019296737387776375, 0.020756494253873825, 0.022216251119971275, 0.023676007986068726, 0.025135764852166176, 0.026595521718263626, 0.028055278584361076, 0.029515035450458527, 0.030974792316555977, 0.03243454918265343, 0.03389430791139603, 0.03535406291484833, 0.03681381791830063, 0.03827357664704323, 0.03973333537578583, 0.04119309037923813, 0.04265284538269043, 0.04411260411143303, 0.04557236284017563, 0.04703211784362793]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 6.0, 16.0, 34.0, 28.0, 57.0, 72.0, 128.0, 172.0, 321.0, 574.0, 1042.0, 2769.0, 6630.0, 42508.0, 3946726.0, 179045.0, 9150.0, 2402.0, 871.0, 570.0, 364.0, 239.0, 161.0, 93.0, 84.0, 70.0, 38.0, 26.0, 26.0, 14.0, 13.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03173828125, -0.030703067779541016, -0.02966785430908203, -0.028632640838623047, -0.027597427368164062, -0.026562213897705078, -0.025527000427246094, -0.02449178695678711, -0.023456573486328125, -0.02242136001586914, -0.021386146545410156, -0.020350933074951172, -0.019315719604492188, -0.018280506134033203, -0.01724529266357422, -0.016210079193115234, -0.01517486572265625, -0.014139652252197266, -0.013104438781738281, -0.012069225311279297, -0.011034011840820312, -0.009998798370361328, -0.008963584899902344, -0.00792837142944336, -0.006893157958984375, -0.005857944488525391, -0.004822731018066406, -0.003787517547607422, -0.0027523040771484375, -0.0017170906066894531, -0.0006818771362304688, 0.0003533363342285156, 0.0013885498046875, 0.0024237632751464844, 0.0034589767456054688, 0.004494190216064453, 0.0055294036865234375, 0.006564617156982422, 0.007599830627441406, 0.00863504409790039, 0.009670257568359375, 0.01070547103881836, 0.011740684509277344, 0.012775897979736328, 0.013811111450195312, 0.014846324920654297, 0.01588153839111328, 0.016916751861572266, 0.01795196533203125, 0.018987178802490234, 0.02002239227294922, 0.021057605743408203, 0.022092819213867188, 0.023128032684326172, 0.024163246154785156, 0.02519845962524414, 0.026233673095703125, 0.02726888656616211, 0.028304100036621094, 0.029339313507080078, 0.030374526977539062, 0.03140974044799805, 0.03244495391845703, 0.033480167388916016, 0.034515380859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 40.0, 85.0, 190.0, 259.0, 200.0, 142.0, 52.0, 20.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01702880859375, -0.016456127166748047, -0.015883445739746094, -0.01531076431274414, -0.014738082885742188, -0.014165401458740234, -0.013592720031738281, -0.013020038604736328, -0.012447357177734375, -0.011874675750732422, -0.011301994323730469, -0.010729312896728516, -0.010156631469726562, -0.00958395004272461, -0.009011268615722656, -0.008438587188720703, -0.00786590576171875, -0.007293224334716797, -0.006720542907714844, -0.006147861480712891, -0.0055751800537109375, -0.005002498626708984, -0.004429817199707031, -0.003857135772705078, -0.003284454345703125, -0.002711772918701172, -0.0021390914916992188, -0.0015664100646972656, -0.0009937286376953125, -0.0004210472106933594, 0.00015163421630859375, 0.0007243156433105469, 0.0012969970703125, 0.0018696784973144531, 0.0024423599243164062, 0.0030150413513183594, 0.0035877227783203125, 0.004160404205322266, 0.004733085632324219, 0.005305767059326172, 0.005878448486328125, 0.006451129913330078, 0.007023811340332031, 0.007596492767333984, 0.008169174194335938, 0.00874185562133789, 0.009314537048339844, 0.009887218475341797, 0.01045989990234375, 0.011032581329345703, 0.011605262756347656, 0.01217794418334961, 0.012750625610351562, 0.013323307037353516, 0.013895988464355469, 0.014468669891357422, 0.015041351318359375, 0.015614032745361328, 0.01618671417236328, 0.016759395599365234, 0.017332077026367188, 0.01790475845336914, 0.018477439880371094, 0.019050121307373047, 0.019622802734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 16.0, 23.0, 24.0, 37.0, 57.0, 73.0, 135.0, 237.0, 461.0, 946.0, 3401.0, 27760.0, 3553829.0, 592231.0, 11211.0, 2177.0, 780.0, 362.0, 181.0, 104.0, 76.0, 39.0, 29.0, 24.0, 17.0, 7.0, 9.0, 3.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02984619140625, -0.02873373031616211, -0.02762126922607422, -0.026508808135986328, -0.025396347045898438, -0.024283885955810547, -0.023171424865722656, -0.022058963775634766, -0.020946502685546875, -0.019834041595458984, -0.018721580505371094, -0.017609119415283203, -0.016496658325195312, -0.015384197235107422, -0.014271736145019531, -0.01315927505493164, -0.01204681396484375, -0.01093435287475586, -0.009821891784667969, -0.008709430694580078, -0.0075969696044921875, -0.006484508514404297, -0.005372047424316406, -0.004259586334228516, -0.003147125244140625, -0.0020346641540527344, -0.0009222030639648438, 0.00019025802612304688, 0.0013027191162109375, 0.002415180206298828, 0.0035276412963867188, 0.004640102386474609, 0.0057525634765625, 0.006865024566650391, 0.007977485656738281, 0.009089946746826172, 0.010202407836914062, 0.011314868927001953, 0.012427330017089844, 0.013539791107177734, 0.014652252197265625, 0.015764713287353516, 0.016877174377441406, 0.017989635467529297, 0.019102096557617188, 0.020214557647705078, 0.02132701873779297, 0.02243947982788086, 0.02355194091796875, 0.02466440200805664, 0.02577686309814453, 0.026889324188232422, 0.028001785278320312, 0.029114246368408203, 0.030226707458496094, 0.031339168548583984, 0.032451629638671875, 0.033564090728759766, 0.034676551818847656, 0.03578901290893555, 0.03690147399902344, 0.03801393508911133, 0.03912639617919922, 0.04023885726928711, 0.041351318359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 20.0, 18.0, 29.0, 31.0, 60.0, 84.0, 104.0, 135.0, 227.0, 313.0, 495.0, 642.0, 531.0, 391.0, 302.0, 187.0, 139.0, 101.0, 63.0, 54.0, 27.0, 31.0, 21.0, 19.0, 7.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01004791259765625, -0.009709000587463379, -0.009370088577270508, -0.009031176567077637, -0.008692264556884766, -0.008353352546691895, -0.008014440536499023, -0.007675528526306152, -0.007336616516113281, -0.00699770450592041, -0.006658792495727539, -0.006319880485534668, -0.005980968475341797, -0.005642056465148926, -0.005303144454956055, -0.004964232444763184, -0.0046253204345703125, -0.004286408424377441, -0.00394749641418457, -0.0036085844039916992, -0.003269672393798828, -0.002930760383605957, -0.002591848373413086, -0.002252936363220215, -0.0019140243530273438, -0.0015751123428344727, -0.0012362003326416016, -0.0008972883224487305, -0.0005583763122558594, -0.00021946430206298828, 0.00011944770812988281, 0.0004583597183227539, 0.000797271728515625, 0.001136183738708496, 0.0014750957489013672, 0.0018140077590942383, 0.0021529197692871094, 0.0024918317794799805, 0.0028307437896728516, 0.0031696557998657227, 0.0035085678100585938, 0.003847479820251465, 0.004186391830444336, 0.004525303840637207, 0.004864215850830078, 0.005203127861022949, 0.00554203987121582, 0.005880951881408691, 0.0062198638916015625, 0.006558775901794434, 0.006897687911987305, 0.007236599922180176, 0.007575511932373047, 0.007914423942565918, 0.008253335952758789, 0.00859224796295166, 0.008931159973144531, 0.009270071983337402, 0.009608983993530273, 0.009947896003723145, 0.010286808013916016, 0.010625720024108887, 0.010964632034301758, 0.011303544044494629, 0.0116424560546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 20.0, 198.0, 542.0, 200.0, 26.0, 12.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25941604375839233, -0.2524815797805786, -0.2455471158027649, -0.23861265182495117, -0.23167817294597626, -0.22474370896816254, -0.21780924499034882, -0.2108747810125351, -0.20394031703472137, -0.19700585305690765, -0.19007138907909393, -0.18313691020011902, -0.1762024462223053, -0.16926798224449158, -0.16233351826667786, -0.15539905428886414, -0.14846459031105042, -0.1415301263332367, -0.13459566235542297, -0.12766119837760925, -0.12072672694921494, -0.11379225552082062, -0.1068577915430069, -0.09992332756519318, -0.09298884868621826, -0.08605438470840454, -0.07911991328001022, -0.0721854493021965, -0.06525098532438278, -0.05831651762127876, -0.051382049918174744, -0.04444758594036102, -0.0375131219625473, -0.030578656122088432, -0.023644190281629562, -0.016709722578525543, -0.009775256738066673, -0.0028407908976078033, 0.004093676805496216, 0.011028140783309937, 0.017962608486413956, 0.024897074326872826, 0.031831540167331696, 0.038766007870435715, 0.045700475573539734, 0.052634939551353455, 0.059569407254457474, 0.0665038675069809, 0.07343833893537521, 0.08037280291318893, 0.08730727434158325, 0.09424173831939697, 0.1011762022972107, 0.10811066627502441, 0.11504513770341873, 0.12197960168123245, 0.12891407310962677, 0.1358485370874405, 0.1427830010652542, 0.14971747994422913, 0.15665194392204285, 0.16358640789985657, 0.1705208718776703, 0.177455335855484, 0.18438979983329773]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 15.0, 19.0, 26.0, 33.0, 41.0, 37.0, 48.0, 51.0, 63.0, 50.0, 50.0, 61.0, 49.0, 49.0, 59.0, 45.0, 49.0, 45.0, 44.0, 29.0, 19.0, 23.0, 20.0, 14.0, 9.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.05988001823425293, -0.05845063924789429, -0.05702126398682594, -0.0555918887257576, -0.054162509739398956, -0.052733130753040314, -0.05130375549197197, -0.049874380230903625, -0.04844500124454498, -0.04701562225818634, -0.045586246997117996, -0.04415687173604965, -0.04272749274969101, -0.04129811376333237, -0.03986873850226402, -0.03843936324119568, -0.037009984254837036, -0.035580605268478394, -0.03415123000741005, -0.032721854746341705, -0.03129247575998306, -0.02986309863626957, -0.028433721512556076, -0.027004344388842583, -0.02557496726512909, -0.024145590141415596, -0.022716213017702103, -0.02128683589398861, -0.019857458770275116, -0.018428081646561623, -0.01699870452284813, -0.015569327399134636, -0.014139950275421143, -0.01271057315170765, -0.011281196027994156, -0.009851818904280663, -0.00842244178056717, -0.006993064656853676, -0.0055636875331401825, -0.004134310409426689, -0.002704933285713196, -0.0012755561619997025, 0.0001538209617137909, 0.0015831980854272842, 0.0030125752091407776, 0.004441952332854271, 0.005871329456567764, 0.007300706580281258, 0.008730083703994751, 0.010159460827708244, 0.011588837951421738, 0.013018215075135231, 0.014447592198848724, 0.015876969322562218, 0.01730634644627571, 0.018735723569989204, 0.020165100693702698, 0.02159447781741619, 0.023023854941129684, 0.024453232064843178, 0.02588260918855667, 0.027311986312270164, 0.028741363435983658, 0.03017074055969715, 0.031600117683410645]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 6.0, 5.0, 9.0, 15.0, 25.0, 29.0, 44.0, 75.0, 109.0, 123.0, 241.0, 427.0, 654.0, 1389.0, 6929.0, 555890.0, 473217.0, 6183.0, 1381.0, 666.0, 411.0, 236.0, 173.0, 99.0, 69.0, 55.0, 24.0, 19.0, 18.0, 7.0, 10.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05535888671875, -0.053680419921875, -0.052001953125, -0.050323486328125, -0.04864501953125, -0.046966552734375, -0.0452880859375, -0.043609619140625, -0.04193115234375, -0.040252685546875, -0.03857421875, -0.036895751953125, -0.03521728515625, -0.033538818359375, -0.0318603515625, -0.030181884765625, -0.02850341796875, -0.026824951171875, -0.025146484375, -0.023468017578125, -0.02178955078125, -0.020111083984375, -0.0184326171875, -0.016754150390625, -0.01507568359375, -0.013397216796875, -0.01171875, -0.010040283203125, -0.00836181640625, -0.006683349609375, -0.0050048828125, -0.003326416015625, -0.00164794921875, 3.0517578125e-05, 0.001708984375, 0.003387451171875, 0.00506591796875, 0.006744384765625, 0.0084228515625, 0.010101318359375, 0.01177978515625, 0.013458251953125, 0.01513671875, 0.016815185546875, 0.01849365234375, 0.020172119140625, 0.0218505859375, 0.023529052734375, 0.02520751953125, 0.026885986328125, 0.028564453125, 0.030242919921875, 0.03192138671875, 0.033599853515625, 0.0352783203125, 0.036956787109375, 0.03863525390625, 0.040313720703125, 0.0419921875, 0.043670654296875, 0.04534912109375, 0.047027587890625, 0.0487060546875, 0.050384521484375, 0.05206298828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 41.0, 106.0, 220.0, 254.0, 204.0, 123.0, 30.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0169677734375, -0.01639246940612793, -0.01581716537475586, -0.015241861343383789, -0.014666557312011719, -0.014091253280639648, -0.013515949249267578, -0.012940645217895508, -0.012365341186523438, -0.011790037155151367, -0.011214733123779297, -0.010639429092407227, -0.010064125061035156, -0.009488821029663086, -0.008913516998291016, -0.008338212966918945, -0.007762908935546875, -0.007187604904174805, -0.006612300872802734, -0.006036996841430664, -0.005461692810058594, -0.0048863887786865234, -0.004311084747314453, -0.003735780715942383, -0.0031604766845703125, -0.002585172653198242, -0.002009868621826172, -0.0014345645904541016, -0.0008592605590820312, -0.00028395652770996094, 0.0002913475036621094, 0.0008666515350341797, 0.00144195556640625, 0.0020172595977783203, 0.0025925636291503906, 0.003167867660522461, 0.0037431716918945312, 0.0043184757232666016, 0.004893779754638672, 0.005469083786010742, 0.0060443878173828125, 0.006619691848754883, 0.007194995880126953, 0.0077702999114990234, 0.008345603942871094, 0.008920907974243164, 0.009496212005615234, 0.010071516036987305, 0.010646820068359375, 0.011222124099731445, 0.011797428131103516, 0.012372732162475586, 0.012948036193847656, 0.013523340225219727, 0.014098644256591797, 0.014673948287963867, 0.015249252319335938, 0.015824556350708008, 0.016399860382080078, 0.01697516441345215, 0.01755046844482422, 0.01812577247619629, 0.01870107650756836, 0.01927638053894043, 0.0198516845703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 9.0, 19.0, 17.0, 35.0, 51.0, 61.0, 82.0, 101.0, 150.0, 214.0, 329.0, 670.0, 1300.0, 3374.0, 11140.0, 60423.0, 410241.0, 467967.0, 72445.0, 12942.0, 3738.0, 1416.0, 717.0, 373.0, 200.0, 136.0, 111.0, 70.0, 47.0, 44.0, 38.0, 19.0, 18.0, 15.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0205841064453125, -0.020013093948364258, -0.019442081451416016, -0.018871068954467773, -0.01830005645751953, -0.01772904396057129, -0.017158031463623047, -0.016587018966674805, -0.016016006469726562, -0.01544499397277832, -0.014873981475830078, -0.014302968978881836, -0.013731956481933594, -0.013160943984985352, -0.01258993148803711, -0.012018918991088867, -0.011447906494140625, -0.010876893997192383, -0.01030588150024414, -0.009734869003295898, -0.009163856506347656, -0.008592844009399414, -0.008021831512451172, -0.00745081901550293, -0.0068798065185546875, -0.006308794021606445, -0.005737781524658203, -0.005166769027709961, -0.004595756530761719, -0.0040247440338134766, -0.0034537315368652344, -0.002882719039916992, -0.00231170654296875, -0.0017406940460205078, -0.0011696815490722656, -0.0005986690521240234, -2.765655517578125e-05, 0.0005433559417724609, 0.0011143684387207031, 0.0016853809356689453, 0.0022563934326171875, 0.0028274059295654297, 0.003398418426513672, 0.003969430923461914, 0.004540443420410156, 0.0051114559173583984, 0.005682468414306641, 0.006253480911254883, 0.006824493408203125, 0.007395505905151367, 0.00796651840209961, 0.008537530899047852, 0.009108543395996094, 0.009679555892944336, 0.010250568389892578, 0.01082158088684082, 0.011392593383789062, 0.011963605880737305, 0.012534618377685547, 0.013105630874633789, 0.013676643371582031, 0.014247655868530273, 0.014818668365478516, 0.015389680862426758, 0.015960693359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 5.0, 11.0, 14.0, 21.0, 19.0, 19.0, 22.0, 23.0, 19.0, 34.0, 31.0, 28.0, 54.0, 50.0, 54.0, 45.0, 46.0, 41.0, 48.0, 57.0, 41.0, 35.0, 40.0, 35.0, 29.0, 22.0, 23.0, 27.0, 20.0, 20.0, 10.0, 14.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01031494140625, -0.009937524795532227, -0.009560108184814453, -0.00918269157409668, -0.008805274963378906, -0.008427858352661133, -0.00805044174194336, -0.007673025131225586, -0.0072956085205078125, -0.006918191909790039, -0.006540775299072266, -0.006163358688354492, -0.005785942077636719, -0.005408525466918945, -0.005031108856201172, -0.0046536922454833984, -0.004276275634765625, -0.0038988590240478516, -0.003521442413330078, -0.0031440258026123047, -0.0027666091918945312, -0.002389192581176758, -0.0020117759704589844, -0.001634359359741211, -0.0012569427490234375, -0.0008795261383056641, -0.0005021095275878906, -0.0001246929168701172, 0.00025272369384765625, 0.0006301403045654297, 0.0010075569152832031, 0.0013849735260009766, 0.00176239013671875, 0.0021398067474365234, 0.002517223358154297, 0.0028946399688720703, 0.0032720565795898438, 0.003649473190307617, 0.004026889801025391, 0.004404306411743164, 0.0047817230224609375, 0.005159139633178711, 0.005536556243896484, 0.005913972854614258, 0.006291389465332031, 0.006668806076049805, 0.007046222686767578, 0.0074236392974853516, 0.007801055908203125, 0.008178472518920898, 0.008555889129638672, 0.008933305740356445, 0.009310722351074219, 0.009688138961791992, 0.010065555572509766, 0.010442972183227539, 0.010820388793945312, 0.011197805404663086, 0.01157522201538086, 0.011952638626098633, 0.012330055236816406, 0.01270747184753418, 0.013084888458251953, 0.013462305068969727, 0.0138397216796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 10.0, 15.0, 27.0, 32.0, 46.0, 75.0, 147.0, 259.0, 427.0, 846.0, 1690.0, 3580.0, 9713.0, 50437.0, 633139.0, 308926.0, 26531.0, 6911.0, 2795.0, 1352.0, 655.0, 350.0, 226.0, 126.0, 68.0, 50.0, 29.0, 20.0, 16.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.009124755859375, -0.008828878402709961, -0.008533000946044922, -0.008237123489379883, -0.007941246032714844, -0.007645368576049805, -0.007349491119384766, -0.0070536136627197266, -0.0067577362060546875, -0.0064618587493896484, -0.006165981292724609, -0.00587010383605957, -0.005574226379394531, -0.005278348922729492, -0.004982471466064453, -0.004686594009399414, -0.004390716552734375, -0.004094839096069336, -0.003798961639404297, -0.003503084182739258, -0.0032072067260742188, -0.0029113292694091797, -0.0026154518127441406, -0.0023195743560791016, -0.0020236968994140625, -0.0017278194427490234, -0.0014319419860839844, -0.0011360645294189453, -0.0008401870727539062, -0.0005443096160888672, -0.0002484321594238281, 4.744529724121094e-05, 0.00034332275390625, 0.0006392002105712891, 0.0009350776672363281, 0.0012309551239013672, 0.0015268325805664062, 0.0018227100372314453, 0.0021185874938964844, 0.0024144649505615234, 0.0027103424072265625, 0.0030062198638916016, 0.0033020973205566406, 0.0035979747772216797, 0.0038938522338867188, 0.004189729690551758, 0.004485607147216797, 0.004781484603881836, 0.005077362060546875, 0.005373239517211914, 0.005669116973876953, 0.005964994430541992, 0.006260871887207031, 0.00655674934387207, 0.006852626800537109, 0.0071485042572021484, 0.0074443817138671875, 0.0077402591705322266, 0.008036136627197266, 0.008332014083862305, 0.008627891540527344, 0.008923768997192383, 0.009219646453857422, 0.009515523910522461, 0.0098114013671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 8.0, 10.0, 16.0, 17.0, 17.0, 24.0, 34.0, 39.0, 36.0, 39.0, 55.0, 61.0, 101.0, 91.0, 61.0, 48.0, 62.0, 33.0, 33.0, 34.0, 33.0, 26.0, 17.0, 10.0, 21.0, 3.0, 11.0, 10.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.164478302001953e-05, -6.9422647356987e-05, -6.720051169395447e-05, -6.497837603092194e-05, -6.27562403678894e-05, -6.053410470485687e-05, -5.831196904182434e-05, -5.608983337879181e-05, -5.386769771575928e-05, -5.1645562052726746e-05, -4.9423426389694214e-05, -4.720129072666168e-05, -4.497915506362915e-05, -4.275701940059662e-05, -4.053488373756409e-05, -3.8312748074531555e-05, -3.6090612411499023e-05, -3.386847674846649e-05, -3.164634108543396e-05, -2.9424205422401428e-05, -2.7202069759368896e-05, -2.4979934096336365e-05, -2.2757798433303833e-05, -2.05356627702713e-05, -1.831352710723877e-05, -1.6091391444206238e-05, -1.3869255781173706e-05, -1.1647120118141174e-05, -9.424984455108643e-06, -7.202848792076111e-06, -4.980713129043579e-06, -2.7585774660110474e-06, -5.364418029785156e-07, 1.6856938600540161e-06, 3.907829523086548e-06, 6.12996518611908e-06, 8.352100849151611e-06, 1.0574236512184143e-05, 1.2796372175216675e-05, 1.5018507838249207e-05, 1.7240643501281738e-05, 1.946277916431427e-05, 2.1684914827346802e-05, 2.3907050490379333e-05, 2.6129186153411865e-05, 2.8351321816444397e-05, 3.057345747947693e-05, 3.279559314250946e-05, 3.501772880554199e-05, 3.7239864468574524e-05, 3.9462000131607056e-05, 4.168413579463959e-05, 4.390627145767212e-05, 4.612840712070465e-05, 4.835054278373718e-05, 5.0572678446769714e-05, 5.2794814109802246e-05, 5.501694977283478e-05, 5.723908543586731e-05, 5.946122109889984e-05, 6.168335676193237e-05, 6.39054924249649e-05, 6.612762808799744e-05, 6.834976375102997e-05, 7.05718994140625e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 11.0, 26.0, 17.0, 42.0, 65.0, 94.0, 220.0, 315.0, 593.0, 1198.0, 2434.0, 5313.0, 15129.0, 100262.0, 745527.0, 146805.0, 18738.0, 6104.0, 2751.0, 1361.0, 640.0, 389.0, 216.0, 105.0, 54.0, 38.0, 16.0, 14.0, 11.0, 10.0, 13.0, 6.0, 2.0, 1.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00913238525390625, -0.008852005004882812, -0.008571624755859375, -0.008291244506835938, -0.0080108642578125, -0.0077304840087890625, -0.007450103759765625, -0.0071697235107421875, -0.00688934326171875, -0.0066089630126953125, -0.006328582763671875, -0.0060482025146484375, -0.005767822265625, -0.0054874420166015625, -0.005207061767578125, -0.0049266815185546875, -0.00464630126953125, -0.0043659210205078125, -0.004085540771484375, -0.0038051605224609375, -0.0035247802734375, -0.0032444000244140625, -0.002964019775390625, -0.0026836395263671875, -0.00240325927734375, -0.0021228790283203125, -0.001842498779296875, -0.0015621185302734375, -0.00128173828125, -0.0010013580322265625, -0.000720977783203125, -0.0004405975341796875, -0.00016021728515625, 0.0001201629638671875, 0.000400543212890625, 0.0006809234619140625, 0.0009613037109375, 0.0012416839599609375, 0.001522064208984375, 0.0018024444580078125, 0.00208282470703125, 0.0023632049560546875, 0.002643585205078125, 0.0029239654541015625, 0.003204345703125, 0.0034847259521484375, 0.003765106201171875, 0.0040454864501953125, 0.00432586669921875, 0.0046062469482421875, 0.004886627197265625, 0.0051670074462890625, 0.0054473876953125, 0.0057277679443359375, 0.006008148193359375, 0.0062885284423828125, 0.00656890869140625, 0.0068492889404296875, 0.007129669189453125, 0.0074100494384765625, 0.0076904296875, 0.007970809936523438, 0.008251190185546875, 0.008531570434570312, 0.00881195068359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 20.0, 27.0, 25.0, 50.0, 64.0, 82.0, 123.0, 120.0, 119.0, 119.0, 73.0, 50.0, 27.0, 25.0, 13.0, 11.0, 4.0, 1.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006717681884765625, -0.006518185138702393, -0.00631868839263916, -0.006119191646575928, -0.005919694900512695, -0.005720198154449463, -0.0055207014083862305, -0.005321204662322998, -0.005121707916259766, -0.004922211170196533, -0.004722714424133301, -0.004523217678070068, -0.004323720932006836, -0.0041242241859436035, -0.003924727439880371, -0.0037252306938171387, -0.0035257339477539062, -0.003326237201690674, -0.0031267404556274414, -0.002927243709564209, -0.0027277469635009766, -0.002528250217437744, -0.0023287534713745117, -0.0021292567253112793, -0.0019297599792480469, -0.0017302632331848145, -0.001530766487121582, -0.0013312697410583496, -0.0011317729949951172, -0.0009322762489318848, -0.0007327795028686523, -0.0005332827568054199, -0.0003337860107421875, -0.00013428926467895508, 6.520748138427734e-05, 0.00026470422744750977, 0.0004642009735107422, 0.0006636977195739746, 0.000863194465637207, 0.0010626912117004395, 0.0012621879577636719, 0.0014616847038269043, 0.0016611814498901367, 0.0018606781959533691, 0.0020601749420166016, 0.002259671688079834, 0.0024591684341430664, 0.002658665180206299, 0.0028581619262695312, 0.0030576586723327637, 0.003257155418395996, 0.0034566521644592285, 0.003656148910522461, 0.0038556456565856934, 0.004055142402648926, 0.004254639148712158, 0.004454135894775391, 0.004653632640838623, 0.0048531293869018555, 0.005052626132965088, 0.00525212287902832, 0.005451619625091553, 0.005651116371154785, 0.005850613117218018, 0.00605010986328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 14.0, 321.0, 596.0, 58.0, 17.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08801757544279099, -0.07925599068403244, -0.0704943984746933, -0.06173281371593475, -0.05297122523188591, -0.04420963674783707, -0.03544805198907852, -0.02668646350502968, -0.017924875020980835, -0.009163287468254566, -0.0004016999155282974, 0.008359886705875397, 0.01712147518992424, 0.025883063673973083, 0.03464464843273163, 0.04340623691678047, 0.052167825400829315, 0.06092941388487816, 0.069691002368927, 0.07845258712768555, 0.08721417188644409, 0.09597576409578323, 0.10473734885454178, 0.11349894106388092, 0.12226052582263947, 0.131022110581398, 0.13978369534015656, 0.1485452950000763, 0.15730687975883484, 0.16606846451759338, 0.17483004927635193, 0.18359163403511047, 0.19235321879386902, 0.20111480355262756, 0.2098763883113861, 0.21863797307014465, 0.2273995727300644, 0.23616115748882294, 0.24492274224758148, 0.2536843419075012, 0.26244592666625977, 0.2712075114250183, 0.27996909618377686, 0.2887306809425354, 0.29749226570129395, 0.3062538504600525, 0.31501543521881104, 0.32377704977989197, 0.3325386047363281, 0.34130018949508667, 0.3500617742538452, 0.35882335901260376, 0.3675849437713623, 0.37634652853012085, 0.3851081132888794, 0.3938697278499603, 0.40263131260871887, 0.4113928973674774, 0.42015448212623596, 0.4289160668849945, 0.43767765164375305, 0.446439266204834, 0.45520085096359253, 0.4639624357223511, 0.4727240204811096]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 11.0, 24.0, 22.0, 33.0, 15.0, 41.0, 38.0, 42.0, 47.0, 47.0, 51.0, 51.0, 68.0, 47.0, 55.0, 53.0, 46.0, 51.0, 41.0, 34.0, 34.0, 30.0, 18.0, 20.0, 16.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0587925910949707, -0.05727876350283623, -0.05576493591070175, -0.05425110459327698, -0.0527372770011425, -0.051223449409008026, -0.04970961809158325, -0.048195790499448776, -0.0466819629073143, -0.045168135315179825, -0.04365430772304535, -0.042140476405620575, -0.0406266488134861, -0.039112821221351624, -0.03759898990392685, -0.036085162311792374, -0.0345713347196579, -0.03305750712752342, -0.03154367953538895, -0.030029848217964172, -0.028516020625829697, -0.02700219303369522, -0.025488363578915596, -0.02397453412413597, -0.022460706532001495, -0.02094687893986702, -0.019433049485087395, -0.01791922003030777, -0.016405392438173294, -0.014891563914716244, -0.013377735391259193, -0.011863906867802143, -0.010350078344345093, -0.008836249820888042, -0.007322421297430992, -0.005808592773973942, -0.0042947642505168915, -0.002780935727059841, -0.0012671072036027908, 0.0002467213198542595, 0.0017605498433113098, 0.00327437836676836, 0.0047882068902254105, 0.006302035413682461, 0.007815863937139511, 0.009329692460596561, 0.010843520984053612, 0.012357349507510662, 0.013871178030967712, 0.015385006554424763, 0.016898835077881813, 0.018412664532661438, 0.019926492124795914, 0.02144031971693039, 0.022954149171710014, 0.02446797862648964, 0.025981806218624115, 0.02749563381075859, 0.029009463265538216, 0.03052329272031784, 0.032037120312452316, 0.03355094790458679, 0.035064779222011566, 0.03657860681414604, 0.03809243440628052]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 14.0, 15.0, 36.0, 60.0, 103.0, 162.0, 305.0, 545.0, 1085.0, 3635.0, 10355.0, 877198.0, 3279855.0, 15663.0, 2881.0, 965.0, 490.0, 328.0, 190.0, 131.0, 83.0, 55.0, 41.0, 21.0, 17.0, 14.0, 9.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.02870965003967285, -0.027466297149658203, -0.026222944259643555, -0.024979591369628906, -0.023736238479614258, -0.02249288558959961, -0.02124953269958496, -0.020006179809570312, -0.018762826919555664, -0.017519474029541016, -0.016276121139526367, -0.015032768249511719, -0.01378941535949707, -0.012546062469482422, -0.011302709579467773, -0.010059356689453125, -0.008816003799438477, -0.007572650909423828, -0.00632929801940918, -0.005085945129394531, -0.003842592239379883, -0.0025992393493652344, -0.001355886459350586, -0.0001125335693359375, 0.001130819320678711, 0.0023741722106933594, 0.003617525100708008, 0.004860877990722656, 0.006104230880737305, 0.007347583770751953, 0.008590936660766602, 0.00983428955078125, 0.011077642440795898, 0.012320995330810547, 0.013564348220825195, 0.014807701110839844, 0.016051054000854492, 0.01729440689086914, 0.01853775978088379, 0.019781112670898438, 0.021024465560913086, 0.022267818450927734, 0.023511171340942383, 0.02475452423095703, 0.02599787712097168, 0.027241230010986328, 0.028484582901000977, 0.029727935791015625, 0.030971288681030273, 0.03221464157104492, 0.03345799446105957, 0.03470134735107422, 0.03594470024108887, 0.037188053131103516, 0.038431406021118164, 0.03967475891113281, 0.04091811180114746, 0.04216146469116211, 0.04340481758117676, 0.044648170471191406, 0.045891523361206055, 0.0471348762512207, 0.04837822914123535, 0.04962158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 23.0, 83.0, 168.0, 232.0, 242.0, 158.0, 67.0, 19.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.017822265625, -0.0172271728515625, -0.016632080078125, -0.0160369873046875, -0.01544189453125, -0.0148468017578125, -0.014251708984375, -0.0136566162109375, -0.0130615234375, -0.0124664306640625, -0.011871337890625, -0.0112762451171875, -0.01068115234375, -0.0100860595703125, -0.009490966796875, -0.0088958740234375, -0.00830078125, -0.0077056884765625, -0.007110595703125, -0.0065155029296875, -0.00592041015625, -0.0053253173828125, -0.004730224609375, -0.0041351318359375, -0.0035400390625, -0.0029449462890625, -0.002349853515625, -0.0017547607421875, -0.00115966796875, -0.0005645751953125, 3.0517578125e-05, 0.0006256103515625, 0.001220703125, 0.0018157958984375, 0.002410888671875, 0.0030059814453125, 0.00360107421875, 0.0041961669921875, 0.004791259765625, 0.0053863525390625, 0.0059814453125, 0.0065765380859375, 0.007171630859375, 0.0077667236328125, 0.00836181640625, 0.0089569091796875, 0.009552001953125, 0.0101470947265625, 0.0107421875, 0.0113372802734375, 0.011932373046875, 0.0125274658203125, 0.01312255859375, 0.0137176513671875, 0.014312744140625, 0.0149078369140625, 0.0155029296875, 0.0160980224609375, 0.016693115234375, 0.0172882080078125, 0.01788330078125, 0.0184783935546875, 0.019073486328125, 0.0196685791015625, 0.020263671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 3.0, 10.0, 9.0, 16.0, 18.0, 24.0, 60.0, 75.0, 110.0, 151.0, 347.0, 744.0, 2591.0, 17151.0, 2792830.0, 1362892.0, 13617.0, 2254.0, 670.0, 285.0, 151.0, 89.0, 52.0, 32.0, 26.0, 23.0, 13.0, 8.0, 9.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03533935546875, -0.03426694869995117, -0.033194541931152344, -0.032122135162353516, -0.031049728393554688, -0.02997732162475586, -0.02890491485595703, -0.027832508087158203, -0.026760101318359375, -0.025687694549560547, -0.02461528778076172, -0.02354288101196289, -0.022470474243164062, -0.021398067474365234, -0.020325660705566406, -0.019253253936767578, -0.01818084716796875, -0.017108440399169922, -0.016036033630371094, -0.014963626861572266, -0.013891220092773438, -0.01281881332397461, -0.011746406555175781, -0.010673999786376953, -0.009601593017578125, -0.008529186248779297, -0.007456779479980469, -0.006384372711181641, -0.0053119659423828125, -0.004239559173583984, -0.0031671524047851562, -0.002094745635986328, -0.0010223388671875, 5.0067901611328125e-05, 0.0011224746704101562, 0.0021948814392089844, 0.0032672882080078125, 0.004339694976806641, 0.005412101745605469, 0.006484508514404297, 0.007556915283203125, 0.008629322052001953, 0.009701728820800781, 0.01077413558959961, 0.011846542358398438, 0.012918949127197266, 0.013991355895996094, 0.015063762664794922, 0.01613616943359375, 0.017208576202392578, 0.018280982971191406, 0.019353389739990234, 0.020425796508789062, 0.02149820327758789, 0.02257061004638672, 0.023643016815185547, 0.024715423583984375, 0.025787830352783203, 0.02686023712158203, 0.02793264389038086, 0.029005050659179688, 0.030077457427978516, 0.031149864196777344, 0.03222227096557617, 0.033294677734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 10.0, 21.0, 13.0, 25.0, 25.0, 54.0, 56.0, 89.0, 111.0, 173.0, 261.0, 407.0, 621.0, 597.0, 505.0, 298.0, 223.0, 141.0, 125.0, 76.0, 53.0, 45.0, 37.0, 25.0, 21.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00888824462890625, -0.008593559265136719, -0.008298873901367188, -0.008004188537597656, -0.007709503173828125, -0.007414817810058594, -0.0071201324462890625, -0.006825447082519531, -0.00653076171875, -0.006236076354980469, -0.0059413909912109375, -0.005646705627441406, -0.005352020263671875, -0.005057334899902344, -0.0047626495361328125, -0.004467964172363281, -0.00417327880859375, -0.0038785934448242188, -0.0035839080810546875, -0.0032892227172851562, -0.002994537353515625, -0.0026998519897460938, -0.0024051666259765625, -0.0021104812622070312, -0.0018157958984375, -0.0015211105346679688, -0.0012264251708984375, -0.0009317398071289062, -0.000637054443359375, -0.00034236907958984375, -4.76837158203125e-05, 0.00024700164794921875, 0.00054168701171875, 0.0008363723754882812, 0.0011310577392578125, 0.0014257431030273438, 0.001720428466796875, 0.0020151138305664062, 0.0023097991943359375, 0.0026044845581054688, 0.002899169921875, 0.0031938552856445312, 0.0034885406494140625, 0.0037832260131835938, 0.004077911376953125, 0.004372596740722656, 0.0046672821044921875, 0.004961967468261719, 0.00525665283203125, 0.005551338195800781, 0.0058460235595703125, 0.006140708923339844, 0.006435394287109375, 0.006730079650878906, 0.0070247650146484375, 0.007319450378417969, 0.0076141357421875, 0.007908821105957031, 0.008203506469726562, 0.008498191833496094, 0.008792877197265625, 0.009087562561035156, 0.009382247924804688, 0.009676933288574219, 0.00997161865234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 27.0, 71.0, 247.0, 347.0, 192.0, 67.0, 29.0, 9.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14066481590270996, -0.13717256486415863, -0.1336803138256073, -0.13018806278705597, -0.12669581174850464, -0.12320356070995331, -0.11971130967140198, -0.11621905863285065, -0.11272680759429932, -0.10923455655574799, -0.10574230551719666, -0.10225005447864532, -0.098757803440094, -0.09526555240154266, -0.09177330136299133, -0.08828105032444, -0.08478880673646927, -0.08129655569791794, -0.07780430465936661, -0.07431205362081528, -0.07081980258226395, -0.06732755154371262, -0.06383530795574188, -0.06034305319190025, -0.05685080215334892, -0.05335855111479759, -0.04986630007624626, -0.04637405276298523, -0.0428818017244339, -0.03938955068588257, -0.03589729964733124, -0.03240504860877991, -0.02891279011964798, -0.02542053908109665, -0.02192828804254532, -0.018436038866639137, -0.014943787828087807, -0.011451536789536476, -0.007959287613630295, -0.004467036575078964, -0.0009747855365276337, 0.0025174650363624096, 0.006009715609252453, 0.009501965716481209, 0.01299421675503254, 0.01648646779358387, 0.01997871696949005, 0.023470968008041382, 0.026963219046592712, 0.030455470085144043, 0.033947721123695374, 0.037439972162246704, 0.040932223200798035, 0.044424474239349365, 0.0479167215526104, 0.05140897259116173, 0.05490122362971306, 0.05839347466826439, 0.06188572570681572, 0.06537797302007675, 0.06887022405862808, 0.07236247509717941, 0.07585472613573074, 0.07934697717428207, 0.0828392282128334]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 9.0, 8.0, 19.0, 22.0, 23.0, 38.0, 45.0, 52.0, 66.0, 78.0, 69.0, 67.0, 71.0, 65.0, 69.0, 48.0, 41.0, 45.0, 42.0, 39.0, 28.0, 17.0, 15.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046460628509521484, -0.045007091015577316, -0.04355355352163315, -0.04210001602768898, -0.04064647853374481, -0.039192941039800644, -0.037739403545856476, -0.03628586605191231, -0.03483232855796814, -0.03337879106402397, -0.0319252535700798, -0.030471716076135635, -0.029018178582191467, -0.0275646410882473, -0.02611110359430313, -0.024657566100358963, -0.023204028606414795, -0.021750491112470627, -0.02029695361852646, -0.01884341612458229, -0.017389878630638123, -0.015936341136693954, -0.014482803642749786, -0.013029266148805618, -0.01157572865486145, -0.010122191160917282, -0.008668653666973114, -0.007215116173028946, -0.005761578679084778, -0.00430804118514061, -0.0028545036911964417, -0.0014009661972522736, 5.257129669189453e-05, 0.0015061087906360626, 0.0029596462845802307, 0.004413183778524399, 0.005866721272468567, 0.007320258766412735, 0.008773796260356903, 0.010227333754301071, 0.01168087124824524, 0.013134408742189407, 0.014587946236133575, 0.016041483730077744, 0.01749502122402191, 0.01894855871796608, 0.020402096211910248, 0.021855633705854416, 0.023309171199798584, 0.024762708693742752, 0.02621624618768692, 0.027669783681631088, 0.029123321175575256, 0.030576858669519424, 0.03203039616346359, 0.03348393365740776, 0.03493747115135193, 0.0363910086452961, 0.037844546139240265, 0.03929808363318443, 0.0407516211271286, 0.04220515862107277, 0.04365869611501694, 0.045112233608961105, 0.04656577110290527]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 16.0, 2.0, 8.0, 11.0, 16.0, 17.0, 26.0, 24.0, 40.0, 50.0, 73.0, 101.0, 122.0, 180.0, 235.0, 303.0, 439.0, 641.0, 1030.0, 2527.0, 13713.0, 277570.0, 709128.0, 34325.0, 3989.0, 1302.0, 720.0, 540.0, 352.0, 234.0, 215.0, 150.0, 104.0, 86.0, 68.0, 53.0, 36.0, 24.0, 21.0, 14.0, 10.0, 12.0, 11.0, 10.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04833984375, -0.047003746032714844, -0.04566764831542969, -0.04433155059814453, -0.042995452880859375, -0.04165935516357422, -0.04032325744628906, -0.038987159729003906, -0.03765106201171875, -0.036314964294433594, -0.03497886657714844, -0.03364276885986328, -0.032306671142578125, -0.03097057342529297, -0.029634475708007812, -0.028298377990722656, -0.0269622802734375, -0.025626182556152344, -0.024290084838867188, -0.02295398712158203, -0.021617889404296875, -0.02028179168701172, -0.018945693969726562, -0.017609596252441406, -0.01627349853515625, -0.014937400817871094, -0.013601303100585938, -0.012265205383300781, -0.010929107666015625, -0.009593009948730469, -0.008256912231445312, -0.006920814514160156, -0.005584716796875, -0.004248619079589844, -0.0029125213623046875, -0.0015764236450195312, -0.000240325927734375, 0.0010957717895507812, 0.0024318695068359375, 0.0037679672241210938, 0.00510406494140625, 0.006440162658691406, 0.0077762603759765625, 0.009112358093261719, 0.010448455810546875, 0.011784553527832031, 0.013120651245117188, 0.014456748962402344, 0.0157928466796875, 0.017128944396972656, 0.018465042114257812, 0.01980113983154297, 0.021137237548828125, 0.02247333526611328, 0.023809432983398438, 0.025145530700683594, 0.02648162841796875, 0.027817726135253906, 0.029153823852539062, 0.03048992156982422, 0.031826019287109375, 0.03316211700439453, 0.03449821472167969, 0.035834312438964844, 0.03717041015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 19.0, 74.0, 193.0, 246.0, 257.0, 154.0, 35.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017822265625, -0.017203807830810547, -0.016585350036621094, -0.01596689224243164, -0.015348434448242188, -0.014729976654052734, -0.014111518859863281, -0.013493061065673828, -0.012874603271484375, -0.012256145477294922, -0.011637687683105469, -0.011019229888916016, -0.010400772094726562, -0.00978231430053711, -0.009163856506347656, -0.008545398712158203, -0.00792694091796875, -0.007308483123779297, -0.006690025329589844, -0.006071567535400391, -0.0054531097412109375, -0.004834651947021484, -0.004216194152832031, -0.003597736358642578, -0.002979278564453125, -0.002360820770263672, -0.0017423629760742188, -0.0011239051818847656, -0.0005054473876953125, 0.00011301040649414062, 0.0007314682006835938, 0.0013499259948730469, 0.0019683837890625, 0.002586841583251953, 0.0032052993774414062, 0.0038237571716308594, 0.0044422149658203125, 0.005060672760009766, 0.005679130554199219, 0.006297588348388672, 0.006916046142578125, 0.007534503936767578, 0.008152961730957031, 0.008771419525146484, 0.009389877319335938, 0.01000833511352539, 0.010626792907714844, 0.011245250701904297, 0.01186370849609375, 0.012482166290283203, 0.013100624084472656, 0.01371908187866211, 0.014337539672851562, 0.014955997467041016, 0.015574455261230469, 0.016192913055419922, 0.016811370849609375, 0.017429828643798828, 0.01804828643798828, 0.018666744232177734, 0.019285202026367188, 0.01990365982055664, 0.020522117614746094, 0.021140575408935547, 0.021759033203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 4.0, 4.0, 10.0, 13.0, 14.0, 11.0, 22.0, 37.0, 37.0, 53.0, 97.0, 120.0, 207.0, 293.0, 489.0, 764.0, 1500.0, 3957.0, 15112.0, 97306.0, 629217.0, 256204.0, 31643.0, 6627.0, 2232.0, 932.0, 549.0, 356.0, 220.0, 146.0, 109.0, 70.0, 59.0, 41.0, 26.0, 21.0, 16.0, 9.0, 11.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024017333984375, -0.023209095001220703, -0.022400856018066406, -0.02159261703491211, -0.020784378051757812, -0.019976139068603516, -0.01916790008544922, -0.018359661102294922, -0.017551422119140625, -0.016743183135986328, -0.01593494415283203, -0.015126705169677734, -0.014318466186523438, -0.01351022720336914, -0.012701988220214844, -0.011893749237060547, -0.01108551025390625, -0.010277271270751953, -0.009469032287597656, -0.00866079330444336, -0.007852554321289062, -0.007044315338134766, -0.006236076354980469, -0.005427837371826172, -0.004619598388671875, -0.003811359405517578, -0.0030031204223632812, -0.0021948814392089844, -0.0013866424560546875, -0.0005784034729003906, 0.00022983551025390625, 0.0010380744934082031, 0.0018463134765625, 0.002654552459716797, 0.0034627914428710938, 0.004271030426025391, 0.0050792694091796875, 0.005887508392333984, 0.006695747375488281, 0.007503986358642578, 0.008312225341796875, 0.009120464324951172, 0.009928703308105469, 0.010736942291259766, 0.011545181274414062, 0.01235342025756836, 0.013161659240722656, 0.013969898223876953, 0.01477813720703125, 0.015586376190185547, 0.016394615173339844, 0.01720285415649414, 0.018011093139648438, 0.018819332122802734, 0.01962757110595703, 0.020435810089111328, 0.021244049072265625, 0.022052288055419922, 0.02286052703857422, 0.023668766021728516, 0.024477005004882812, 0.02528524398803711, 0.026093482971191406, 0.026901721954345703, 0.0277099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 13.0, 10.0, 7.0, 11.0, 9.0, 20.0, 17.0, 18.0, 27.0, 25.0, 33.0, 25.0, 30.0, 40.0, 52.0, 45.0, 44.0, 40.0, 41.0, 38.0, 37.0, 28.0, 40.0, 34.0, 35.0, 45.0, 31.0, 25.0, 34.0, 22.0, 14.0, 22.0, 17.0, 12.0, 12.0, 7.0, 10.0, 2.0, 11.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01218414306640625, -0.011808991432189941, -0.011433839797973633, -0.011058688163757324, -0.010683536529541016, -0.010308384895324707, -0.009933233261108398, -0.00955808162689209, -0.009182929992675781, -0.008807778358459473, -0.008432626724243164, -0.008057475090026855, -0.007682323455810547, -0.007307171821594238, -0.00693202018737793, -0.006556868553161621, -0.0061817169189453125, -0.005806565284729004, -0.005431413650512695, -0.005056262016296387, -0.004681110382080078, -0.0043059587478637695, -0.003930807113647461, -0.0035556554794311523, -0.0031805038452148438, -0.002805352210998535, -0.0024302005767822266, -0.002055048942565918, -0.0016798973083496094, -0.0013047456741333008, -0.0009295940399169922, -0.0005544424057006836, -0.000179290771484375, 0.0001958608627319336, 0.0005710124969482422, 0.0009461641311645508, 0.0013213157653808594, 0.001696467399597168, 0.0020716190338134766, 0.002446770668029785, 0.0028219223022460938, 0.0031970739364624023, 0.003572225570678711, 0.0039473772048950195, 0.004322528839111328, 0.004697680473327637, 0.005072832107543945, 0.005447983741760254, 0.0058231353759765625, 0.006198287010192871, 0.00657343864440918, 0.006948590278625488, 0.007323741912841797, 0.0076988935470581055, 0.008074045181274414, 0.008449196815490723, 0.008824348449707031, 0.00919950008392334, 0.009574651718139648, 0.009949803352355957, 0.010324954986572266, 0.010700106620788574, 0.011075258255004883, 0.011450409889221191, 0.0118255615234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 19.0, 22.0, 31.0, 44.0, 68.0, 145.0, 225.0, 409.0, 967.0, 2505.0, 8571.0, 42659.0, 560637.0, 388645.0, 32633.0, 7108.0, 2125.0, 852.0, 368.0, 202.0, 102.0, 53.0, 41.0, 25.0, 26.0, 10.0, 13.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01122283935546875, -0.010820984840393066, -0.010419130325317383, -0.0100172758102417, -0.009615421295166016, -0.009213566780090332, -0.008811712265014648, -0.008409857749938965, -0.008008003234863281, -0.007606148719787598, -0.007204294204711914, -0.0068024396896362305, -0.006400585174560547, -0.005998730659484863, -0.00559687614440918, -0.005195021629333496, -0.0047931671142578125, -0.004391312599182129, -0.003989458084106445, -0.0035876035690307617, -0.003185749053955078, -0.0027838945388793945, -0.002382040023803711, -0.0019801855087280273, -0.0015783309936523438, -0.0011764764785766602, -0.0007746219635009766, -0.00037276744842529297, 2.9087066650390625e-05, 0.0004309415817260742, 0.0008327960968017578, 0.0012346506118774414, 0.001636505126953125, 0.0020383596420288086, 0.002440214157104492, 0.0028420686721801758, 0.0032439231872558594, 0.003645777702331543, 0.0040476322174072266, 0.00444948673248291, 0.004851341247558594, 0.005253195762634277, 0.005655050277709961, 0.0060569047927856445, 0.006458759307861328, 0.006860613822937012, 0.007262468338012695, 0.007664322853088379, 0.008066177368164062, 0.008468031883239746, 0.00886988639831543, 0.009271740913391113, 0.009673595428466797, 0.01007544994354248, 0.010477304458618164, 0.010879158973693848, 0.011281013488769531, 0.011682868003845215, 0.012084722518920898, 0.012486577033996582, 0.012888431549072266, 0.01329028606414795, 0.013692140579223633, 0.014093995094299316, 0.014495849609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 2.0, 4.0, 8.0, 7.0, 18.0, 15.0, 25.0, 40.0, 28.0, 56.0, 73.0, 88.0, 111.0, 102.0, 90.0, 77.0, 58.0, 45.0, 34.0, 34.0, 23.0, 15.0, 14.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0], "bins": [-0.00015151500701904297, -0.00014815572649240494, -0.0001447964459657669, -0.00014143716543912888, -0.00013807788491249084, -0.00013471860438585281, -0.00013135932385921478, -0.00012800004333257675, -0.00012464076280593872, -0.00012128148227930069, -0.00011792220175266266, -0.00011456292122602463, -0.0001112036406993866, -0.00010784436017274857, -0.00010448507964611053, -0.0001011257991194725, -9.776651859283447e-05, -9.440723806619644e-05, -9.104795753955841e-05, -8.768867701292038e-05, -8.432939648628235e-05, -8.097011595964432e-05, -7.761083543300629e-05, -7.425155490636826e-05, -7.089227437973022e-05, -6.75329938530922e-05, -6.417371332645416e-05, -6.081443279981613e-05, -5.74551522731781e-05, -5.409587174654007e-05, -5.073659121990204e-05, -4.737731069326401e-05, -4.4018030166625977e-05, -4.0658749639987946e-05, -3.7299469113349915e-05, -3.3940188586711884e-05, -3.058090806007385e-05, -2.722162753343582e-05, -2.386234700679779e-05, -2.050306648015976e-05, -1.714378595352173e-05, -1.3784505426883698e-05, -1.0425224900245667e-05, -7.0659443736076355e-06, -3.7066638469696045e-06, -3.473833203315735e-07, 3.0118972063064575e-06, 6.3711777329444885e-06, 9.73045825958252e-06, 1.308973878622055e-05, 1.644901931285858e-05, 1.9808299839496613e-05, 2.3167580366134644e-05, 2.6526860892772675e-05, 2.9886141419410706e-05, 3.3245421946048737e-05, 3.660470247268677e-05, 3.99639829993248e-05, 4.332326352596283e-05, 4.668254405260086e-05, 5.004182457923889e-05, 5.340110510587692e-05, 5.6760385632514954e-05, 6.0119666159152985e-05, 6.347894668579102e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 10.0, 9.0, 16.0, 17.0, 28.0, 33.0, 36.0, 64.0, 92.0, 135.0, 218.0, 508.0, 1497.0, 6852.0, 60354.0, 877746.0, 88860.0, 8861.0, 1808.0, 592.0, 299.0, 163.0, 105.0, 72.0, 48.0, 31.0, 24.0, 19.0, 11.0, 8.0, 7.0, 8.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016265869140625, -0.015781283378601074, -0.015296697616577148, -0.014812111854553223, -0.014327526092529297, -0.013842940330505371, -0.013358354568481445, -0.01287376880645752, -0.012389183044433594, -0.011904597282409668, -0.011420011520385742, -0.010935425758361816, -0.01045083999633789, -0.009966254234313965, -0.009481668472290039, -0.008997082710266113, -0.008512496948242188, -0.008027911186218262, -0.007543325424194336, -0.00705873966217041, -0.006574153900146484, -0.006089568138122559, -0.005604982376098633, -0.005120396614074707, -0.004635810852050781, -0.0041512250900268555, -0.0036666393280029297, -0.003182053565979004, -0.002697467803955078, -0.0022128820419311523, -0.0017282962799072266, -0.0012437105178833008, -0.000759124755859375, -0.0002745389938354492, 0.00021004676818847656, 0.0006946325302124023, 0.0011792182922363281, 0.001663804054260254, 0.0021483898162841797, 0.0026329755783081055, 0.0031175613403320312, 0.003602147102355957, 0.004086732864379883, 0.004571318626403809, 0.005055904388427734, 0.00554049015045166, 0.006025075912475586, 0.006509661674499512, 0.0069942474365234375, 0.007478833198547363, 0.007963418960571289, 0.008448004722595215, 0.00893259048461914, 0.009417176246643066, 0.009901762008666992, 0.010386347770690918, 0.010870933532714844, 0.01135551929473877, 0.011840105056762695, 0.012324690818786621, 0.012809276580810547, 0.013293862342834473, 0.013778448104858398, 0.014263033866882324, 0.01474761962890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 8.0, 5.0, 6.0, 15.0, 13.0, 14.0, 16.0, 32.0, 33.0, 48.0, 65.0, 110.0, 123.0, 144.0, 108.0, 68.0, 50.0, 33.0, 20.0, 12.0, 11.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00505828857421875, -0.004864096641540527, -0.004669904708862305, -0.004475712776184082, -0.004281520843505859, -0.004087328910827637, -0.003893136978149414, -0.0036989450454711914, -0.0035047531127929688, -0.003310561180114746, -0.0031163692474365234, -0.0029221773147583008, -0.002727985382080078, -0.0025337934494018555, -0.002339601516723633, -0.00214540958404541, -0.0019512176513671875, -0.0017570257186889648, -0.0015628337860107422, -0.0013686418533325195, -0.0011744499206542969, -0.0009802579879760742, -0.0007860660552978516, -0.0005918741226196289, -0.00039768218994140625, -0.0002034902572631836, -9.298324584960938e-06, 0.00018489360809326172, 0.0003790855407714844, 0.000573277473449707, 0.0007674694061279297, 0.0009616613388061523, 0.001155853271484375, 0.0013500452041625977, 0.0015442371368408203, 0.001738429069519043, 0.0019326210021972656, 0.0021268129348754883, 0.002321004867553711, 0.0025151968002319336, 0.0027093887329101562, 0.002903580665588379, 0.0030977725982666016, 0.0032919645309448242, 0.003486156463623047, 0.0036803483963012695, 0.003874540328979492, 0.004068732261657715, 0.0042629241943359375, 0.00445711612701416, 0.004651308059692383, 0.0048454999923706055, 0.005039691925048828, 0.005233883857727051, 0.0054280757904052734, 0.005622267723083496, 0.005816459655761719, 0.006010651588439941, 0.006204843521118164, 0.006399035453796387, 0.006593227386474609, 0.006787419319152832, 0.006981611251831055, 0.007175803184509277, 0.0073699951171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 31.0, 384.0, 513.0, 57.0, 11.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27292537689208984, -0.2628140151500702, -0.25270265340805054, -0.2425912618637085, -0.23247990012168884, -0.2223685383796692, -0.21225716173648834, -0.2021457850933075, -0.19203442335128784, -0.1819230616092682, -0.17181168496608734, -0.1617003083229065, -0.15158894658088684, -0.1414775848388672, -0.13136620819568634, -0.12125483900308609, -0.11114346981048584, -0.10103210061788559, -0.09092073142528534, -0.08080936223268509, -0.07069799304008484, -0.06058662384748459, -0.05047525465488434, -0.04036388546228409, -0.030252516269683838, -0.020141147077083588, -0.010029777884483337, 8.159130811691284e-05, 0.010192960500717163, 0.020304329693317413, 0.030415698885917664, 0.040527068078517914, 0.050638437271118164, 0.060749806463718414, 0.07086117565631866, 0.08097254484891891, 0.09108391404151917, 0.10119528323411942, 0.11130665242671967, 0.12141802161931992, 0.13152939081192017, 0.14164075255393982, 0.15175212919712067, 0.1618635058403015, 0.17197486758232117, 0.18208622932434082, 0.19219760596752167, 0.20230898261070251, 0.21242034435272217, 0.22253170609474182, 0.23264308273792267, 0.24275445938110352, 0.25286582112312317, 0.2629771828651428, 0.27308857440948486, 0.2831999361515045, 0.29331129789352417, 0.3034226596355438, 0.3135340213775635, 0.3236454129219055, 0.33375677466392517, 0.3438681364059448, 0.35397952795028687, 0.3640908896923065, 0.37420225143432617]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 6.0, 9.0, 8.0, 12.0, 14.0, 20.0, 26.0, 27.0, 28.0, 38.0, 30.0, 46.0, 36.0, 49.0, 51.0, 60.0, 63.0, 56.0, 50.0, 48.0, 53.0, 50.0, 43.0, 36.0, 37.0, 35.0, 16.0, 14.0, 10.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06178915500640869, -0.05994928628206253, -0.05810941383242607, -0.05626954138278961, -0.05442967265844345, -0.05258980393409729, -0.05074993148446083, -0.04891005903482437, -0.04707019031047821, -0.04523032158613205, -0.04339044913649559, -0.04155057668685913, -0.03971070796251297, -0.03787083923816681, -0.03603096678853035, -0.03419109433889389, -0.03235122561454773, -0.03051135502755642, -0.02867148444056511, -0.0268316138535738, -0.02499174326658249, -0.02315187267959118, -0.02131200209259987, -0.01947213150560856, -0.01763226091861725, -0.01579239033162594, -0.013952519744634628, -0.012112649157643318, -0.010272778570652008, -0.008432907983660698, -0.006593037396669388, -0.004753166809678078, -0.0029132962226867676, -0.0010734256356954575, 0.0007664449512958527, 0.0026063155382871628, 0.004446186125278473, 0.006286056712269783, 0.008125927299261093, 0.009965797886252403, 0.011805668473243713, 0.013645539060235023, 0.015485409647226334, 0.017325280234217644, 0.019165150821208954, 0.021005021408200264, 0.022844891995191574, 0.024684762582182884, 0.026524633169174194, 0.028364503756165504, 0.030204374343156815, 0.032044246792793274, 0.033884115517139435, 0.035723984241485596, 0.037563856691122055, 0.039403729140758514, 0.041243597865104675, 0.043083466589450836, 0.044923339039087296, 0.046763211488723755, 0.048603080213069916, 0.05044294893741608, 0.052282821387052536, 0.054122693836688995, 0.055962562561035156]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 13.0, 18.0, 22.0, 23.0, 43.0, 52.0, 98.0, 135.0, 204.0, 350.0, 529.0, 1251.0, 3119.0, 5223.0, 22479.0, 2291070.0, 1836239.0, 24562.0, 4886.0, 1889.0, 748.0, 382.0, 273.0, 193.0, 140.0, 93.0, 55.0, 45.0, 28.0, 23.0, 24.0, 16.0, 16.0, 6.0, 5.0, 2.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252838134765625, -0.02449321746826172, -0.023702621459960938, -0.022912025451660156, -0.022121429443359375, -0.021330833435058594, -0.020540237426757812, -0.01974964141845703, -0.01895904541015625, -0.01816844940185547, -0.017377853393554688, -0.016587257385253906, -0.015796661376953125, -0.015006065368652344, -0.014215469360351562, -0.013424873352050781, -0.01263427734375, -0.011843681335449219, -0.011053085327148438, -0.010262489318847656, -0.009471893310546875, -0.008681297302246094, -0.007890701293945312, -0.007100105285644531, -0.00630950927734375, -0.005518913269042969, -0.0047283172607421875, -0.003937721252441406, -0.003147125244140625, -0.0023565292358398438, -0.0015659332275390625, -0.0007753372192382812, 1.52587890625e-05, 0.0008058547973632812, 0.0015964508056640625, 0.0023870468139648438, 0.003177642822265625, 0.003968238830566406, 0.0047588348388671875, 0.005549430847167969, 0.00634002685546875, 0.007130622863769531, 0.007921218872070312, 0.008711814880371094, 0.009502410888671875, 0.010293006896972656, 0.011083602905273438, 0.011874198913574219, 0.012664794921875, 0.013455390930175781, 0.014245986938476562, 0.015036582946777344, 0.015827178955078125, 0.016617774963378906, 0.017408370971679688, 0.01819896697998047, 0.01898956298828125, 0.01978015899658203, 0.020570755004882812, 0.021361351013183594, 0.022151947021484375, 0.022942543029785156, 0.023733139038085938, 0.02452373504638672, 0.0253143310546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 38.0, 105.0, 187.0, 244.0, 225.0, 129.0, 41.0, 15.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.01784038543701172, -0.017217636108398438, -0.016594886779785156, -0.015972137451171875, -0.015349388122558594, -0.014726638793945312, -0.014103889465332031, -0.01348114013671875, -0.012858390808105469, -0.012235641479492188, -0.011612892150878906, -0.010990142822265625, -0.010367393493652344, -0.009744644165039062, -0.009121894836425781, -0.0084991455078125, -0.007876396179199219, -0.0072536468505859375, -0.006630897521972656, -0.006008148193359375, -0.005385398864746094, -0.0047626495361328125, -0.004139900207519531, -0.00351715087890625, -0.0028944015502929688, -0.0022716522216796875, -0.0016489028930664062, -0.001026153564453125, -0.00040340423583984375, 0.0002193450927734375, 0.0008420944213867188, 0.00146484375, 0.0020875930786132812, 0.0027103424072265625, 0.0033330917358398438, 0.003955841064453125, 0.004578590393066406, 0.0052013397216796875, 0.005824089050292969, 0.00644683837890625, 0.007069587707519531, 0.0076923370361328125, 0.008315086364746094, 0.008937835693359375, 0.009560585021972656, 0.010183334350585938, 0.010806083679199219, 0.0114288330078125, 0.012051582336425781, 0.012674331665039062, 0.013297080993652344, 0.013919830322265625, 0.014542579650878906, 0.015165328979492188, 0.01578807830810547, 0.01641082763671875, 0.01703357696533203, 0.017656326293945312, 0.018279075622558594, 0.018901824951171875, 0.019524574279785156, 0.020147323608398438, 0.02077007293701172, 0.021392822265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 14.0, 16.0, 9.0, 21.0, 36.0, 49.0, 87.0, 159.0, 282.0, 735.0, 2084.0, 9501.0, 116151.0, 3898505.0, 151940.0, 10989.0, 2273.0, 733.0, 288.0, 148.0, 88.0, 61.0, 38.0, 15.0, 16.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0237884521484375, -0.023034095764160156, -0.022279739379882812, -0.02152538299560547, -0.020771026611328125, -0.02001667022705078, -0.019262313842773438, -0.018507957458496094, -0.01775360107421875, -0.016999244689941406, -0.016244888305664062, -0.015490531921386719, -0.014736175537109375, -0.013981819152832031, -0.013227462768554688, -0.012473106384277344, -0.01171875, -0.010964393615722656, -0.010210037231445312, -0.009455680847167969, -0.008701324462890625, -0.007946968078613281, -0.0071926116943359375, -0.006438255310058594, -0.00568389892578125, -0.004929542541503906, -0.0041751861572265625, -0.0034208297729492188, -0.002666473388671875, -0.0019121170043945312, -0.0011577606201171875, -0.00040340423583984375, 0.0003509521484375, 0.0011053085327148438, 0.0018596649169921875, 0.0026140213012695312, 0.003368377685546875, 0.004122734069824219, 0.0048770904541015625, 0.005631446838378906, 0.00638580322265625, 0.007140159606933594, 0.007894515991210938, 0.008648872375488281, 0.009403228759765625, 0.010157585144042969, 0.010911941528320312, 0.011666297912597656, 0.012420654296875, 0.013175010681152344, 0.013929367065429688, 0.014683723449707031, 0.015438079833984375, 0.01619243621826172, 0.016946792602539062, 0.017701148986816406, 0.01845550537109375, 0.019209861755371094, 0.019964218139648438, 0.02071857452392578, 0.021472930908203125, 0.02222728729248047, 0.022981643676757812, 0.023736000061035156, 0.0244903564453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 10.0, 13.0, 24.0, 13.0, 26.0, 36.0, 49.0, 68.0, 90.0, 123.0, 248.0, 436.0, 807.0, 734.0, 499.0, 270.0, 166.0, 115.0, 80.0, 77.0, 34.0, 31.0, 23.0, 26.0, 12.0, 13.0, 10.0, 3.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00994873046875, -0.009656786918640137, -0.009364843368530273, -0.00907289981842041, -0.008780956268310547, -0.008489012718200684, -0.00819706916809082, -0.007905125617980957, -0.007613182067871094, -0.0073212385177612305, -0.007029294967651367, -0.006737351417541504, -0.006445407867431641, -0.006153464317321777, -0.005861520767211914, -0.005569577217102051, -0.0052776336669921875, -0.004985690116882324, -0.004693746566772461, -0.004401803016662598, -0.004109859466552734, -0.003817915916442871, -0.003525972366333008, -0.0032340288162231445, -0.0029420852661132812, -0.002650141716003418, -0.0023581981658935547, -0.0020662546157836914, -0.0017743110656738281, -0.0014823675155639648, -0.0011904239654541016, -0.0008984804153442383, -0.000606536865234375, -0.0003145933151245117, -2.2649765014648438e-05, 0.00026929378509521484, 0.0005612373352050781, 0.0008531808853149414, 0.0011451244354248047, 0.001437067985534668, 0.0017290115356445312, 0.0020209550857543945, 0.002312898635864258, 0.002604842185974121, 0.0028967857360839844, 0.0031887292861938477, 0.003480672836303711, 0.0037726163864135742, 0.0040645599365234375, 0.004356503486633301, 0.004648447036743164, 0.004940390586853027, 0.005232334136962891, 0.005524277687072754, 0.005816221237182617, 0.0061081647872924805, 0.006400108337402344, 0.006692051887512207, 0.00698399543762207, 0.007275938987731934, 0.007567882537841797, 0.00785982608795166, 0.008151769638061523, 0.008443713188171387, 0.00873565673828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 12.0, 35.0, 219.0, 453.0, 227.0, 41.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1722070723772049, -0.16772635281085968, -0.16324561834335327, -0.15876489877700806, -0.15428416430950165, -0.14980344474315643, -0.14532271027565002, -0.1408419907093048, -0.1363612711429596, -0.13188055157661438, -0.12739981710910797, -0.12291909009218216, -0.11843836307525635, -0.11395764350891113, -0.10947691649198532, -0.10499618947505951, -0.1005154550075531, -0.09603472799062729, -0.09155400097370148, -0.08707327395677567, -0.08259254693984985, -0.07811182737350464, -0.07363110035657883, -0.06915037333965302, -0.0646696463227272, -0.06018891930580139, -0.05570819228887558, -0.051227468997240067, -0.046746741980314255, -0.04226601496338844, -0.03778529167175293, -0.03330456465482712, -0.028823837637901306, -0.024343110620975494, -0.019862385466694832, -0.015381659381091595, -0.010900933295488358, -0.006420206278562546, -0.0019394811242818832, 0.0025412440299987793, 0.007021971046924591, 0.011502697132527828, 0.015983423218131065, 0.020464148372411728, 0.02494487538933754, 0.02942560240626335, 0.033906325697898865, 0.038387052714824677, 0.04286777973175049, 0.0473485067486763, 0.05182923376560211, 0.056309957057237625, 0.06079068407416344, 0.06527140736579895, 0.06975213438272476, 0.07423286139965057, 0.07871358841657639, 0.0831943154335022, 0.08767504245042801, 0.09215576946735382, 0.09663648903369904, 0.10111722350120544, 0.10559794306755066, 0.11007867008447647, 0.11455939710140228]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 17.0, 24.0, 34.0, 33.0, 62.0, 44.0, 58.0, 68.0, 63.0, 61.0, 72.0, 78.0, 50.0, 58.0, 50.0, 43.0, 31.0, 28.0, 29.0, 15.0, 23.0, 8.0, 11.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0522761344909668, -0.05100224167108536, -0.04972834885120392, -0.04845445230603218, -0.04718055948615074, -0.0459066666662693, -0.044632770121097565, -0.043358877301216125, -0.042084984481334686, -0.04081109166145325, -0.03953719884157181, -0.03826330229640007, -0.03698940947651863, -0.03571551665663719, -0.034441620111465454, -0.033167727291584015, -0.031893834471702576, -0.030619941651821136, -0.029346046969294548, -0.02807215228676796, -0.02679825946688652, -0.02552436664700508, -0.024250471964478493, -0.022976577281951904, -0.021702684462070465, -0.020428791642189026, -0.019154896959662437, -0.01788100227713585, -0.01660710945725441, -0.015333215706050396, -0.014059321954846382, -0.012785428203642368, -0.011511534452438354, -0.01023764070123434, -0.008963746950030327, -0.007689853198826313, -0.006415959447622299, -0.005142065696418285, -0.0038681719452142715, -0.0025942781940102577, -0.001320384442806244, -4.649069160223007e-05, 0.0012274030596017838, 0.0025012968108057976, 0.0037751905620098114, 0.005049084313213825, 0.006322978064417839, 0.007596871815621853, 0.008870765566825867, 0.01014465931802988, 0.011418553069233894, 0.012692446820437908, 0.013966340571641922, 0.015240234322845936, 0.01651412807404995, 0.017788022756576538, 0.019061915576457977, 0.020335808396339417, 0.021609703078866005, 0.022883597761392593, 0.024157490581274033, 0.025431383401155472, 0.02670527808368206, 0.02797917276620865, 0.029253065586090088]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 21.0, 11.0, 29.0, 17.0, 38.0, 53.0, 49.0, 87.0, 106.0, 156.0, 193.0, 292.0, 431.0, 834.0, 1953.0, 9212.0, 259234.0, 750668.0, 19416.0, 2860.0, 1100.0, 568.0, 345.0, 224.0, 145.0, 123.0, 107.0, 70.0, 53.0, 30.0, 26.0, 21.0, 11.0, 11.0, 11.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.037200927734375, -0.036006927490234375, -0.03481292724609375, -0.033618927001953125, -0.0324249267578125, -0.031230926513671875, -0.03003692626953125, -0.028842926025390625, -0.02764892578125, -0.026454925537109375, -0.02526092529296875, -0.024066925048828125, -0.0228729248046875, -0.021678924560546875, -0.02048492431640625, -0.019290924072265625, -0.018096923828125, -0.016902923583984375, -0.01570892333984375, -0.014514923095703125, -0.0133209228515625, -0.012126922607421875, -0.01093292236328125, -0.009738922119140625, -0.008544921875, -0.007350921630859375, -0.00615692138671875, -0.004962921142578125, -0.0037689208984375, -0.002574920654296875, -0.00138092041015625, -0.000186920166015625, 0.001007080078125, 0.002201080322265625, 0.00339508056640625, 0.004589080810546875, 0.0057830810546875, 0.006977081298828125, 0.00817108154296875, 0.009365081787109375, 0.01055908203125, 0.011753082275390625, 0.01294708251953125, 0.014141082763671875, 0.0153350830078125, 0.016529083251953125, 0.01772308349609375, 0.018917083740234375, 0.020111083984375, 0.021305084228515625, 0.02249908447265625, 0.023693084716796875, 0.0248870849609375, 0.026081085205078125, 0.02727508544921875, 0.028469085693359375, 0.0296630859375, 0.030857086181640625, 0.03205108642578125, 0.033245086669921875, 0.0344390869140625, 0.035633087158203125, 0.03682708740234375, 0.038021087646484375, 0.039215087890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 26.0, 81.0, 176.0, 244.0, 228.0, 158.0, 55.0, 18.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180511474609375, -0.01742696762084961, -0.01680278778076172, -0.016178607940673828, -0.015554428100585938, -0.014930248260498047, -0.014306068420410156, -0.013681888580322266, -0.013057708740234375, -0.012433528900146484, -0.011809349060058594, -0.011185169219970703, -0.010560989379882812, -0.009936809539794922, -0.009312629699707031, -0.00868844985961914, -0.00806427001953125, -0.007440090179443359, -0.006815910339355469, -0.006191730499267578, -0.0055675506591796875, -0.004943370819091797, -0.004319190979003906, -0.0036950111389160156, -0.003070831298828125, -0.0024466514587402344, -0.0018224716186523438, -0.0011982917785644531, -0.0005741119384765625, 5.0067901611328125e-05, 0.0006742477416992188, 0.0012984275817871094, 0.001922607421875, 0.0025467872619628906, 0.0031709671020507812, 0.003795146942138672, 0.0044193267822265625, 0.005043506622314453, 0.005667686462402344, 0.006291866302490234, 0.006916046142578125, 0.007540225982666016, 0.008164405822753906, 0.008788585662841797, 0.009412765502929688, 0.010036945343017578, 0.010661125183105469, 0.01128530502319336, 0.01190948486328125, 0.01253366470336914, 0.013157844543457031, 0.013782024383544922, 0.014406204223632812, 0.015030384063720703, 0.015654563903808594, 0.016278743743896484, 0.016902923583984375, 0.017527103424072266, 0.018151283264160156, 0.018775463104248047, 0.019399642944335938, 0.020023822784423828, 0.02064800262451172, 0.02127218246459961, 0.0218963623046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 10.0, 7.0, 13.0, 20.0, 38.0, 50.0, 51.0, 74.0, 137.0, 235.0, 368.0, 815.0, 2529.0, 13518.0, 267276.0, 723911.0, 32824.0, 4256.0, 1182.0, 503.0, 273.0, 158.0, 103.0, 69.0, 39.0, 26.0, 15.0, 9.0, 10.0, 8.0, 2.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0307464599609375, -0.02979111671447754, -0.028835773468017578, -0.027880430221557617, -0.026925086975097656, -0.025969743728637695, -0.025014400482177734, -0.024059057235717773, -0.023103713989257812, -0.02214837074279785, -0.02119302749633789, -0.02023768424987793, -0.01928234100341797, -0.018326997756958008, -0.017371654510498047, -0.016416311264038086, -0.015460968017578125, -0.014505624771118164, -0.013550281524658203, -0.012594938278198242, -0.011639595031738281, -0.01068425178527832, -0.00972890853881836, -0.008773565292358398, -0.007818222045898438, -0.0068628787994384766, -0.005907535552978516, -0.004952192306518555, -0.003996849060058594, -0.003041505813598633, -0.002086162567138672, -0.001130819320678711, -0.00017547607421875, 0.0007798671722412109, 0.0017352104187011719, 0.002690553665161133, 0.0036458969116210938, 0.004601240158081055, 0.005556583404541016, 0.0065119266510009766, 0.0074672698974609375, 0.008422613143920898, 0.00937795639038086, 0.01033329963684082, 0.011288642883300781, 0.012243986129760742, 0.013199329376220703, 0.014154672622680664, 0.015110015869140625, 0.016065359115600586, 0.017020702362060547, 0.017976045608520508, 0.01893138885498047, 0.01988673210144043, 0.02084207534790039, 0.02179741859436035, 0.022752761840820312, 0.023708105087280273, 0.024663448333740234, 0.025618791580200195, 0.026574134826660156, 0.027529478073120117, 0.028484821319580078, 0.02944016456604004, 0.0303955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 2.0, 12.0, 8.0, 11.0, 8.0, 20.0, 22.0, 18.0, 23.0, 29.0, 31.0, 34.0, 51.0, 41.0, 45.0, 63.0, 43.0, 48.0, 50.0, 46.0, 42.0, 45.0, 43.0, 43.0, 41.0, 24.0, 26.0, 16.0, 17.0, 19.0, 16.0, 19.0, 7.0, 8.0, 8.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01168060302734375, -0.011255979537963867, -0.010831356048583984, -0.010406732559204102, -0.009982109069824219, -0.009557485580444336, -0.009132862091064453, -0.00870823860168457, -0.008283615112304688, -0.007858991622924805, -0.007434368133544922, -0.007009744644165039, -0.006585121154785156, -0.0061604976654052734, -0.005735874176025391, -0.005311250686645508, -0.004886627197265625, -0.004462003707885742, -0.004037380218505859, -0.0036127567291259766, -0.0031881332397460938, -0.002763509750366211, -0.002338886260986328, -0.0019142627716064453, -0.0014896392822265625, -0.0010650157928466797, -0.0006403923034667969, -0.00021576881408691406, 0.00020885467529296875, 0.0006334781646728516, 0.0010581016540527344, 0.0014827251434326172, 0.0019073486328125, 0.002331972122192383, 0.0027565956115722656, 0.0031812191009521484, 0.0036058425903320312, 0.004030466079711914, 0.004455089569091797, 0.00487971305847168, 0.0053043365478515625, 0.005728960037231445, 0.006153583526611328, 0.006578207015991211, 0.007002830505371094, 0.0074274539947509766, 0.00785207748413086, 0.008276700973510742, 0.008701324462890625, 0.009125947952270508, 0.00955057144165039, 0.009975194931030273, 0.010399818420410156, 0.010824441909790039, 0.011249065399169922, 0.011673688888549805, 0.012098312377929688, 0.01252293586730957, 0.012947559356689453, 0.013372182846069336, 0.013796806335449219, 0.014221429824829102, 0.014646053314208984, 0.015070676803588867, 0.01549530029296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 13.0, 21.0, 37.0, 38.0, 69.0, 102.0, 160.0, 311.0, 648.0, 1531.0, 4150.0, 14669.0, 86075.0, 706493.0, 199230.0, 24902.0, 6343.0, 1991.0, 813.0, 367.0, 202.0, 107.0, 78.0, 61.0, 26.0, 22.0, 21.0, 14.0, 9.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007602691650390625, -0.007346451282501221, -0.007090210914611816, -0.006833970546722412, -0.006577730178833008, -0.0063214898109436035, -0.006065249443054199, -0.005809009075164795, -0.005552768707275391, -0.005296528339385986, -0.005040287971496582, -0.004784047603607178, -0.0045278072357177734, -0.004271566867828369, -0.004015326499938965, -0.0037590861320495605, -0.0035028457641601562, -0.003246605396270752, -0.0029903650283813477, -0.0027341246604919434, -0.002477884292602539, -0.0022216439247131348, -0.0019654035568237305, -0.0017091631889343262, -0.0014529228210449219, -0.0011966824531555176, -0.0009404420852661133, -0.000684201717376709, -0.0004279613494873047, -0.0001717209815979004, 8.45193862915039e-05, 0.0003407597541809082, 0.0005970001220703125, 0.0008532404899597168, 0.001109480857849121, 0.0013657212257385254, 0.0016219615936279297, 0.001878201961517334, 0.0021344423294067383, 0.0023906826972961426, 0.002646923065185547, 0.002903163433074951, 0.0031594038009643555, 0.0034156441688537598, 0.003671884536743164, 0.003928124904632568, 0.004184365272521973, 0.004440605640411377, 0.004696846008300781, 0.0049530863761901855, 0.00520932674407959, 0.005465567111968994, 0.0057218074798583984, 0.005978047847747803, 0.006234288215637207, 0.006490528583526611, 0.006746768951416016, 0.00700300931930542, 0.007259249687194824, 0.0075154900550842285, 0.007771730422973633, 0.008027970790863037, 0.008284211158752441, 0.008540451526641846, 0.00879669189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 3.0, 7.0, 10.0, 10.0, 7.0, 9.0, 11.0, 20.0, 16.0, 22.0, 18.0, 30.0, 31.0, 33.0, 48.0, 49.0, 64.0, 62.0, 78.0, 56.0, 58.0, 53.0, 45.0, 32.0, 31.0, 26.0, 24.0, 23.0, 23.0, 18.0, 20.0, 8.0, 12.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.786252975463867e-05, -4.6232715249061584e-05, -4.46029007434845e-05, -4.297308623790741e-05, -4.134327173233032e-05, -3.9713457226753235e-05, -3.808364272117615e-05, -3.645382821559906e-05, -3.482401371002197e-05, -3.3194199204444885e-05, -3.15643846988678e-05, -2.993457019329071e-05, -2.8304755687713623e-05, -2.6674941182136536e-05, -2.5045126676559448e-05, -2.341531217098236e-05, -2.1785497665405273e-05, -2.0155683159828186e-05, -1.85258686542511e-05, -1.689605414867401e-05, -1.5266239643096924e-05, -1.3636425137519836e-05, -1.2006610631942749e-05, -1.0376796126365662e-05, -8.746981620788574e-06, -7.117167115211487e-06, -5.487352609634399e-06, -3.857538104057312e-06, -2.2277235984802246e-06, -5.979090929031372e-07, 1.0319054126739502e-06, 2.6617199182510376e-06, 4.291534423828125e-06, 5.921348929405212e-06, 7.5511634349823e-06, 9.180977940559387e-06, 1.0810792446136475e-05, 1.2440606951713562e-05, 1.407042145729065e-05, 1.5700235962867737e-05, 1.7330050468444824e-05, 1.895986497402191e-05, 2.0589679479599e-05, 2.2219493985176086e-05, 2.3849308490753174e-05, 2.547912299633026e-05, 2.710893750190735e-05, 2.8738752007484436e-05, 3.0368566513061523e-05, 3.199838101863861e-05, 3.36281955242157e-05, 3.5258010029792786e-05, 3.688782453536987e-05, 3.851763904094696e-05, 4.014745354652405e-05, 4.1777268052101135e-05, 4.340708255767822e-05, 4.503689706325531e-05, 4.66667115688324e-05, 4.8296526074409485e-05, 4.992634057998657e-05, 5.155615508556366e-05, 5.318596959114075e-05, 5.4815784096717834e-05, 5.644559860229492e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 4.0, 9.0, 12.0, 18.0, 17.0, 20.0, 33.0, 55.0, 66.0, 130.0, 231.0, 446.0, 953.0, 2507.0, 7605.0, 34361.0, 372961.0, 565636.0, 48406.0, 9755.0, 3044.0, 1103.0, 491.0, 227.0, 148.0, 84.0, 59.0, 35.0, 32.0, 22.0, 17.0, 6.0, 10.0, 10.0, 4.0, 5.0, 5.0, 1.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00797271728515625, -0.007698655128479004, -0.007424592971801758, -0.007150530815124512, -0.006876468658447266, -0.0066024065017700195, -0.0063283443450927734, -0.006054282188415527, -0.005780220031738281, -0.005506157875061035, -0.005232095718383789, -0.004958033561706543, -0.004683971405029297, -0.004409909248352051, -0.004135847091674805, -0.0038617849349975586, -0.0035877227783203125, -0.0033136606216430664, -0.0030395984649658203, -0.0027655363082885742, -0.002491474151611328, -0.002217411994934082, -0.001943349838256836, -0.0016692876815795898, -0.0013952255249023438, -0.0011211633682250977, -0.0008471012115478516, -0.0005730390548706055, -0.0002989768981933594, -2.491474151611328e-05, 0.0002491474151611328, 0.0005232095718383789, 0.000797271728515625, 0.001071333885192871, 0.0013453960418701172, 0.0016194581985473633, 0.0018935203552246094, 0.0021675825119018555, 0.0024416446685791016, 0.0027157068252563477, 0.0029897689819335938, 0.00326383113861084, 0.003537893295288086, 0.003811955451965332, 0.004086017608642578, 0.004360079765319824, 0.00463414192199707, 0.004908204078674316, 0.0051822662353515625, 0.005456328392028809, 0.005730390548706055, 0.006004452705383301, 0.006278514862060547, 0.006552577018737793, 0.006826639175415039, 0.007100701332092285, 0.007374763488769531, 0.007648825645446777, 0.007922887802124023, 0.00819694995880127, 0.008471012115478516, 0.008745074272155762, 0.009019136428833008, 0.009293198585510254, 0.0095672607421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 8.0, 6.0, 10.0, 12.0, 18.0, 17.0, 26.0, 33.0, 35.0, 56.0, 62.0, 66.0, 91.0, 74.0, 89.0, 70.0, 69.0, 51.0, 43.0, 24.0, 30.0, 21.0, 15.0, 14.0, 11.0, 11.0, 2.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004266858100891113, -0.0041315555572509766, -0.00399625301361084, -0.003860950469970703, -0.0037256479263305664, -0.0035903453826904297, -0.003455042839050293, -0.0033197402954101562, -0.0031844377517700195, -0.003049135208129883, -0.002913832664489746, -0.0027785301208496094, -0.0026432275772094727, -0.002507925033569336, -0.0023726224899291992, -0.0022373199462890625, -0.0021020174026489258, -0.001966714859008789, -0.0018314123153686523, -0.0016961097717285156, -0.001560807228088379, -0.0014255046844482422, -0.0012902021408081055, -0.0011548995971679688, -0.001019597053527832, -0.0008842945098876953, -0.0007489919662475586, -0.0006136894226074219, -0.00047838687896728516, -0.00034308433532714844, -0.00020778179168701172, -7.2479248046875e-05, 6.282329559326172e-05, 0.00019812583923339844, 0.00033342838287353516, 0.0004687309265136719, 0.0006040334701538086, 0.0007393360137939453, 0.000874638557434082, 0.0010099411010742188, 0.0011452436447143555, 0.0012805461883544922, 0.001415848731994629, 0.0015511512756347656, 0.0016864538192749023, 0.001821756362915039, 0.0019570589065551758, 0.0020923614501953125, 0.0022276639938354492, 0.002362966537475586, 0.0024982690811157227, 0.0026335716247558594, 0.002768874168395996, 0.002904176712036133, 0.0030394792556762695, 0.0031747817993164062, 0.003310084342956543, 0.0034453868865966797, 0.0035806894302368164, 0.003715991973876953, 0.00385129451751709, 0.0039865970611572266, 0.004121899604797363, 0.0042572021484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 51.0, 895.0, 59.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13441069424152374, -0.11848713457584381, -0.10256357491016388, -0.08664000779390335, -0.07071644812822342, -0.05479288846254349, -0.03886932134628296, -0.022945761680603027, -0.007022202014923096, 0.008901359513401985, 0.024824921041727066, 0.040748484432697296, 0.05667204409837723, 0.07259560376405716, 0.08851917088031769, 0.10444273054599762, 0.12036629021167755, 0.13628984987735748, 0.15221340954303741, 0.16813698410987854, 0.18406054377555847, 0.1999841034412384, 0.21590766310691833, 0.23183122277259827, 0.2477547824382782, 0.26367834210395813, 0.27960190176963806, 0.295525461435318, 0.3114490211009979, 0.32737258076667786, 0.3432961702346802, 0.3592197299003601, 0.37514322996139526, 0.3910667896270752, 0.4069903492927551, 0.42291390895843506, 0.438837468624115, 0.4547610282897949, 0.47068458795547485, 0.4866081476211548, 0.5025317072868347, 0.5184552669525146, 0.5343788266181946, 0.5503023862838745, 0.5662259459495544, 0.5821495056152344, 0.5980730652809143, 0.6139966249465942, 0.629920244216919, 0.6458438038825989, 0.6617673635482788, 0.6776909232139587, 0.6936144828796387, 0.7095380425453186, 0.7254616022109985, 0.7413851618766785, 0.7573087215423584, 0.7732322812080383, 0.7891558408737183, 0.8050794005393982, 0.8210029602050781, 0.8369265198707581, 0.852850079536438, 0.8687736392021179, 0.8846971988677979]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 7.0, 3.0, 9.0, 12.0, 8.0, 13.0, 11.0, 16.0, 21.0, 23.0, 20.0, 30.0, 31.0, 44.0, 27.0, 47.0, 37.0, 44.0, 40.0, 40.0, 40.0, 57.0, 43.0, 37.0, 30.0, 45.0, 22.0, 45.0, 27.0, 18.0, 28.0, 16.0, 15.0, 20.0, 12.0, 16.0, 9.0, 6.0, 5.0, 7.0, 10.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04222053289413452, -0.04105687886476517, -0.03989322483539581, -0.03872957080602646, -0.037565916776657104, -0.03640226274728775, -0.035238608717918396, -0.03407495468854904, -0.03291130065917969, -0.03174764662981033, -0.03058399260044098, -0.029420338571071625, -0.02825668454170227, -0.027093030512332916, -0.025929376482963562, -0.024765722453594208, -0.023602068424224854, -0.0224384143948555, -0.021274760365486145, -0.02011110633611679, -0.018947452306747437, -0.017783798277378082, -0.016620144248008728, -0.015456490218639374, -0.01429283618927002, -0.013129182159900665, -0.011965528130531311, -0.010801874101161957, -0.009638220071792603, -0.008474566042423248, -0.007310912013053894, -0.00614725798368454, -0.0049836039543151855, -0.0038199499249458313, -0.002656295895576477, -0.0014926418662071228, -0.00032898783683776855, 0.0008346661925315857, 0.00199832022190094, 0.003161974251270294, 0.0043256282806396484, 0.005489282310009003, 0.006652936339378357, 0.007816590368747711, 0.008980244398117065, 0.01014389842748642, 0.011307552456855774, 0.012471206486225128, 0.013634860515594482, 0.014798514544963837, 0.01596216857433319, 0.017125822603702545, 0.0182894766330719, 0.019453130662441254, 0.020616784691810608, 0.021780438721179962, 0.022944092750549316, 0.02410774677991867, 0.025271400809288025, 0.02643505483865738, 0.027598708868026733, 0.028762362897396088, 0.029926016926765442, 0.031089670956134796, 0.03225332498550415]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 11.0, 4.0, 9.0, 13.0, 16.0, 24.0, 40.0, 44.0, 60.0, 83.0, 110.0, 154.0, 212.0, 349.0, 555.0, 1054.0, 2834.0, 5660.0, 21859.0, 1716014.0, 2406170.0, 28828.0, 5905.0, 1959.0, 761.0, 424.0, 284.0, 203.0, 158.0, 116.0, 77.0, 59.0, 47.0, 40.0, 29.0, 20.0, 20.0, 13.0, 13.0, 7.0, 9.0, 11.0, 1.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023162841796875, -0.02236485481262207, -0.02156686782836914, -0.02076888084411621, -0.01997089385986328, -0.01917290687561035, -0.018374919891357422, -0.017576932907104492, -0.016778945922851562, -0.015980958938598633, -0.015182971954345703, -0.014384984970092773, -0.013586997985839844, -0.012789011001586914, -0.011991024017333984, -0.011193037033081055, -0.010395050048828125, -0.009597063064575195, -0.008799076080322266, -0.008001089096069336, -0.007203102111816406, -0.0064051151275634766, -0.005607128143310547, -0.004809141159057617, -0.0040111541748046875, -0.003213167190551758, -0.002415180206298828, -0.0016171932220458984, -0.0008192062377929688, -2.1219253540039062e-05, 0.0007767677307128906, 0.0015747547149658203, 0.00237274169921875, 0.0031707286834716797, 0.003968715667724609, 0.004766702651977539, 0.005564689636230469, 0.0063626766204833984, 0.007160663604736328, 0.007958650588989258, 0.008756637573242188, 0.009554624557495117, 0.010352611541748047, 0.011150598526000977, 0.011948585510253906, 0.012746572494506836, 0.013544559478759766, 0.014342546463012695, 0.015140533447265625, 0.015938520431518555, 0.016736507415771484, 0.017534494400024414, 0.018332481384277344, 0.019130468368530273, 0.019928455352783203, 0.020726442337036133, 0.021524429321289062, 0.022322416305541992, 0.023120403289794922, 0.02391839027404785, 0.02471637725830078, 0.02551436424255371, 0.02631235122680664, 0.02711033821105957, 0.0279083251953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 11.0, 39.0, 95.0, 195.0, 209.0, 226.0, 143.0, 51.0, 18.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0177154541015625, -0.017119646072387695, -0.01652383804321289, -0.015928030014038086, -0.015332221984863281, -0.014736413955688477, -0.014140605926513672, -0.013544797897338867, -0.012948989868164062, -0.012353181838989258, -0.011757373809814453, -0.011161565780639648, -0.010565757751464844, -0.009969949722290039, -0.009374141693115234, -0.00877833366394043, -0.008182525634765625, -0.00758671760559082, -0.006990909576416016, -0.006395101547241211, -0.005799293518066406, -0.0052034854888916016, -0.004607677459716797, -0.004011869430541992, -0.0034160614013671875, -0.002820253372192383, -0.002224445343017578, -0.0016286373138427734, -0.0010328292846679688, -0.00043702125549316406, 0.00015878677368164062, 0.0007545948028564453, 0.00135040283203125, 0.0019462108612060547, 0.0025420188903808594, 0.003137826919555664, 0.0037336349487304688, 0.0043294429779052734, 0.004925251007080078, 0.005521059036254883, 0.0061168670654296875, 0.006712675094604492, 0.007308483123779297, 0.007904291152954102, 0.008500099182128906, 0.009095907211303711, 0.009691715240478516, 0.01028752326965332, 0.010883331298828125, 0.01147913932800293, 0.012074947357177734, 0.012670755386352539, 0.013266563415527344, 0.013862371444702148, 0.014458179473876953, 0.015053987503051758, 0.015649795532226562, 0.016245603561401367, 0.016841411590576172, 0.017437219619750977, 0.01803302764892578, 0.018628835678100586, 0.01922464370727539, 0.019820451736450195, 0.020416259765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 11.0, 17.0, 15.0, 24.0, 40.0, 91.0, 129.0, 257.0, 463.0, 944.0, 2120.0, 5955.0, 26025.0, 327979.0, 3661258.0, 144366.0, 16572.0, 4587.0, 1749.0, 782.0, 391.0, 213.0, 96.0, 69.0, 41.0, 30.0, 15.0, 11.0, 13.0, 5.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186004638671875, -0.018043041229248047, -0.017485618591308594, -0.01692819595336914, -0.016370773315429688, -0.015813350677490234, -0.015255928039550781, -0.014698505401611328, -0.014141082763671875, -0.013583660125732422, -0.013026237487792969, -0.012468814849853516, -0.011911392211914062, -0.01135396957397461, -0.010796546936035156, -0.010239124298095703, -0.00968170166015625, -0.009124279022216797, -0.008566856384277344, -0.00800943374633789, -0.0074520111083984375, -0.006894588470458984, -0.006337165832519531, -0.005779743194580078, -0.005222320556640625, -0.004664897918701172, -0.004107475280761719, -0.0035500526428222656, -0.0029926300048828125, -0.0024352073669433594, -0.0018777847290039062, -0.0013203620910644531, -0.000762939453125, -0.00020551681518554688, 0.00035190582275390625, 0.0009093284606933594, 0.0014667510986328125, 0.0020241737365722656, 0.0025815963745117188, 0.003139019012451172, 0.003696441650390625, 0.004253864288330078, 0.004811286926269531, 0.005368709564208984, 0.0059261322021484375, 0.006483554840087891, 0.007040977478027344, 0.007598400115966797, 0.00815582275390625, 0.008713245391845703, 0.009270668029785156, 0.00982809066772461, 0.010385513305664062, 0.010942935943603516, 0.011500358581542969, 0.012057781219482422, 0.012615203857421875, 0.013172626495361328, 0.013730049133300781, 0.014287471771240234, 0.014844894409179688, 0.01540231704711914, 0.015959739685058594, 0.016517162322998047, 0.0170745849609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 9.0, 3.0, 10.0, 11.0, 19.0, 46.0, 52.0, 108.0, 227.0, 526.0, 1147.0, 981.0, 372.0, 195.0, 131.0, 80.0, 45.0, 36.0, 25.0, 14.0, 10.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109405517578125, -0.01049947738647461, -0.010058403015136719, -0.009617328643798828, -0.009176254272460938, -0.008735179901123047, -0.008294105529785156, -0.007853031158447266, -0.007411956787109375, -0.006970882415771484, -0.006529808044433594, -0.006088733673095703, -0.0056476593017578125, -0.005206584930419922, -0.004765510559082031, -0.004324436187744141, -0.00388336181640625, -0.0034422874450683594, -0.0030012130737304688, -0.002560138702392578, -0.0021190643310546875, -0.0016779899597167969, -0.0012369155883789062, -0.0007958412170410156, -0.000354766845703125, 8.630752563476562e-05, 0.0005273818969726562, 0.0009684562683105469, 0.0014095306396484375, 0.0018506050109863281, 0.0022916793823242188, 0.0027327537536621094, 0.003173828125, 0.0036149024963378906, 0.004055976867675781, 0.004497051239013672, 0.0049381256103515625, 0.005379199981689453, 0.005820274353027344, 0.006261348724365234, 0.006702423095703125, 0.007143497467041016, 0.007584571838378906, 0.008025646209716797, 0.008466720581054688, 0.008907794952392578, 0.009348869323730469, 0.00978994369506836, 0.01023101806640625, 0.01067209243774414, 0.011113166809082031, 0.011554241180419922, 0.011995315551757812, 0.012436389923095703, 0.012877464294433594, 0.013318538665771484, 0.013759613037109375, 0.014200687408447266, 0.014641761779785156, 0.015082836151123047, 0.015523910522460938, 0.015964984893798828, 0.01640605926513672, 0.01684713363647461, 0.0172882080078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 30.0, 635.0, 305.0, 25.0, 11.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.5228489637374878, -0.5134583711624146, -0.5040677785873413, -0.4946771562099457, -0.48528656363487244, -0.4758959710597992, -0.46650537848472595, -0.4571147859096527, -0.4477241635322571, -0.43833357095718384, -0.4289429783821106, -0.41955235600471497, -0.4101617634296417, -0.4007711708545685, -0.39138057827949524, -0.381989985704422, -0.37259939312934875, -0.3632088005542755, -0.35381820797920227, -0.34442758560180664, -0.3350369930267334, -0.32564640045166016, -0.3162558078765869, -0.30686521530151367, -0.29747462272644043, -0.2880840301513672, -0.27869343757629395, -0.2693028151988983, -0.2599122226238251, -0.25052163004875183, -0.2411310374736786, -0.23174044489860535, -0.22234980762004852, -0.21295921504497528, -0.20356860756874084, -0.1941780149936676, -0.18478742241859436, -0.17539681494235992, -0.16600622236728668, -0.15661561489105225, -0.147225022315979, -0.13783442974090576, -0.12844382226467133, -0.11905322968959808, -0.10966262966394424, -0.1002720296382904, -0.09088143706321716, -0.08149083703756332, -0.07210023701190948, -0.06270963698625565, -0.053319040685892105, -0.043928444385528564, -0.034537844359874725, -0.025147244334220886, -0.015756648033857346, -0.006366051733493805, 0.003024548292160034, 0.012415146455168724, 0.021805744618177414, 0.031196342781186104, 0.040586940944194794, 0.04997754096984863, 0.05936813727021217, 0.06875873357057571, 0.07814933359622955]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 13.0, 5.0, 16.0, 27.0, 31.0, 47.0, 53.0, 57.0, 67.0, 96.0, 90.0, 95.0, 91.0, 66.0, 60.0, 49.0, 36.0, 33.0, 22.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0744444727897644, -0.07252074033021927, -0.07059701532125473, -0.0686732828617096, -0.06674955785274506, -0.06482582539319992, -0.06290209293365479, -0.06097836419939995, -0.05905463546514511, -0.057130906730890274, -0.05520717799663544, -0.0532834455370903, -0.051359716802835464, -0.04943598806858063, -0.04751225560903549, -0.045588526874780655, -0.04366479814052582, -0.04174106940627098, -0.039817340672016144, -0.03789360821247101, -0.03596987947821617, -0.034046150743961334, -0.0321224182844162, -0.03019868955016136, -0.028274960815906525, -0.026351232081651688, -0.0244275014847517, -0.022503770887851715, -0.020580042153596878, -0.01865631341934204, -0.016732582822442055, -0.014808853156864643, -0.012885123491287231, -0.01096139382570982, -0.009037664160132408, -0.0071139344945549965, -0.005190204828977585, -0.003266475163400173, -0.0013427454978227615, 0.0005809841677546501, 0.0025047138333320618, 0.004428443498909473, 0.006352173164486885, 0.008275902830064297, 0.010199632495641708, 0.01212336216121912, 0.014047091826796532, 0.015970822423696518, 0.017894551157951355, 0.019818279892206192, 0.02174201048910618, 0.023665741086006165, 0.025589469820261, 0.02751319855451584, 0.029436929151415825, 0.03136065974831581, 0.03328438848257065, 0.035208117216825485, 0.03713184595108032, 0.03905557841062546, 0.040979307144880295, 0.04290303587913513, 0.04482676833868027, 0.046750497072935104, 0.04867422580718994]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 29.0, 40.0, 52.0, 78.0, 112.0, 167.0, 260.0, 383.0, 598.0, 941.0, 2102.0, 17034.0, 758098.0, 257925.0, 6991.0, 1492.0, 732.0, 465.0, 322.0, 247.0, 154.0, 98.0, 72.0, 51.0, 35.0, 21.0, 14.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.044580936431884766, -0.04326343536376953, -0.0419459342956543, -0.04062843322753906, -0.03931093215942383, -0.037993431091308594, -0.03667593002319336, -0.035358428955078125, -0.03404092788696289, -0.032723426818847656, -0.03140592575073242, -0.030088424682617188, -0.028770923614501953, -0.02745342254638672, -0.026135921478271484, -0.02481842041015625, -0.023500919342041016, -0.02218341827392578, -0.020865917205810547, -0.019548416137695312, -0.018230915069580078, -0.016913414001464844, -0.01559591293334961, -0.014278411865234375, -0.01296091079711914, -0.011643409729003906, -0.010325908660888672, -0.009008407592773438, -0.007690906524658203, -0.006373405456542969, -0.005055904388427734, -0.0037384033203125, -0.0024209022521972656, -0.0011034011840820312, 0.00021409988403320312, 0.0015316009521484375, 0.002849102020263672, 0.004166603088378906, 0.005484104156494141, 0.006801605224609375, 0.00811910629272461, 0.009436607360839844, 0.010754108428955078, 0.012071609497070312, 0.013389110565185547, 0.014706611633300781, 0.016024112701416016, 0.01734161376953125, 0.018659114837646484, 0.01997661590576172, 0.021294116973876953, 0.022611618041992188, 0.023929119110107422, 0.025246620178222656, 0.02656412124633789, 0.027881622314453125, 0.02919912338256836, 0.030516624450683594, 0.03183412551879883, 0.03315162658691406, 0.0344691276550293, 0.03578662872314453, 0.037104129791259766, 0.038421630859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 13.0, 34.0, 122.0, 214.0, 230.0, 211.0, 117.0, 35.0, 12.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0191192626953125, -0.018492460250854492, -0.017865657806396484, -0.017238855361938477, -0.01661205291748047, -0.01598525047302246, -0.015358448028564453, -0.014731645584106445, -0.014104843139648438, -0.01347804069519043, -0.012851238250732422, -0.012224435806274414, -0.011597633361816406, -0.010970830917358398, -0.01034402847290039, -0.009717226028442383, -0.009090423583984375, -0.008463621139526367, -0.00783681869506836, -0.0072100162506103516, -0.006583213806152344, -0.005956411361694336, -0.005329608917236328, -0.00470280647277832, -0.0040760040283203125, -0.0034492015838623047, -0.002822399139404297, -0.002195596694946289, -0.0015687942504882812, -0.0009419918060302734, -0.0003151893615722656, 0.0003116130828857422, 0.00093841552734375, 0.0015652179718017578, 0.0021920204162597656, 0.0028188228607177734, 0.0034456253051757812, 0.004072427749633789, 0.004699230194091797, 0.005326032638549805, 0.0059528350830078125, 0.00657963752746582, 0.007206439971923828, 0.007833242416381836, 0.008460044860839844, 0.009086847305297852, 0.00971364974975586, 0.010340452194213867, 0.010967254638671875, 0.011594057083129883, 0.01222085952758789, 0.012847661972045898, 0.013474464416503906, 0.014101266860961914, 0.014728069305419922, 0.01535487174987793, 0.015981674194335938, 0.016608476638793945, 0.017235279083251953, 0.01786208152770996, 0.01848888397216797, 0.019115686416625977, 0.019742488861083984, 0.020369291305541992, 0.02099609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 3.0, 15.0, 17.0, 22.0, 27.0, 34.0, 46.0, 49.0, 72.0, 85.0, 139.0, 187.0, 339.0, 603.0, 1094.0, 2457.0, 6196.0, 20237.0, 87947.0, 386308.0, 411359.0, 96816.0, 22482.0, 6657.0, 2521.0, 1141.0, 617.0, 339.0, 206.0, 125.0, 99.0, 86.0, 55.0, 31.0, 39.0, 21.0, 15.0, 15.0, 9.0, 8.0, 11.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01233673095703125, -0.011925935745239258, -0.011515140533447266, -0.011104345321655273, -0.010693550109863281, -0.010282754898071289, -0.009871959686279297, -0.009461164474487305, -0.009050369262695312, -0.00863957405090332, -0.008228778839111328, -0.007817983627319336, -0.007407188415527344, -0.0069963932037353516, -0.006585597991943359, -0.006174802780151367, -0.005764007568359375, -0.005353212356567383, -0.004942417144775391, -0.0045316219329833984, -0.004120826721191406, -0.003710031509399414, -0.003299236297607422, -0.0028884410858154297, -0.0024776458740234375, -0.0020668506622314453, -0.0016560554504394531, -0.001245260238647461, -0.0008344650268554688, -0.00042366981506347656, -1.2874603271484375e-05, 0.0003979206085205078, 0.0008087158203125, 0.0012195110321044922, 0.0016303062438964844, 0.0020411014556884766, 0.0024518966674804688, 0.002862691879272461, 0.003273487091064453, 0.0036842823028564453, 0.0040950775146484375, 0.00450587272644043, 0.004916667938232422, 0.005327463150024414, 0.005738258361816406, 0.0061490535736083984, 0.006559848785400391, 0.006970643997192383, 0.007381439208984375, 0.007792234420776367, 0.00820302963256836, 0.008613824844360352, 0.009024620056152344, 0.009435415267944336, 0.009846210479736328, 0.01025700569152832, 0.010667800903320312, 0.011078596115112305, 0.011489391326904297, 0.011900186538696289, 0.012310981750488281, 0.012721776962280273, 0.013132572174072266, 0.013543367385864258, 0.01395416259765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 10.0, 17.0, 15.0, 28.0, 27.0, 22.0, 26.0, 38.0, 27.0, 46.0, 44.0, 31.0, 50.0, 54.0, 40.0, 47.0, 44.0, 45.0, 48.0, 51.0, 46.0, 28.0, 32.0, 25.0, 27.0, 19.0, 11.0, 12.0, 13.0, 11.0, 5.0, 10.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.011688232421875, -0.0113145112991333, -0.010940790176391602, -0.010567069053649902, -0.010193347930908203, -0.009819626808166504, -0.009445905685424805, -0.009072184562683105, -0.008698463439941406, -0.008324742317199707, -0.007951021194458008, -0.007577300071716309, -0.007203578948974609, -0.00682985782623291, -0.006456136703491211, -0.006082415580749512, -0.0057086944580078125, -0.005334973335266113, -0.004961252212524414, -0.004587531089782715, -0.004213809967041016, -0.0038400888442993164, -0.003466367721557617, -0.003092646598815918, -0.0027189254760742188, -0.0023452043533325195, -0.0019714832305908203, -0.001597762107849121, -0.0012240409851074219, -0.0008503198623657227, -0.00047659873962402344, -0.00010287761688232422, 0.000270843505859375, 0.0006445646286010742, 0.0010182857513427734, 0.0013920068740844727, 0.0017657279968261719, 0.002139449119567871, 0.0025131702423095703, 0.0028868913650512695, 0.0032606124877929688, 0.003634333610534668, 0.004008054733276367, 0.004381775856018066, 0.004755496978759766, 0.005129218101501465, 0.005502939224243164, 0.005876660346984863, 0.0062503814697265625, 0.006624102592468262, 0.006997823715209961, 0.00737154483795166, 0.007745265960693359, 0.008118987083435059, 0.008492708206176758, 0.008866429328918457, 0.009240150451660156, 0.009613871574401855, 0.009987592697143555, 0.010361313819885254, 0.010735034942626953, 0.011108756065368652, 0.011482477188110352, 0.01185619831085205, 0.01222991943359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 3.0, 11.0, 4.0, 13.0, 18.0, 23.0, 29.0, 50.0, 100.0, 154.0, 269.0, 448.0, 787.0, 1550.0, 3178.0, 9135.0, 54608.0, 707963.0, 239944.0, 20129.0, 5285.0, 2213.0, 1125.0, 623.0, 332.0, 226.0, 108.0, 79.0, 41.0, 24.0, 21.0, 8.0, 9.0, 13.0, 5.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00786590576171875, -0.0076258182525634766, -0.007385730743408203, -0.00714564323425293, -0.006905555725097656, -0.006665468215942383, -0.006425380706787109, -0.006185293197631836, -0.0059452056884765625, -0.005705118179321289, -0.005465030670166016, -0.005224943161010742, -0.004984855651855469, -0.004744768142700195, -0.004504680633544922, -0.0042645931243896484, -0.004024505615234375, -0.0037844181060791016, -0.003544330596923828, -0.0033042430877685547, -0.0030641555786132812, -0.002824068069458008, -0.0025839805603027344, -0.002343893051147461, -0.0021038055419921875, -0.001863718032836914, -0.0016236305236816406, -0.0013835430145263672, -0.0011434555053710938, -0.0009033679962158203, -0.0006632804870605469, -0.00042319297790527344, -0.00018310546875, 5.698204040527344e-05, 0.0002970695495605469, 0.0005371570587158203, 0.0007772445678710938, 0.0010173320770263672, 0.0012574195861816406, 0.001497507095336914, 0.0017375946044921875, 0.001977682113647461, 0.0022177696228027344, 0.002457857131958008, 0.0026979446411132812, 0.0029380321502685547, 0.003178119659423828, 0.0034182071685791016, 0.003658294677734375, 0.0038983821868896484, 0.004138469696044922, 0.004378557205200195, 0.004618644714355469, 0.004858732223510742, 0.005098819732666016, 0.005338907241821289, 0.0055789947509765625, 0.005819082260131836, 0.006059169769287109, 0.006299257278442383, 0.006539344787597656, 0.00677943229675293, 0.007019519805908203, 0.0072596073150634766, 0.00749969482421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 12.0, 10.0, 17.0, 24.0, 26.0, 53.0, 36.0, 65.0, 55.0, 65.0, 69.0, 82.0, 83.0, 69.0, 67.0, 52.0, 43.0, 33.0, 26.0, 19.0, 13.0, 20.0, 9.0, 7.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.730722427368164e-05, -7.440242916345596e-05, -7.149763405323029e-05, -6.859283894300461e-05, -6.568804383277893e-05, -6.278324872255325e-05, -5.9878453612327576e-05, -5.69736585021019e-05, -5.406886339187622e-05, -5.116406828165054e-05, -4.8259273171424866e-05, -4.535447806119919e-05, -4.244968295097351e-05, -3.954488784074783e-05, -3.6640092730522156e-05, -3.373529762029648e-05, -3.08305025100708e-05, -2.7925707399845123e-05, -2.5020912289619446e-05, -2.211611717939377e-05, -1.921132206916809e-05, -1.6306526958942413e-05, -1.3401731848716736e-05, -1.0496936738491058e-05, -7.592141628265381e-06, -4.687346518039703e-06, -1.7825514078140259e-06, 1.1222437024116516e-06, 4.027038812637329e-06, 6.931833922863007e-06, 9.836629033088684e-06, 1.2741424143314362e-05, 1.564621925354004e-05, 1.8551014363765717e-05, 2.1455809473991394e-05, 2.436060458421707e-05, 2.726539969444275e-05, 3.0170194804668427e-05, 3.3074989914894104e-05, 3.597978502511978e-05, 3.888458013534546e-05, 4.1789375245571136e-05, 4.4694170355796814e-05, 4.759896546602249e-05, 5.050376057624817e-05, 5.3408555686473846e-05, 5.6313350796699524e-05, 5.92181459069252e-05, 6.212294101715088e-05, 6.502773612737656e-05, 6.793253123760223e-05, 7.083732634782791e-05, 7.374212145805359e-05, 7.664691656827927e-05, 7.955171167850494e-05, 8.245650678873062e-05, 8.53613018989563e-05, 8.826609700918198e-05, 9.117089211940765e-05, 9.407568722963333e-05, 9.698048233985901e-05, 9.988527745008469e-05, 0.00010279007256031036, 0.00010569486767053604, 0.00010859966278076172]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 12.0, 9.0, 9.0, 14.0, 16.0, 41.0, 68.0, 124.0, 229.0, 461.0, 836.0, 1542.0, 3532.0, 13105.0, 266729.0, 728251.0, 24686.0, 4752.0, 1916.0, 1064.0, 503.0, 292.0, 161.0, 77.0, 50.0, 12.0, 12.0, 10.0, 8.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01268768310546875, -0.012326717376708984, -0.011965751647949219, -0.011604785919189453, -0.011243820190429688, -0.010882854461669922, -0.010521888732910156, -0.01016092300415039, -0.009799957275390625, -0.00943899154663086, -0.009078025817871094, -0.008717060089111328, -0.008356094360351562, -0.007995128631591797, -0.007634162902832031, -0.007273197174072266, -0.0069122314453125, -0.006551265716552734, -0.006190299987792969, -0.005829334259033203, -0.0054683685302734375, -0.005107402801513672, -0.004746437072753906, -0.004385471343994141, -0.004024505615234375, -0.0036635398864746094, -0.0033025741577148438, -0.002941608428955078, -0.0025806427001953125, -0.002219676971435547, -0.0018587112426757812, -0.0014977455139160156, -0.00113677978515625, -0.0007758140563964844, -0.00041484832763671875, -5.3882598876953125e-05, 0.0003070831298828125, 0.0006680488586425781, 0.0010290145874023438, 0.0013899803161621094, 0.001750946044921875, 0.0021119117736816406, 0.0024728775024414062, 0.002833843231201172, 0.0031948089599609375, 0.003555774688720703, 0.003916740417480469, 0.004277706146240234, 0.004638671875, 0.004999637603759766, 0.005360603332519531, 0.005721569061279297, 0.0060825347900390625, 0.006443500518798828, 0.006804466247558594, 0.007165431976318359, 0.007526397705078125, 0.00788736343383789, 0.008248329162597656, 0.008609294891357422, 0.008970260620117188, 0.009331226348876953, 0.009692192077636719, 0.010053157806396484, 0.01041412353515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 9.0, 16.0, 10.0, 19.0, 26.0, 33.0, 45.0, 63.0, 76.0, 101.0, 115.0, 115.0, 79.0, 65.0, 42.0, 38.0, 41.0, 25.0, 21.0, 20.0, 10.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0045013427734375, -0.004375845193862915, -0.00425034761428833, -0.004124850034713745, -0.00399935245513916, -0.003873854875564575, -0.0037483572959899902, -0.0036228597164154053, -0.0034973621368408203, -0.0033718645572662354, -0.0032463669776916504, -0.0031208693981170654, -0.0029953718185424805, -0.0028698742389678955, -0.0027443766593933105, -0.0026188790798187256, -0.0024933815002441406, -0.0023678839206695557, -0.0022423863410949707, -0.0021168887615203857, -0.0019913911819458008, -0.0018658936023712158, -0.0017403960227966309, -0.001614898443222046, -0.001489400863647461, -0.001363903284072876, -0.001238405704498291, -0.001112908124923706, -0.000987410545349121, -0.0008619129657745361, -0.0007364153861999512, -0.0006109178066253662, -0.00048542022705078125, -0.0003599226474761963, -0.00023442506790161133, -0.00010892748832702637, 1.6570091247558594e-05, 0.00014206767082214355, 0.0002675652503967285, 0.0003930628299713135, 0.0005185604095458984, 0.0006440579891204834, 0.0007695555686950684, 0.0008950531482696533, 0.0010205507278442383, 0.0011460483074188232, 0.0012715458869934082, 0.0013970434665679932, 0.0015225410461425781, 0.001648038625717163, 0.001773536205291748, 0.001899033784866333, 0.002024531364440918, 0.002150028944015503, 0.002275526523590088, 0.002401024103164673, 0.002526521682739258, 0.0026520192623138428, 0.0027775168418884277, 0.0029030144214630127, 0.0030285120010375977, 0.0031540095806121826, 0.0032795071601867676, 0.0034050047397613525, 0.0035305023193359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 25.0, 246.0, 547.0, 154.0, 26.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03863357752561569, -0.03248655050992966, -0.02633952535688877, -0.020192500203847885, -0.01404547318816185, -0.007898446172475815, -0.0017514228820800781, 0.004395604133605957, 0.010542631149291992, 0.016689658164978027, 0.022836683318018913, 0.0289837084710598, 0.035130735486745834, 0.04127776250243187, 0.047424785792827606, 0.05357181280851364, 0.059718839824199677, 0.06586586683988571, 0.07201289385557175, 0.07815991342067719, 0.08430694043636322, 0.09045396745204926, 0.09660099446773529, 0.10274802148342133, 0.10889504849910736, 0.1150420755147934, 0.12118910253047943, 0.12733612954616547, 0.1334831565618515, 0.13963018357753754, 0.14577719569206238, 0.1519242227077484, 0.15807124972343445, 0.16421827673912048, 0.17036530375480652, 0.17651233077049255, 0.1826593577861786, 0.18880638480186462, 0.19495341181755066, 0.2011004388332367, 0.20724746584892273, 0.21339449286460876, 0.2195415198802948, 0.22568854689598083, 0.23183557391166687, 0.2379826009273529, 0.24412962794303894, 0.250276654958725, 0.2564236521720886, 0.26257067918777466, 0.2687177062034607, 0.27486473321914673, 0.28101176023483276, 0.2871587872505188, 0.29330581426620483, 0.29945284128189087, 0.3055998682975769, 0.31174689531326294, 0.317893922328949, 0.324040949344635, 0.33018797636032104, 0.3363350033760071, 0.3424820303916931, 0.34862905740737915, 0.3547760844230652]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 13.0, 6.0, 7.0, 11.0, 16.0, 16.0, 8.0, 21.0, 16.0, 23.0, 29.0, 32.0, 31.0, 36.0, 31.0, 48.0, 53.0, 46.0, 39.0, 33.0, 45.0, 44.0, 29.0, 41.0, 39.0, 35.0, 20.0, 32.0, 17.0, 22.0, 23.0, 17.0, 24.0, 16.0, 17.0, 12.0, 15.0, 6.0, 10.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03021639585494995, -0.029295291751623154, -0.028374185785651207, -0.02745307981967926, -0.026531975716352463, -0.025610871613025665, -0.02468976564705372, -0.023768659681081772, -0.022847555577754974, -0.021926451474428177, -0.02100534550845623, -0.020084239542484283, -0.019163135439157486, -0.01824203133583069, -0.017320925369858742, -0.016399819403886795, -0.015478715300559998, -0.014557610265910625, -0.013636505231261253, -0.012715400196611881, -0.01179429516196251, -0.010873190127313137, -0.009952085092663765, -0.009030980058014393, -0.00810987502336502, -0.007188769988715649, -0.0062676649540662766, -0.0053465599194169044, -0.004425454884767532, -0.0035043498501181602, -0.002583244815468788, -0.001662139780819416, -0.0007410347461700439, 0.00018007028847932816, 0.0011011753231287003, 0.0020222803577780724, 0.0029433853924274445, 0.0038644904270768166, 0.004785595461726189, 0.005706700496375561, 0.006627805531024933, 0.007548910565674305, 0.008470015600323677, 0.00939112063497305, 0.010312225669622421, 0.011233330704271793, 0.012154435738921165, 0.013075540773570538, 0.01399664580821991, 0.014917750842869282, 0.015838855877518654, 0.0167599618434906, 0.017681065946817398, 0.018602170050144196, 0.019523276016116142, 0.02044438198208809, 0.021365486085414886, 0.022286590188741684, 0.02320769615471363, 0.024128802120685577, 0.025049906224012375, 0.025971010327339172, 0.02689211629331112, 0.027813222259283066, 0.028734326362609863]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 14.0, 16.0, 20.0, 32.0, 39.0, 49.0, 99.0, 121.0, 194.0, 292.0, 498.0, 1248.0, 2722.0, 5922.0, 50506.0, 4004970.0, 112516.0, 9873.0, 2991.0, 895.0, 435.0, 203.0, 174.0, 95.0, 76.0, 54.0, 59.0, 39.0, 17.0, 16.0, 15.0, 8.0, 14.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0269775390625, -0.026124000549316406, -0.025270462036132812, -0.02441692352294922, -0.023563385009765625, -0.02270984649658203, -0.021856307983398438, -0.021002769470214844, -0.02014923095703125, -0.019295692443847656, -0.018442153930664062, -0.01758861541748047, -0.016735076904296875, -0.01588153839111328, -0.015027999877929688, -0.014174461364746094, -0.0133209228515625, -0.012467384338378906, -0.011613845825195312, -0.010760307312011719, -0.009906768798828125, -0.009053230285644531, -0.008199691772460938, -0.007346153259277344, -0.00649261474609375, -0.005639076232910156, -0.0047855377197265625, -0.003931999206542969, -0.003078460693359375, -0.0022249221801757812, -0.0013713836669921875, -0.0005178451538085938, 0.000335693359375, 0.0011892318725585938, 0.0020427703857421875, 0.0028963088989257812, 0.003749847412109375, 0.004603385925292969, 0.0054569244384765625, 0.006310462951660156, 0.00716400146484375, 0.008017539978027344, 0.008871078491210938, 0.009724617004394531, 0.010578155517578125, 0.011431694030761719, 0.012285232543945312, 0.013138771057128906, 0.0139923095703125, 0.014845848083496094, 0.015699386596679688, 0.01655292510986328, 0.017406463623046875, 0.01826000213623047, 0.019113540649414062, 0.019967079162597656, 0.02082061767578125, 0.021674156188964844, 0.022527694702148438, 0.02338123321533203, 0.024234771728515625, 0.02508831024169922, 0.025941848754882812, 0.026795387268066406, 0.02764892578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 38.0, 104.0, 209.0, 215.0, 224.0, 125.0, 52.0, 14.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180816650390625, -0.017450809478759766, -0.01681995391845703, -0.016189098358154297, -0.015558242797851562, -0.014927387237548828, -0.014296531677246094, -0.01366567611694336, -0.013034820556640625, -0.01240396499633789, -0.011773109436035156, -0.011142253875732422, -0.010511398315429688, -0.009880542755126953, -0.009249687194824219, -0.008618831634521484, -0.00798797607421875, -0.007357120513916016, -0.006726264953613281, -0.006095409393310547, -0.0054645538330078125, -0.004833698272705078, -0.004202842712402344, -0.0035719871520996094, -0.002941131591796875, -0.0023102760314941406, -0.0016794204711914062, -0.0010485649108886719, -0.0004177093505859375, 0.00021314620971679688, 0.0008440017700195312, 0.0014748573303222656, 0.002105712890625, 0.0027365684509277344, 0.0033674240112304688, 0.003998279571533203, 0.0046291351318359375, 0.005259990692138672, 0.005890846252441406, 0.006521701812744141, 0.007152557373046875, 0.007783412933349609, 0.008414268493652344, 0.009045124053955078, 0.009675979614257812, 0.010306835174560547, 0.010937690734863281, 0.011568546295166016, 0.01219940185546875, 0.012830257415771484, 0.013461112976074219, 0.014091968536376953, 0.014722824096679688, 0.015353679656982422, 0.015984535217285156, 0.01661539077758789, 0.017246246337890625, 0.01787710189819336, 0.018507957458496094, 0.019138813018798828, 0.019769668579101562, 0.020400524139404297, 0.02103137969970703, 0.021662235260009766, 0.0222930908203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 10.0, 21.0, 24.0, 39.0, 64.0, 107.0, 193.0, 356.0, 680.0, 1521.0, 3857.0, 14289.0, 102796.0, 3650442.0, 378954.0, 30339.0, 6568.0, 2172.0, 869.0, 463.0, 201.0, 124.0, 58.0, 41.0, 33.0, 16.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010262012481689453, -0.009766578674316406, -0.00927114486694336, -0.008775711059570312, -0.008280277252197266, -0.007784843444824219, -0.007289409637451172, -0.006793975830078125, -0.006298542022705078, -0.005803108215332031, -0.005307674407958984, -0.0048122406005859375, -0.004316806793212891, -0.0038213729858398438, -0.003325939178466797, -0.00283050537109375, -0.002335071563720703, -0.0018396377563476562, -0.0013442039489746094, -0.0008487701416015625, -0.0003533363342285156, 0.00014209747314453125, 0.0006375312805175781, 0.001132965087890625, 0.0016283988952636719, 0.0021238327026367188, 0.0026192665100097656, 0.0031147003173828125, 0.0036101341247558594, 0.004105567932128906, 0.004601001739501953, 0.005096435546875, 0.005591869354248047, 0.006087303161621094, 0.006582736968994141, 0.0070781707763671875, 0.007573604583740234, 0.008069038391113281, 0.008564472198486328, 0.009059906005859375, 0.009555339813232422, 0.010050773620605469, 0.010546207427978516, 0.011041641235351562, 0.01153707504272461, 0.012032508850097656, 0.012527942657470703, 0.01302337646484375, 0.013518810272216797, 0.014014244079589844, 0.01450967788696289, 0.015005111694335938, 0.015500545501708984, 0.01599597930908203, 0.016491413116455078, 0.016986846923828125, 0.017482280731201172, 0.01797771453857422, 0.018473148345947266, 0.018968582153320312, 0.01946401596069336, 0.019959449768066406, 0.020454883575439453, 0.0209503173828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 10.0, 17.0, 25.0, 32.0, 65.0, 79.0, 175.0, 453.0, 1215.0, 1052.0, 400.0, 184.0, 99.0, 77.0, 47.0, 39.0, 23.0, 18.0, 11.0, 7.0, 6.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01050567626953125, -0.010186433792114258, -0.009867191314697266, -0.009547948837280273, -0.009228706359863281, -0.008909463882446289, -0.008590221405029297, -0.008270978927612305, -0.007951736450195312, -0.00763249397277832, -0.007313251495361328, -0.006994009017944336, -0.006674766540527344, -0.0063555240631103516, -0.006036281585693359, -0.005717039108276367, -0.005397796630859375, -0.005078554153442383, -0.004759311676025391, -0.0044400691986083984, -0.004120826721191406, -0.003801584243774414, -0.003482341766357422, -0.0031630992889404297, -0.0028438568115234375, -0.0025246143341064453, -0.002205371856689453, -0.001886129379272461, -0.0015668869018554688, -0.0012476444244384766, -0.0009284019470214844, -0.0006091594696044922, -0.0002899169921875, 2.9325485229492188e-05, 0.0003485679626464844, 0.0006678104400634766, 0.0009870529174804688, 0.001306295394897461, 0.0016255378723144531, 0.0019447803497314453, 0.0022640228271484375, 0.0025832653045654297, 0.002902507781982422, 0.003221750259399414, 0.0035409927368164062, 0.0038602352142333984, 0.004179477691650391, 0.004498720169067383, 0.004817962646484375, 0.005137205123901367, 0.005456447601318359, 0.0057756900787353516, 0.006094932556152344, 0.006414175033569336, 0.006733417510986328, 0.00705265998840332, 0.0073719024658203125, 0.007691144943237305, 0.008010387420654297, 0.008329629898071289, 0.008648872375488281, 0.008968114852905273, 0.009287357330322266, 0.009606599807739258, 0.00992584228515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 366.0, 505.0, 82.0, 11.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20076274871826172, -0.19598011672496796, -0.1911974847316742, -0.18641485273838043, -0.18163222074508667, -0.1768496036529541, -0.17206695675849915, -0.16728433966636658, -0.16250170767307281, -0.15771907567977905, -0.1529364436864853, -0.14815381169319153, -0.14337117969989777, -0.138588547706604, -0.13380593061447144, -0.12902329862117767, -0.12424065917730331, -0.11945802718400955, -0.11467539519071579, -0.10989277064800262, -0.10511013865470886, -0.1003275066614151, -0.09554487466812134, -0.09076224267482758, -0.08597961068153381, -0.08119697868824005, -0.07641434669494629, -0.07163171470165253, -0.06684909015893936, -0.0620664581656456, -0.05728382617235184, -0.05250119790434837, -0.04771857708692551, -0.042935945093631744, -0.03815331682562828, -0.03337068483233452, -0.028588054701685905, -0.023805424571037292, -0.01902279257774353, -0.014240164309740067, -0.009457532316446304, -0.004674901720136404, 0.00010772887617349625, 0.004890359938144684, 0.009672990068793297, 0.01445562019944191, 0.019238252192735672, 0.024020880460739136, 0.028803512454032898, 0.03358614444732666, 0.038368772715330124, 0.043151404708623886, 0.04793403297662735, 0.05271666496992111, 0.057499296963214874, 0.06228192523121834, 0.0670645534992218, 0.07184718549251556, 0.07662981748580933, 0.08141244947910309, 0.08619507402181625, 0.09097770601511002, 0.09576033800840378, 0.10054296255111694, 0.1053256019949913]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 15.0, 18.0, 23.0, 34.0, 34.0, 47.0, 57.0, 64.0, 72.0, 67.0, 67.0, 60.0, 61.0, 78.0, 61.0, 39.0, 38.0, 34.0, 23.0, 17.0, 11.0, 20.0, 13.0, 10.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02980595827102661, -0.02871539816260338, -0.027624839916825294, -0.02653428167104721, -0.025443721562623978, -0.024353161454200745, -0.02326260320842266, -0.022172044962644577, -0.021081484854221344, -0.01999092474579811, -0.018900366500020027, -0.017809808254241943, -0.01671924814581871, -0.015628688037395477, -0.014538129791617393, -0.013447570614516735, -0.012357011437416077, -0.011266452260315418, -0.01017589308321476, -0.009085333906114101, -0.007994774729013443, -0.006904215551912785, -0.005813656374812126, -0.004723097197711468, -0.0036325380206108093, -0.002541978843510151, -0.0014514196664094925, -0.0003608604893088341, 0.0007296986877918243, 0.0018202578648924828, 0.002910817041993141, 0.0040013762190938, 0.005091935396194458, 0.006182494573295116, 0.007273053750395775, 0.008363612927496433, 0.009454172104597092, 0.01054473128169775, 0.011635290458798409, 0.012725849635899067, 0.013816408812999725, 0.014906967990100384, 0.015997527167201042, 0.017088085412979126, 0.01817864552140236, 0.019269205629825592, 0.020359763875603676, 0.02145032212138176, 0.022540882229804993, 0.023631442338228226, 0.02472200058400631, 0.025812558829784393, 0.026903118938207626, 0.02799367904663086, 0.029084237292408943, 0.030174795538187027, 0.03126535564661026, 0.03235591575503349, 0.033446475863456726, 0.03453703224658966, 0.035627592355012894, 0.03671815246343613, 0.03780870884656906, 0.038899268954992294, 0.03998982906341553]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 15.0, 11.0, 15.0, 24.0, 37.0, 32.0, 65.0, 88.0, 93.0, 150.0, 183.0, 313.0, 461.0, 699.0, 1358.0, 3938.0, 33812.0, 783884.0, 208545.0, 9862.0, 2091.0, 967.0, 545.0, 396.0, 256.0, 200.0, 147.0, 97.0, 66.0, 48.0, 40.0, 28.0, 18.0, 11.0, 11.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0236358642578125, -0.022814035415649414, -0.021992206573486328, -0.021170377731323242, -0.020348548889160156, -0.01952672004699707, -0.018704891204833984, -0.0178830623626709, -0.017061233520507812, -0.016239404678344727, -0.01541757583618164, -0.014595746994018555, -0.013773918151855469, -0.012952089309692383, -0.012130260467529297, -0.011308431625366211, -0.010486602783203125, -0.009664773941040039, -0.008842945098876953, -0.008021116256713867, -0.007199287414550781, -0.006377458572387695, -0.005555629730224609, -0.0047338008880615234, -0.0039119720458984375, -0.0030901432037353516, -0.0022683143615722656, -0.0014464855194091797, -0.0006246566772460938, 0.0001971721649169922, 0.0010190010070800781, 0.001840829849243164, 0.00266265869140625, 0.003484487533569336, 0.004306316375732422, 0.005128145217895508, 0.005949974060058594, 0.00677180290222168, 0.007593631744384766, 0.008415460586547852, 0.009237289428710938, 0.010059118270874023, 0.01088094711303711, 0.011702775955200195, 0.012524604797363281, 0.013346433639526367, 0.014168262481689453, 0.014990091323852539, 0.015811920166015625, 0.01663374900817871, 0.017455577850341797, 0.018277406692504883, 0.01909923553466797, 0.019921064376831055, 0.02074289321899414, 0.021564722061157227, 0.022386550903320312, 0.0232083797454834, 0.024030208587646484, 0.02485203742980957, 0.025673866271972656, 0.026495695114135742, 0.027317523956298828, 0.028139352798461914, 0.028961181640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 16.0, 54.0, 142.0, 193.0, 212.0, 205.0, 100.0, 50.0, 16.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01806640625, -0.017472267150878906, -0.016878128051757812, -0.01628398895263672, -0.015689849853515625, -0.015095710754394531, -0.014501571655273438, -0.013907432556152344, -0.01331329345703125, -0.012719154357910156, -0.012125015258789062, -0.011530876159667969, -0.010936737060546875, -0.010342597961425781, -0.009748458862304688, -0.009154319763183594, -0.0085601806640625, -0.007966041564941406, -0.0073719024658203125, -0.006777763366699219, -0.006183624267578125, -0.005589485168457031, -0.0049953460693359375, -0.004401206970214844, -0.00380706787109375, -0.0032129287719726562, -0.0026187896728515625, -0.0020246505737304688, -0.001430511474609375, -0.0008363723754882812, -0.0002422332763671875, 0.00035190582275390625, 0.000946044921875, 0.0015401840209960938, 0.0021343231201171875, 0.0027284622192382812, 0.003322601318359375, 0.003916740417480469, 0.0045108795166015625, 0.005105018615722656, 0.00569915771484375, 0.006293296813964844, 0.0068874359130859375, 0.007481575012207031, 0.008075714111328125, 0.008669853210449219, 0.009263992309570312, 0.009858131408691406, 0.0104522705078125, 0.011046409606933594, 0.011640548706054688, 0.012234687805175781, 0.012828826904296875, 0.013422966003417969, 0.014017105102539062, 0.014611244201660156, 0.01520538330078125, 0.015799522399902344, 0.016393661499023438, 0.01698780059814453, 0.017581939697265625, 0.01817607879638672, 0.018770217895507812, 0.019364356994628906, 0.01995849609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 12.0, 11.0, 25.0, 15.0, 16.0, 32.0, 35.0, 50.0, 54.0, 58.0, 87.0, 130.0, 185.0, 408.0, 807.0, 2094.0, 6472.0, 25940.0, 141010.0, 570664.0, 244361.0, 41529.0, 9328.0, 2790.0, 1060.0, 474.0, 235.0, 142.0, 92.0, 85.0, 57.0, 66.0, 36.0, 35.0, 30.0, 16.0, 27.0, 17.0, 8.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.012847900390625, -0.012466073036193848, -0.012084245681762695, -0.011702418327331543, -0.01132059097290039, -0.010938763618469238, -0.010556936264038086, -0.010175108909606934, -0.009793281555175781, -0.009411454200744629, -0.009029626846313477, -0.008647799491882324, -0.008265972137451172, -0.00788414478302002, -0.007502317428588867, -0.007120490074157715, -0.0067386627197265625, -0.00635683536529541, -0.005975008010864258, -0.0055931806564331055, -0.005211353302001953, -0.004829525947570801, -0.0044476985931396484, -0.004065871238708496, -0.0036840438842773438, -0.0033022165298461914, -0.002920389175415039, -0.0025385618209838867, -0.0021567344665527344, -0.001774907112121582, -0.0013930797576904297, -0.0010112524032592773, -0.000629425048828125, -0.00024759769439697266, 0.0001342296600341797, 0.000516057014465332, 0.0008978843688964844, 0.0012797117233276367, 0.001661539077758789, 0.0020433664321899414, 0.0024251937866210938, 0.002807021141052246, 0.0031888484954833984, 0.0035706758499145508, 0.003952503204345703, 0.0043343305587768555, 0.004716157913208008, 0.00509798526763916, 0.0054798126220703125, 0.005861639976501465, 0.006243467330932617, 0.0066252946853637695, 0.007007122039794922, 0.007388949394226074, 0.0077707767486572266, 0.008152604103088379, 0.008534431457519531, 0.008916258811950684, 0.009298086166381836, 0.009679913520812988, 0.01006174087524414, 0.010443568229675293, 0.010825395584106445, 0.011207222938537598, 0.01158905029296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 6.0, 3.0, 8.0, 16.0, 12.0, 7.0, 18.0, 15.0, 30.0, 33.0, 26.0, 20.0, 20.0, 21.0, 34.0, 32.0, 37.0, 42.0, 42.0, 37.0, 47.0, 46.0, 37.0, 32.0, 31.0, 25.0, 32.0, 33.0, 22.0, 23.0, 19.0, 24.0, 20.0, 23.0, 18.0, 19.0, 11.0, 11.0, 9.0, 7.0, 7.0, 12.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00865936279296875, -0.008371472358703613, -0.008083581924438477, -0.00779569149017334, -0.007507801055908203, -0.007219910621643066, -0.00693202018737793, -0.006644129753112793, -0.006356239318847656, -0.0060683488845825195, -0.005780458450317383, -0.005492568016052246, -0.005204677581787109, -0.004916787147521973, -0.004628896713256836, -0.004341006278991699, -0.0040531158447265625, -0.0037652254104614258, -0.003477334976196289, -0.0031894445419311523, -0.0029015541076660156, -0.002613663673400879, -0.002325773239135742, -0.0020378828048706055, -0.0017499923706054688, -0.001462101936340332, -0.0011742115020751953, -0.0008863210678100586, -0.0005984306335449219, -0.00031054019927978516, -2.2649765014648438e-05, 0.0002652406692504883, 0.000553131103515625, 0.0008410215377807617, 0.0011289119720458984, 0.0014168024063110352, 0.0017046928405761719, 0.0019925832748413086, 0.0022804737091064453, 0.002568364143371582, 0.0028562545776367188, 0.0031441450119018555, 0.003432035446166992, 0.003719925880432129, 0.004007816314697266, 0.004295706748962402, 0.004583597183227539, 0.004871487617492676, 0.0051593780517578125, 0.005447268486022949, 0.005735158920288086, 0.006023049354553223, 0.006310939788818359, 0.006598830223083496, 0.006886720657348633, 0.0071746110916137695, 0.007462501525878906, 0.007750391960144043, 0.00803828239440918, 0.008326172828674316, 0.008614063262939453, 0.00890195369720459, 0.009189844131469727, 0.009477734565734863, 0.009765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 15.0, 24.0, 32.0, 62.0, 106.0, 144.0, 245.0, 518.0, 927.0, 1750.0, 3645.0, 9582.0, 30904.0, 152925.0, 613424.0, 180911.0, 34867.0, 10373.0, 4043.0, 1928.0, 962.0, 464.0, 255.0, 166.0, 95.0, 55.0, 32.0, 29.0, 14.0, 13.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0041046142578125, -0.0039656758308410645, -0.003826737403869629, -0.0036877989768981934, -0.003548860549926758, -0.0034099221229553223, -0.0032709836959838867, -0.003132045269012451, -0.0029931068420410156, -0.00285416841506958, -0.0027152299880981445, -0.002576291561126709, -0.0024373531341552734, -0.002298414707183838, -0.0021594762802124023, -0.002020537853240967, -0.0018815994262695312, -0.0017426609992980957, -0.0016037225723266602, -0.0014647841453552246, -0.001325845718383789, -0.0011869072914123535, -0.001047968864440918, -0.0009090304374694824, -0.0007700920104980469, -0.0006311535835266113, -0.0004922151565551758, -0.00035327672958374023, -0.0002143383026123047, -7.539987564086914e-05, 6.35385513305664e-05, 0.00020247697830200195, 0.0003414154052734375, 0.00048035383224487305, 0.0006192922592163086, 0.0007582306861877441, 0.0008971691131591797, 0.0010361075401306152, 0.0011750459671020508, 0.0013139843940734863, 0.0014529228210449219, 0.0015918612480163574, 0.001730799674987793, 0.0018697381019592285, 0.002008676528930664, 0.0021476149559020996, 0.002286553382873535, 0.0024254918098449707, 0.0025644302368164062, 0.002703368663787842, 0.0028423070907592773, 0.002981245517730713, 0.0031201839447021484, 0.003259122371673584, 0.0033980607986450195, 0.003536999225616455, 0.0036759376525878906, 0.003814876079559326, 0.003953814506530762, 0.004092752933502197, 0.004231691360473633, 0.004370629787445068, 0.004509568214416504, 0.0046485066413879395, 0.004787445068359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 9.0, 17.0, 22.0, 27.0, 63.0, 87.0, 129.0, 156.0, 149.0, 110.0, 67.0, 42.0, 33.0, 35.0, 21.0, 7.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022232532501220703, -0.00021508708596229553, -0.00020784884691238403, -0.00020061060786247253, -0.00019337236881256104, -0.00018613412976264954, -0.00017889589071273804, -0.00017165765166282654, -0.00016441941261291504, -0.00015718117356300354, -0.00014994293451309204, -0.00014270469546318054, -0.00013546645641326904, -0.00012822821736335754, -0.00012098997831344604, -0.00011375173926353455, -0.00010651350021362305, -9.927526116371155e-05, -9.203702211380005e-05, -8.479878306388855e-05, -7.756054401397705e-05, -7.032230496406555e-05, -6.308406591415405e-05, -5.5845826864242554e-05, -4.8607587814331055e-05, -4.1369348764419556e-05, -3.413110971450806e-05, -2.6892870664596558e-05, -1.965463161468506e-05, -1.241639256477356e-05, -5.1781535148620605e-06, 2.0600855350494385e-06, 9.298324584960938e-06, 1.6536563634872437e-05, 2.3774802684783936e-05, 3.1013041734695435e-05, 3.8251280784606934e-05, 4.548951983451843e-05, 5.272775888442993e-05, 5.996599793434143e-05, 6.720423698425293e-05, 7.444247603416443e-05, 8.168071508407593e-05, 8.891895413398743e-05, 9.615719318389893e-05, 0.00010339543223381042, 0.00011063367128372192, 0.00011787191033363342, 0.00012511014938354492, 0.00013234838843345642, 0.00013958662748336792, 0.00014682486653327942, 0.00015406310558319092, 0.00016130134463310242, 0.00016853958368301392, 0.00017577782273292542, 0.00018301606178283691, 0.0001902543008327484, 0.0001974925398826599, 0.0002047307789325714, 0.0002119690179824829, 0.0002192072570323944, 0.0002264454960823059, 0.0002336837351322174, 0.0002409219741821289]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 15.0, 13.0, 6.0, 11.0, 22.0, 21.0, 19.0, 43.0, 68.0, 118.0, 252.0, 565.0, 1274.0, 3142.0, 10643.0, 64941.0, 724934.0, 211641.0, 22096.0, 5265.0, 1882.0, 744.0, 335.0, 188.0, 95.0, 52.0, 37.0, 31.0, 20.0, 16.0, 10.0, 5.0, 6.0, 6.0, 9.0, 8.0, 0.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007289886474609375, -0.00706714391708374, -0.0068444013595581055, -0.006621658802032471, -0.006398916244506836, -0.006176173686981201, -0.005953431129455566, -0.005730688571929932, -0.005507946014404297, -0.005285203456878662, -0.005062460899353027, -0.004839718341827393, -0.004616975784301758, -0.004394233226776123, -0.004171490669250488, -0.0039487481117248535, -0.0037260055541992188, -0.003503262996673584, -0.0032805204391479492, -0.0030577778816223145, -0.0028350353240966797, -0.002612292766571045, -0.00238955020904541, -0.0021668076515197754, -0.0019440650939941406, -0.0017213225364685059, -0.001498579978942871, -0.0012758374214172363, -0.0010530948638916016, -0.0008303523063659668, -0.000607609748840332, -0.00038486719131469727, -0.0001621246337890625, 6.0617923736572266e-05, 0.00028336048126220703, 0.0005061030387878418, 0.0007288455963134766, 0.0009515881538391113, 0.001174330711364746, 0.0013970732688903809, 0.0016198158264160156, 0.0018425583839416504, 0.002065300941467285, 0.00228804349899292, 0.0025107860565185547, 0.0027335286140441895, 0.0029562711715698242, 0.003179013729095459, 0.0034017562866210938, 0.0036244988441467285, 0.0038472414016723633, 0.004069983959197998, 0.004292726516723633, 0.004515469074249268, 0.004738211631774902, 0.004960954189300537, 0.005183696746826172, 0.005406439304351807, 0.005629181861877441, 0.005851924419403076, 0.006074666976928711, 0.006297409534454346, 0.0065201520919799805, 0.006742894649505615, 0.00696563720703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 13.0, 13.0, 24.0, 20.0, 49.0, 89.0, 120.0, 128.0, 153.0, 97.0, 71.0, 53.0, 54.0, 16.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00611114501953125, -0.0059320926666259766, -0.005753040313720703, -0.00557398796081543, -0.005394935607910156, -0.005215883255004883, -0.005036830902099609, -0.004857778549194336, -0.0046787261962890625, -0.004499673843383789, -0.004320621490478516, -0.004141569137573242, -0.003962516784667969, -0.0037834644317626953, -0.003604412078857422, -0.0034253597259521484, -0.003246307373046875, -0.0030672550201416016, -0.002888202667236328, -0.0027091503143310547, -0.0025300979614257812, -0.002351045608520508, -0.0021719932556152344, -0.001992940902709961, -0.0018138885498046875, -0.001634836196899414, -0.0014557838439941406, -0.0012767314910888672, -0.0010976791381835938, -0.0009186267852783203, -0.0007395744323730469, -0.0005605220794677734, -0.0003814697265625, -0.00020241737365722656, -2.3365020751953125e-05, 0.0001556873321533203, 0.00033473968505859375, 0.0005137920379638672, 0.0006928443908691406, 0.0008718967437744141, 0.0010509490966796875, 0.001230001449584961, 0.0014090538024902344, 0.0015881061553955078, 0.0017671585083007812, 0.0019462108612060547, 0.002125263214111328, 0.0023043155670166016, 0.002483367919921875, 0.0026624202728271484, 0.002841472625732422, 0.0030205249786376953, 0.0031995773315429688, 0.003378629684448242, 0.0035576820373535156, 0.003736734390258789, 0.0039157867431640625, 0.004094839096069336, 0.004273891448974609, 0.004452943801879883, 0.004631996154785156, 0.00481104850769043, 0.004990100860595703, 0.0051691532135009766, 0.00534820556640625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 849.0, 164.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0588495172560215, -0.03818943351507187, -0.017529349774122238, 0.0031307339668273926, 0.023790817707777023, 0.04445090517401695, 0.06511098146438599, 0.08577106893062592, 0.10643115639686584, 0.12709124386310577, 0.1477513313293457, 0.16841140389442444, 0.18907149136066437, 0.2097315788269043, 0.23039165139198303, 0.25105172395706177, 0.2717118263244629, 0.2923718988895416, 0.31303200125694275, 0.3336920738220215, 0.3543521761894226, 0.37501224875450134, 0.3956723213195801, 0.4163324236869812, 0.43699249625205994, 0.45765256881713867, 0.4783126711845398, 0.49897274374961853, 0.5196328163146973, 0.5402929186820984, 0.5609530210494995, 0.5816130638122559, 0.6022731065750122, 0.6229332089424133, 0.6435932517051697, 0.6642533540725708, 0.6849134564399719, 0.705573558807373, 0.7262336015701294, 0.7468937039375305, 0.7675538063049316, 0.7882139086723328, 0.8088739514350891, 0.8295340538024902, 0.8501941561698914, 0.8708542585372925, 0.8915143013000488, 0.91217440366745, 0.9328344464302063, 0.9534945487976074, 0.9741545915603638, 0.9948146939277649, 1.015474796295166, 1.0361348390579224, 1.0567950010299683, 1.0774550437927246, 1.098115086555481, 1.1187751293182373, 1.1394352912902832, 1.1600953340530396, 1.180755376815796, 1.2014155387878418, 1.2220755815505981, 1.2427356243133545, 1.2633957862854004]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 8.0, 13.0, 21.0, 19.0, 36.0, 34.0, 42.0, 40.0, 63.0, 63.0, 67.0, 77.0, 60.0, 87.0, 66.0, 52.0, 49.0, 55.0, 42.0, 26.0, 24.0, 17.0, 12.0, 13.0, 4.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.068867027759552, -0.06716986000537872, -0.06547269225120544, -0.06377552449703217, -0.06207835674285889, -0.06038118898868561, -0.05868402123451233, -0.05698685348033905, -0.05528968572616577, -0.05359251797199249, -0.051895350217819214, -0.050198182463645935, -0.048501014709472656, -0.04680384695529938, -0.0451066792011261, -0.04340951144695282, -0.04171234369277954, -0.04001517593860626, -0.03831800818443298, -0.036620840430259705, -0.034923672676086426, -0.03322650492191315, -0.03152933716773987, -0.02983216941356659, -0.02813500165939331, -0.026437833905220032, -0.024740666151046753, -0.023043498396873474, -0.021346330642700195, -0.019649162888526917, -0.017951995134353638, -0.01625482738018036, -0.01455765962600708, -0.012860491871833801, -0.011163324117660522, -0.009466156363487244, -0.007768988609313965, -0.006071820855140686, -0.004374653100967407, -0.0026774853467941284, -0.0009803175926208496, 0.0007168501615524292, 0.002414017915725708, 0.004111185669898987, 0.005808353424072266, 0.007505521178245544, 0.009202688932418823, 0.010899856686592102, 0.01259702444076538, 0.01429419219493866, 0.01599135994911194, 0.017688527703285217, 0.019385695457458496, 0.021082863211631775, 0.022780030965805054, 0.024477198719978333, 0.02617436647415161, 0.02787153422832489, 0.02956870198249817, 0.03126586973667145, 0.03296303749084473, 0.034660205245018005, 0.036357372999191284, 0.03805454075336456, 0.03975170850753784]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 8.0, 12.0, 18.0, 22.0, 32.0, 48.0, 81.0, 113.0, 187.0, 294.0, 827.0, 2324.0, 7547.0, 450707.0, 3714472.0, 13616.0, 2527.0, 700.0, 253.0, 145.0, 104.0, 58.0, 47.0, 27.0, 24.0, 17.0, 13.0, 17.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0313720703125, -0.03036355972290039, -0.02935504913330078, -0.028346538543701172, -0.027338027954101562, -0.026329517364501953, -0.025321006774902344, -0.024312496185302734, -0.023303985595703125, -0.022295475006103516, -0.021286964416503906, -0.020278453826904297, -0.019269943237304688, -0.018261432647705078, -0.01725292205810547, -0.01624441146850586, -0.01523590087890625, -0.01422739028930664, -0.013218879699707031, -0.012210369110107422, -0.011201858520507812, -0.010193347930908203, -0.009184837341308594, -0.008176326751708984, -0.007167816162109375, -0.006159305572509766, -0.005150794982910156, -0.004142284393310547, -0.0031337738037109375, -0.002125263214111328, -0.0011167526245117188, -0.00010824203491210938, 0.0009002685546875, 0.0019087791442871094, 0.0029172897338867188, 0.003925800323486328, 0.0049343109130859375, 0.005942821502685547, 0.006951332092285156, 0.007959842681884766, 0.008968353271484375, 0.009976863861083984, 0.010985374450683594, 0.011993885040283203, 0.013002395629882812, 0.014010906219482422, 0.015019416809082031, 0.01602792739868164, 0.01703643798828125, 0.01804494857788086, 0.01905345916748047, 0.020061969757080078, 0.021070480346679688, 0.022078990936279297, 0.023087501525878906, 0.024096012115478516, 0.025104522705078125, 0.026113033294677734, 0.027121543884277344, 0.028130054473876953, 0.029138565063476562, 0.030147075653076172, 0.03115558624267578, 0.03216409683227539, 0.033172607421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 51.0, 131.0, 219.0, 224.0, 202.0, 105.0, 38.0, 13.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183563232421875, -0.017709732055664062, -0.017063140869140625, -0.016416549682617188, -0.01576995849609375, -0.015123367309570312, -0.014476776123046875, -0.013830184936523438, -0.01318359375, -0.012537002563476562, -0.011890411376953125, -0.011243820190429688, -0.01059722900390625, -0.009950637817382812, -0.009304046630859375, -0.008657455444335938, -0.0080108642578125, -0.0073642730712890625, -0.006717681884765625, -0.0060710906982421875, -0.00542449951171875, -0.0047779083251953125, -0.004131317138671875, -0.0034847259521484375, -0.002838134765625, -0.0021915435791015625, -0.001544952392578125, -0.0008983612060546875, -0.00025177001953125, 0.0003948211669921875, 0.001041412353515625, 0.0016880035400390625, 0.0023345947265625, 0.0029811859130859375, 0.003627777099609375, 0.0042743682861328125, 0.00492095947265625, 0.0055675506591796875, 0.006214141845703125, 0.0068607330322265625, 0.00750732421875, 0.008153915405273438, 0.008800506591796875, 0.009447097778320312, 0.01009368896484375, 0.010740280151367188, 0.011386871337890625, 0.012033462524414062, 0.0126800537109375, 0.013326644897460938, 0.013973236083984375, 0.014619827270507812, 0.01526641845703125, 0.015913009643554688, 0.016559600830078125, 0.017206192016601562, 0.017852783203125, 0.018499374389648438, 0.019145965576171875, 0.019792556762695312, 0.02043914794921875, 0.021085739135742188, 0.021732330322265625, 0.022378921508789062, 0.0230255126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 10.0, 19.0, 32.0, 42.0, 87.0, 137.0, 234.0, 378.0, 803.0, 1704.0, 4691.0, 21278.0, 228531.0, 3821579.0, 95877.0, 13028.0, 3289.0, 1235.0, 565.0, 282.0, 175.0, 94.0, 66.0, 39.0, 31.0, 30.0, 6.0, 4.0, 6.0, 12.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013946533203125, -0.013486981391906738, -0.013027429580688477, -0.012567877769470215, -0.012108325958251953, -0.011648774147033691, -0.01118922233581543, -0.010729670524597168, -0.010270118713378906, -0.009810566902160645, -0.009351015090942383, -0.008891463279724121, -0.00843191146850586, -0.007972359657287598, -0.007512807846069336, -0.007053256034851074, -0.0065937042236328125, -0.006134152412414551, -0.005674600601196289, -0.005215048789978027, -0.004755496978759766, -0.004295945167541504, -0.003836393356323242, -0.0033768415451049805, -0.0029172897338867188, -0.002457737922668457, -0.0019981861114501953, -0.0015386343002319336, -0.0010790824890136719, -0.0006195306777954102, -0.00015997886657714844, 0.0002995729446411133, 0.000759124755859375, 0.0012186765670776367, 0.0016782283782958984, 0.00213778018951416, 0.002597332000732422, 0.0030568838119506836, 0.0035164356231689453, 0.003975987434387207, 0.004435539245605469, 0.0048950910568237305, 0.005354642868041992, 0.005814194679260254, 0.006273746490478516, 0.006733298301696777, 0.007192850112915039, 0.007652401924133301, 0.008111953735351562, 0.008571505546569824, 0.009031057357788086, 0.009490609169006348, 0.00995016098022461, 0.010409712791442871, 0.010869264602661133, 0.011328816413879395, 0.011788368225097656, 0.012247920036315918, 0.01270747184753418, 0.013167023658752441, 0.013626575469970703, 0.014086127281188965, 0.014545679092407227, 0.015005230903625488, 0.01546478271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 10.0, 19.0, 22.0, 42.0, 80.0, 147.0, 826.0, 1896.0, 529.0, 208.0, 95.0, 54.0, 54.0, 27.0, 17.0, 11.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01201629638671875, -0.011710822582244873, -0.011405348777770996, -0.01109987497329712, -0.010794401168823242, -0.010488927364349365, -0.010183453559875488, -0.009877979755401611, -0.009572505950927734, -0.009267032146453857, -0.00896155834197998, -0.008656084537506104, -0.008350610733032227, -0.00804513692855835, -0.007739663124084473, -0.007434189319610596, -0.007128715515136719, -0.006823241710662842, -0.006517767906188965, -0.006212294101715088, -0.005906820297241211, -0.005601346492767334, -0.005295872688293457, -0.00499039888381958, -0.004684925079345703, -0.004379451274871826, -0.004073977470397949, -0.0037685036659240723, -0.0034630298614501953, -0.0031575560569763184, -0.0028520822525024414, -0.0025466084480285645, -0.0022411346435546875, -0.0019356608390808105, -0.0016301870346069336, -0.0013247132301330566, -0.0010192394256591797, -0.0007137656211853027, -0.0004082918167114258, -0.00010281801223754883, 0.00020265579223632812, 0.0005081295967102051, 0.000813603401184082, 0.001119077205657959, 0.001424551010131836, 0.0017300248146057129, 0.00203549861907959, 0.002340972423553467, 0.0026464462280273438, 0.0029519200325012207, 0.0032573938369750977, 0.0035628676414489746, 0.0038683414459228516, 0.0041738152503967285, 0.0044792890548706055, 0.004784762859344482, 0.005090236663818359, 0.005395710468292236, 0.005701184272766113, 0.00600665807723999, 0.006312131881713867, 0.006617605686187744, 0.006923079490661621, 0.007228553295135498, 0.007534027099609375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 24.0, 344.0, 530.0, 89.0, 17.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2103511542081833, -0.20597201585769653, -0.20159286260604858, -0.19721372425556183, -0.19283458590507507, -0.18845544755458832, -0.18407630920410156, -0.1796971559524536, -0.17531801760196686, -0.1709388792514801, -0.16655972599983215, -0.1621805876493454, -0.15780144929885864, -0.1534223109483719, -0.14904317259788513, -0.14466401934623718, -0.14028488099575043, -0.13590574264526367, -0.13152658939361572, -0.12714745104312897, -0.12276831269264221, -0.11838917434215546, -0.1140100285410881, -0.10963088274002075, -0.105251744389534, -0.10087260603904724, -0.09649346023797989, -0.09211431443691254, -0.08773517608642578, -0.08335603773593903, -0.07897689193487167, -0.07459774613380432, -0.07021862268447876, -0.065839484333992, -0.06146033853292465, -0.0570811964571476, -0.052702054381370544, -0.04832291230559349, -0.04394377022981644, -0.03956462815403938, -0.03518548607826233, -0.030806344002485275, -0.02642720192670822, -0.022048059850931168, -0.017668917775154114, -0.01328977569937706, -0.008910633623600006, -0.004531491547822952, -0.00015234947204589844, 0.004226792603731155, 0.00860593467950821, 0.012985076755285263, 0.017364218831062317, 0.02174336090683937, 0.026122502982616425, 0.03050164505839348, 0.03488078713417053, 0.039259929209947586, 0.04363907128572464, 0.048018213361501694, 0.05239735543727875, 0.0567764975130558, 0.061155639588832855, 0.06553478538990021, 0.06991392374038696]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 9.0, 5.0, 9.0, 11.0, 13.0, 8.0, 18.0, 11.0, 28.0, 23.0, 28.0, 29.0, 18.0, 26.0, 32.0, 25.0, 34.0, 37.0, 31.0, 46.0, 34.0, 37.0, 43.0, 36.0, 33.0, 34.0, 34.0, 36.0, 33.0, 35.0, 34.0, 29.0, 20.0, 20.0, 22.0, 13.0, 16.0, 8.0, 14.0, 3.0, 8.0, 5.0, 3.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.020189642906188965, -0.01961723156273365, -0.019044820219278336, -0.01847240887582302, -0.017899997532367706, -0.01732758618891239, -0.016755174845457077, -0.016182763502001762, -0.015610352158546448, -0.015037940815091133, -0.014465529471635818, -0.013893118128180504, -0.01332070678472519, -0.012748295441269875, -0.01217588409781456, -0.011603472754359245, -0.01103106141090393, -0.010458650067448616, -0.009886238723993301, -0.009313827380537987, -0.008741416037082672, -0.008169004693627357, -0.007596593350172043, -0.007024182006716728, -0.006451770663261414, -0.005879359319806099, -0.005306947976350784, -0.00473453663289547, -0.004162125289440155, -0.0035897139459848404, -0.0030173026025295258, -0.002444891259074211, -0.0018724799156188965, -0.0013000685721635818, -0.0007276572287082672, -0.00015524588525295258, 0.00041716545820236206, 0.0009895768016576767, 0.0015619881451129913, 0.002134399488568306, 0.0027068108320236206, 0.0032792221754789352, 0.00385163351893425, 0.0044240448623895645, 0.004996456205844879, 0.005568867549300194, 0.006141278892755508, 0.006713690236210823, 0.007286101579666138, 0.007858512923121452, 0.008430924266576767, 0.009003335610032082, 0.009575746953487396, 0.010148158296942711, 0.010720569640398026, 0.01129298098385334, 0.011865392327308655, 0.01243780367076397, 0.013010215014219284, 0.013582626357674599, 0.014155037701129913, 0.014727449044585228, 0.015299860388040543, 0.015872271731495857, 0.016444683074951172]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 8.0, 7.0, 13.0, 17.0, 26.0, 39.0, 42.0, 49.0, 102.0, 129.0, 191.0, 275.0, 334.0, 524.0, 768.0, 1402.0, 3965.0, 30919.0, 661196.0, 326751.0, 15573.0, 2771.0, 1077.0, 697.0, 466.0, 318.0, 222.0, 201.0, 119.0, 99.0, 66.0, 44.0, 27.0, 22.0, 24.0, 19.0, 9.0, 9.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0207366943359375, -0.020064830780029297, -0.019392967224121094, -0.01872110366821289, -0.018049240112304688, -0.017377376556396484, -0.01670551300048828, -0.016033649444580078, -0.015361785888671875, -0.014689922332763672, -0.014018058776855469, -0.013346195220947266, -0.012674331665039062, -0.01200246810913086, -0.011330604553222656, -0.010658740997314453, -0.00998687744140625, -0.009315013885498047, -0.008643150329589844, -0.00797128677368164, -0.0072994232177734375, -0.006627559661865234, -0.005955696105957031, -0.005283832550048828, -0.004611968994140625, -0.003940105438232422, -0.0032682418823242188, -0.0025963783264160156, -0.0019245147705078125, -0.0012526512145996094, -0.0005807876586914062, 9.107589721679688e-05, 0.000762939453125, 0.0014348030090332031, 0.0021066665649414062, 0.0027785301208496094, 0.0034503936767578125, 0.004122257232666016, 0.004794120788574219, 0.005465984344482422, 0.006137847900390625, 0.006809711456298828, 0.007481575012207031, 0.008153438568115234, 0.008825302124023438, 0.00949716567993164, 0.010169029235839844, 0.010840892791748047, 0.01151275634765625, 0.012184619903564453, 0.012856483459472656, 0.01352834701538086, 0.014200210571289062, 0.014872074127197266, 0.015543937683105469, 0.016215801239013672, 0.016887664794921875, 0.017559528350830078, 0.01823139190673828, 0.018903255462646484, 0.019575119018554688, 0.02024698257446289, 0.020918846130371094, 0.021590709686279297, 0.0222625732421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 50.0, 126.0, 210.0, 233.0, 200.0, 104.0, 39.0, 17.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01898193359375, -0.018336772918701172, -0.017691612243652344, -0.017046451568603516, -0.016401290893554688, -0.01575613021850586, -0.015110969543457031, -0.014465808868408203, -0.013820648193359375, -0.013175487518310547, -0.012530326843261719, -0.01188516616821289, -0.011240005493164062, -0.010594844818115234, -0.009949684143066406, -0.009304523468017578, -0.00865936279296875, -0.008014202117919922, -0.007369041442871094, -0.006723880767822266, -0.0060787200927734375, -0.005433559417724609, -0.004788398742675781, -0.004143238067626953, -0.003498077392578125, -0.002852916717529297, -0.0022077560424804688, -0.0015625953674316406, -0.0009174346923828125, -0.0002722740173339844, 0.00037288665771484375, 0.0010180473327636719, 0.0016632080078125, 0.002308368682861328, 0.0029535293579101562, 0.0035986900329589844, 0.0042438507080078125, 0.004889011383056641, 0.005534172058105469, 0.006179332733154297, 0.006824493408203125, 0.007469654083251953, 0.008114814758300781, 0.00875997543334961, 0.009405136108398438, 0.010050296783447266, 0.010695457458496094, 0.011340618133544922, 0.01198577880859375, 0.012630939483642578, 0.013276100158691406, 0.013921260833740234, 0.014566421508789062, 0.01521158218383789, 0.01585674285888672, 0.016501903533935547, 0.017147064208984375, 0.017792224884033203, 0.01843738555908203, 0.01908254623413086, 0.019727706909179688, 0.020372867584228516, 0.021018028259277344, 0.021663188934326172, 0.022308349609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 7.0, 9.0, 11.0, 20.0, 23.0, 36.0, 32.0, 37.0, 41.0, 59.0, 82.0, 109.0, 170.0, 296.0, 653.0, 1836.0, 7421.0, 42044.0, 333350.0, 558462.0, 85584.0, 13173.0, 3052.0, 934.0, 356.0, 202.0, 118.0, 73.0, 45.0, 39.0, 48.0, 44.0, 22.0, 24.0, 16.0, 14.0, 13.0, 17.0, 10.0, 12.0, 9.0, 8.0, 8.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.012140393257141113, -0.011738061904907227, -0.01133573055267334, -0.010933399200439453, -0.010531067848205566, -0.01012873649597168, -0.009726405143737793, -0.009324073791503906, -0.00892174243927002, -0.008519411087036133, -0.008117079734802246, -0.007714748382568359, -0.007312417030334473, -0.006910085678100586, -0.006507754325866699, -0.0061054229736328125, -0.005703091621398926, -0.005300760269165039, -0.004898428916931152, -0.004496097564697266, -0.004093766212463379, -0.003691434860229492, -0.0032891035079956055, -0.0028867721557617188, -0.002484440803527832, -0.0020821094512939453, -0.0016797780990600586, -0.0012774467468261719, -0.0008751153945922852, -0.00047278404235839844, -7.045269012451172e-05, 0.000331878662109375, 0.0007342100143432617, 0.0011365413665771484, 0.0015388727188110352, 0.0019412040710449219, 0.0023435354232788086, 0.0027458667755126953, 0.003148198127746582, 0.0035505294799804688, 0.0039528608322143555, 0.004355192184448242, 0.004757523536682129, 0.005159854888916016, 0.005562186241149902, 0.005964517593383789, 0.006366848945617676, 0.0067691802978515625, 0.007171511650085449, 0.007573843002319336, 0.007976174354553223, 0.00837850570678711, 0.008780837059020996, 0.009183168411254883, 0.00958549976348877, 0.009987831115722656, 0.010390162467956543, 0.01079249382019043, 0.011194825172424316, 0.011597156524658203, 0.01199948787689209, 0.012401819229125977, 0.012804150581359863, 0.01320648193359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 8.0, 7.0, 7.0, 8.0, 3.0, 18.0, 22.0, 17.0, 24.0, 17.0, 36.0, 37.0, 40.0, 30.0, 41.0, 55.0, 46.0, 40.0, 45.0, 45.0, 53.0, 44.0, 38.0, 44.0, 40.0, 49.0, 27.0, 28.0, 31.0, 20.0, 9.0, 19.0, 6.0, 10.0, 6.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0129241943359375, -0.012560725212097168, -0.012197256088256836, -0.011833786964416504, -0.011470317840576172, -0.01110684871673584, -0.010743379592895508, -0.010379910469055176, -0.010016441345214844, -0.009652972221374512, -0.00928950309753418, -0.008926033973693848, -0.008562564849853516, -0.008199095726013184, -0.007835626602172852, -0.0074721574783325195, -0.0071086883544921875, -0.0067452192306518555, -0.0063817501068115234, -0.006018280982971191, -0.005654811859130859, -0.005291342735290527, -0.004927873611450195, -0.004564404487609863, -0.004200935363769531, -0.0038374662399291992, -0.003473997116088867, -0.003110527992248535, -0.002747058868408203, -0.002383589744567871, -0.002020120620727539, -0.001656651496887207, -0.001293182373046875, -0.000929713249206543, -0.0005662441253662109, -0.0002027750015258789, 0.00016069412231445312, 0.0005241632461547852, 0.0008876323699951172, 0.0012511014938354492, 0.0016145706176757812, 0.0019780397415161133, 0.0023415088653564453, 0.0027049779891967773, 0.0030684471130371094, 0.0034319162368774414, 0.0037953853607177734, 0.0041588544845581055, 0.0045223236083984375, 0.0048857927322387695, 0.0052492618560791016, 0.005612730979919434, 0.005976200103759766, 0.006339669227600098, 0.00670313835144043, 0.007066607475280762, 0.007430076599121094, 0.007793545722961426, 0.008157014846801758, 0.00852048397064209, 0.008883953094482422, 0.009247422218322754, 0.009610891342163086, 0.009974360466003418, 0.01033782958984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 17.0, 5.0, 16.0, 25.0, 25.0, 51.0, 85.0, 121.0, 208.0, 361.0, 672.0, 1258.0, 2616.0, 5682.0, 13857.0, 37808.0, 134355.0, 491130.0, 260344.0, 63382.0, 20932.0, 8192.0, 3626.0, 1738.0, 893.0, 468.0, 278.0, 137.0, 107.0, 47.0, 29.0, 21.0, 24.0, 13.0, 11.0, 5.0, 7.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030117034912109375, -0.0029167532920837402, -0.002821803092956543, -0.0027268528938293457, -0.0026319026947021484, -0.002536952495574951, -0.002442002296447754, -0.0023470520973205566, -0.0022521018981933594, -0.002157151699066162, -0.002062201499938965, -0.0019672513008117676, -0.0018723011016845703, -0.001777350902557373, -0.0016824007034301758, -0.0015874505043029785, -0.0014925003051757812, -0.001397550106048584, -0.0013025999069213867, -0.0012076497077941895, -0.0011126995086669922, -0.001017749309539795, -0.0009227991104125977, -0.0008278489112854004, -0.0007328987121582031, -0.0006379485130310059, -0.0005429983139038086, -0.00044804811477661133, -0.00035309791564941406, -0.0002581477165222168, -0.00016319751739501953, -6.824731826782227e-05, 2.6702880859375e-05, 0.00012165307998657227, 0.00021660327911376953, 0.0003115534782409668, 0.00040650367736816406, 0.0005014538764953613, 0.0005964040756225586, 0.0006913542747497559, 0.0007863044738769531, 0.0008812546730041504, 0.0009762048721313477, 0.001071155071258545, 0.0011661052703857422, 0.0012610554695129395, 0.0013560056686401367, 0.001450955867767334, 0.0015459060668945312, 0.0016408562660217285, 0.0017358064651489258, 0.001830756664276123, 0.0019257068634033203, 0.0020206570625305176, 0.002115607261657715, 0.002210557460784912, 0.0023055076599121094, 0.0024004578590393066, 0.002495408058166504, 0.002590358257293701, 0.0026853084564208984, 0.0027802586555480957, 0.002875208854675293, 0.0029701590538024902, 0.0030651092529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 12.0, 15.0, 15.0, 31.0, 45.0, 51.0, 59.0, 88.0, 91.0, 118.0, 102.0, 91.0, 64.0, 75.0, 46.0, 45.0, 18.0, 12.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015211105346679688, -0.00014808028936386108, -0.0001440495252609253, -0.0001400187611579895, -0.0001359879970550537, -0.00013195723295211792, -0.00012792646884918213, -0.00012389570474624634, -0.00011986494064331055, -0.00011583417654037476, -0.00011180341243743896, -0.00010777264833450317, -0.00010374188423156738, -9.971112012863159e-05, -9.56803560256958e-05, -9.164959192276001e-05, -8.761882781982422e-05, -8.358806371688843e-05, -7.955729961395264e-05, -7.552653551101685e-05, -7.149577140808105e-05, -6.746500730514526e-05, -6.343424320220947e-05, -5.940347909927368e-05, -5.537271499633789e-05, -5.13419508934021e-05, -4.731118679046631e-05, -4.328042268753052e-05, -3.9249658584594727e-05, -3.5218894481658936e-05, -3.1188130378723145e-05, -2.7157366275787354e-05, -2.3126602172851562e-05, -1.909583806991577e-05, -1.506507396697998e-05, -1.103430986404419e-05, -7.0035457611083984e-06, -2.9727816581726074e-06, 1.0579824447631836e-06, 5.088746547698975e-06, 9.119510650634766e-06, 1.3150274753570557e-05, 1.7181038856506348e-05, 2.121180295944214e-05, 2.524256706237793e-05, 2.927333116531372e-05, 3.330409526824951e-05, 3.73348593711853e-05, 4.1365623474121094e-05, 4.5396387577056885e-05, 4.9427151679992676e-05, 5.345791578292847e-05, 5.748867988586426e-05, 6.151944398880005e-05, 6.555020809173584e-05, 6.958097219467163e-05, 7.361173629760742e-05, 7.764250040054321e-05, 8.1673264503479e-05, 8.57040286064148e-05, 8.973479270935059e-05, 9.376555681228638e-05, 9.779632091522217e-05, 0.00010182708501815796, 0.00010585784912109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 14.0, 13.0, 14.0, 28.0, 66.0, 154.0, 386.0, 1142.0, 4479.0, 28371.0, 530886.0, 451226.0, 25810.0, 4219.0, 1042.0, 391.0, 161.0, 66.0, 26.0, 17.0, 14.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00800323486328125, -0.007760524749755859, -0.007517814636230469, -0.007275104522705078, -0.0070323944091796875, -0.006789684295654297, -0.006546974182128906, -0.006304264068603516, -0.006061553955078125, -0.005818843841552734, -0.005576133728027344, -0.005333423614501953, -0.0050907135009765625, -0.004848003387451172, -0.004605293273925781, -0.004362583160400391, -0.004119873046875, -0.0038771629333496094, -0.0036344528198242188, -0.003391742706298828, -0.0031490325927734375, -0.002906322479248047, -0.0026636123657226562, -0.0024209022521972656, -0.002178192138671875, -0.0019354820251464844, -0.0016927719116210938, -0.0014500617980957031, -0.0012073516845703125, -0.0009646415710449219, -0.0007219314575195312, -0.0004792213439941406, -0.00023651123046875, 6.198883056640625e-06, 0.00024890899658203125, 0.0004916191101074219, 0.0007343292236328125, 0.0009770393371582031, 0.0012197494506835938, 0.0014624595642089844, 0.001705169677734375, 0.0019478797912597656, 0.0021905899047851562, 0.002433300018310547, 0.0026760101318359375, 0.002918720245361328, 0.0031614303588867188, 0.0034041404724121094, 0.0036468505859375, 0.0038895606994628906, 0.004132270812988281, 0.004374980926513672, 0.0046176910400390625, 0.004860401153564453, 0.005103111267089844, 0.005345821380615234, 0.005588531494140625, 0.005831241607666016, 0.006073951721191406, 0.006316661834716797, 0.0065593719482421875, 0.006802082061767578, 0.007044792175292969, 0.007287502288818359, 0.00753021240234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 0.0, 7.0, 2.0, 3.0, 5.0, 12.0, 12.0, 15.0, 27.0, 37.0, 29.0, 83.0, 85.0, 146.0, 129.0, 145.0, 82.0, 58.0, 31.0, 18.0, 15.0, 12.0, 17.0, 11.0, 4.0, 3.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005512237548828125, -0.005355894565582275, -0.005199551582336426, -0.005043208599090576, -0.0048868656158447266, -0.004730522632598877, -0.004574179649353027, -0.004417836666107178, -0.004261493682861328, -0.0041051506996154785, -0.003948807716369629, -0.0037924647331237793, -0.0036361217498779297, -0.00347977876663208, -0.0033234357833862305, -0.003167092800140381, -0.0030107498168945312, -0.0028544068336486816, -0.002698063850402832, -0.0025417208671569824, -0.002385377883911133, -0.002229034900665283, -0.0020726919174194336, -0.001916348934173584, -0.0017600059509277344, -0.0016036629676818848, -0.0014473199844360352, -0.0012909770011901855, -0.001134634017944336, -0.0009782910346984863, -0.0008219480514526367, -0.0006656050682067871, -0.0005092620849609375, -0.0003529191017150879, -0.00019657611846923828, -4.023313522338867e-05, 0.00011610984802246094, 0.00027245283126831055, 0.00042879581451416016, 0.0005851387977600098, 0.0007414817810058594, 0.000897824764251709, 0.0010541677474975586, 0.0012105107307434082, 0.0013668537139892578, 0.0015231966972351074, 0.001679539680480957, 0.0018358826637268066, 0.0019922256469726562, 0.002148568630218506, 0.0023049116134643555, 0.002461254596710205, 0.0026175975799560547, 0.0027739405632019043, 0.002930283546447754, 0.0030866265296936035, 0.003242969512939453, 0.0033993124961853027, 0.0035556554794311523, 0.003711998462677002, 0.0038683414459228516, 0.004024684429168701, 0.004181027412414551, 0.0043373703956604, 0.00449371337890625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 16.0, 975.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07159274816513062, -0.05123282968997955, -0.03087291121482849, -0.01051299273967743, 0.009846925735473633, 0.030206844210624695, 0.05056676268577576, 0.07092668116092682, 0.09128659963607788, 0.11164651811122894, 0.13200643658638, 0.15236635506153107, 0.17272627353668213, 0.1930861920118332, 0.21344611048698425, 0.23380602896213531, 0.2541659474372864, 0.27452588081359863, 0.2948857843875885, 0.31524568796157837, 0.3356056213378906, 0.3559655547142029, 0.37632545828819275, 0.3966853618621826, 0.4170452952384949, 0.43740522861480713, 0.457765132188797, 0.47812503576278687, 0.4984849691390991, 0.5188449025154114, 0.5392048358917236, 0.5595647096633911, 0.5799245834350586, 0.6002845168113708, 0.6206444501876831, 0.6410043239593506, 0.6613642573356628, 0.6817241907119751, 0.7020840644836426, 0.7224439978599548, 0.7428039312362671, 0.7631638646125793, 0.7835237979888916, 0.8038836717605591, 0.8242436051368713, 0.8446035385131836, 0.8649634122848511, 0.8853233456611633, 0.9056832790374756, 0.9260432124137878, 0.9464031457901001, 0.9667630195617676, 0.9871229529380798, 1.007482886314392, 1.0278427600860596, 1.0482027530670166, 1.068562626838684, 1.0889225006103516, 1.1092824935913086, 1.129642367362976, 1.1500022411346436, 1.1703622341156006, 1.190722107887268, 1.211082100868225, 1.2314419746398926]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 14.0, 12.0, 22.0, 15.0, 27.0, 39.0, 36.0, 50.0, 58.0, 56.0, 57.0, 49.0, 64.0, 72.0, 59.0, 65.0, 50.0, 45.0, 46.0, 33.0, 32.0, 28.0, 13.0, 18.0, 10.0, 13.0, 9.0, 2.0, 4.0, 0.0, 4.0, 3.0], "bins": [-0.07052725553512573, -0.0689583271741867, -0.06738939881324768, -0.06582047045230865, -0.06425154209136963, -0.06268260627985, -0.06111367791891098, -0.059544749557971954, -0.05797582119703293, -0.0564068928360939, -0.05483796447515488, -0.05326903238892555, -0.051700104027986526, -0.0501311756670475, -0.048562243580818176, -0.04699331521987915, -0.045424386858940125, -0.0438554584980011, -0.04228653013706207, -0.04071759805083275, -0.03914866968989372, -0.0375797413289547, -0.03601080924272537, -0.034441880881786346, -0.03287295252084732, -0.031304024159908295, -0.02973509393632412, -0.028166163712739944, -0.02659723535180092, -0.025028306990861893, -0.023459376767277718, -0.021890446543693542, -0.020321518182754517, -0.01875258982181549, -0.017183659598231316, -0.015614730305969715, -0.014045801013708115, -0.012476871721446514, -0.010907942429184914, -0.009339013136923313, -0.007770083844661713, -0.006201154552400112, -0.004632225260138512, -0.003063295967876911, -0.0014943666756153107, 7.456261664628983e-05, 0.0016434919089078903, 0.003212421201169491, 0.004781350493431091, 0.006350279785692692, 0.007919209077954292, 0.009488138370215893, 0.011057067662477493, 0.012625996954739094, 0.014194926247000694, 0.01576385647058487, 0.017332784831523895, 0.01890171319246292, 0.020470643416047096, 0.02203957363963127, 0.023608502000570297, 0.025177430361509323, 0.026746360585093498, 0.028315290808677673, 0.0298842191696167]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 14.0, 6.0, 9.0, 12.0, 15.0, 32.0, 51.0, 77.0, 150.0, 255.0, 723.0, 2450.0, 10498.0, 4043204.0, 129779.0, 5194.0, 1108.0, 299.0, 153.0, 70.0, 44.0, 38.0, 25.0, 16.0, 14.0, 11.0, 3.0, 3.0, 6.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0302276611328125, -0.02905583381652832, -0.02788400650024414, -0.02671217918395996, -0.02554035186767578, -0.0243685245513916, -0.023196697235107422, -0.022024869918823242, -0.020853042602539062, -0.019681215286254883, -0.018509387969970703, -0.017337560653686523, -0.016165733337402344, -0.014993906021118164, -0.013822078704833984, -0.012650251388549805, -0.011478424072265625, -0.010306596755981445, -0.009134769439697266, -0.007962942123413086, -0.006791114807128906, -0.0056192874908447266, -0.004447460174560547, -0.003275632858276367, -0.0021038055419921875, -0.0009319782257080078, 0.00023984909057617188, 0.0014116764068603516, 0.0025835037231445312, 0.003755331039428711, 0.004927158355712891, 0.00609898567199707, 0.00727081298828125, 0.00844264030456543, 0.00961446762084961, 0.010786294937133789, 0.011958122253417969, 0.013129949569702148, 0.014301776885986328, 0.015473604202270508, 0.016645431518554688, 0.017817258834838867, 0.018989086151123047, 0.020160913467407227, 0.021332740783691406, 0.022504568099975586, 0.023676395416259766, 0.024848222732543945, 0.026020050048828125, 0.027191877365112305, 0.028363704681396484, 0.029535531997680664, 0.030707359313964844, 0.03187918663024902, 0.0330510139465332, 0.03422284126281738, 0.03539466857910156, 0.03656649589538574, 0.03773832321166992, 0.0389101505279541, 0.04008197784423828, 0.04125380516052246, 0.04242563247680664, 0.04359745979309082, 0.044769287109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 18.0, 58.0, 140.0, 216.0, 226.0, 183.0, 101.0, 32.0, 17.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.018218994140625, -0.01759791374206543, -0.01697683334350586, -0.01635575294494629, -0.01573467254638672, -0.015113592147827148, -0.014492511749267578, -0.013871431350708008, -0.013250350952148438, -0.012629270553588867, -0.012008190155029297, -0.011387109756469727, -0.010766029357910156, -0.010144948959350586, -0.009523868560791016, -0.008902788162231445, -0.008281707763671875, -0.007660627365112305, -0.007039546966552734, -0.006418466567993164, -0.005797386169433594, -0.0051763057708740234, -0.004555225372314453, -0.003934144973754883, -0.0033130645751953125, -0.002691984176635742, -0.002070903778076172, -0.0014498233795166016, -0.0008287429809570312, -0.00020766258239746094, 0.0004134178161621094, 0.0010344982147216797, 0.00165557861328125, 0.0022766590118408203, 0.0028977394104003906, 0.003518819808959961, 0.004139900207519531, 0.0047609806060791016, 0.005382061004638672, 0.006003141403198242, 0.0066242218017578125, 0.007245302200317383, 0.007866382598876953, 0.008487462997436523, 0.009108543395996094, 0.009729623794555664, 0.010350704193115234, 0.010971784591674805, 0.011592864990234375, 0.012213945388793945, 0.012835025787353516, 0.013456106185913086, 0.014077186584472656, 0.014698266983032227, 0.015319347381591797, 0.015940427780151367, 0.016561508178710938, 0.017182588577270508, 0.017803668975830078, 0.01842474937438965, 0.01904582977294922, 0.01966691017150879, 0.02028799057006836, 0.02090907096862793, 0.0215301513671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 9.0, 20.0, 29.0, 44.0, 60.0, 64.0, 72.0, 97.0, 146.0, 193.0, 268.0, 450.0, 754.0, 1466.0, 3598.0, 11160.0, 48682.0, 619342.0, 3388379.0, 91343.0, 18058.0, 5362.0, 2078.0, 908.0, 523.0, 319.0, 224.0, 167.0, 108.0, 79.0, 60.0, 51.0, 30.0, 25.0, 14.0, 19.0, 16.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01117706298828125, -0.010849952697753906, -0.010522842407226562, -0.010195732116699219, -0.009868621826171875, -0.009541511535644531, -0.009214401245117188, -0.008887290954589844, -0.0085601806640625, -0.008233070373535156, -0.007905960083007812, -0.007578849792480469, -0.007251739501953125, -0.006924629211425781, -0.0065975189208984375, -0.006270408630371094, -0.00594329833984375, -0.005616188049316406, -0.0052890777587890625, -0.004961967468261719, -0.004634857177734375, -0.004307746887207031, -0.0039806365966796875, -0.0036535263061523438, -0.003326416015625, -0.0029993057250976562, -0.0026721954345703125, -0.0023450851440429688, -0.002017974853515625, -0.0016908645629882812, -0.0013637542724609375, -0.0010366439819335938, -0.00070953369140625, -0.00038242340087890625, -5.53131103515625e-05, 0.00027179718017578125, 0.000598907470703125, 0.0009260177612304688, 0.0012531280517578125, 0.0015802383422851562, 0.0019073486328125, 0.0022344589233398438, 0.0025615692138671875, 0.0028886795043945312, 0.003215789794921875, 0.0035429000854492188, 0.0038700103759765625, 0.004197120666503906, 0.00452423095703125, 0.004851341247558594, 0.0051784515380859375, 0.005505561828613281, 0.005832672119140625, 0.006159782409667969, 0.0064868927001953125, 0.006814002990722656, 0.00714111328125, 0.007468223571777344, 0.0077953338623046875, 0.008122444152832031, 0.008449554443359375, 0.008776664733886719, 0.009103775024414062, 0.009430885314941406, 0.00975799560546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 32.0, 48.0, 97.0, 300.0, 1977.0, 1125.0, 243.0, 99.0, 51.0, 30.0, 20.0, 10.0, 5.0, 7.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0127410888671875, -0.012395262718200684, -0.012049436569213867, -0.01170361042022705, -0.011357784271240234, -0.011011958122253418, -0.010666131973266602, -0.010320305824279785, -0.009974479675292969, -0.009628653526306152, -0.009282827377319336, -0.00893700122833252, -0.008591175079345703, -0.008245348930358887, -0.00789952278137207, -0.007553696632385254, -0.0072078704833984375, -0.006862044334411621, -0.006516218185424805, -0.006170392036437988, -0.005824565887451172, -0.0054787397384643555, -0.005132913589477539, -0.004787087440490723, -0.004441261291503906, -0.00409543514251709, -0.0037496089935302734, -0.003403782844543457, -0.0030579566955566406, -0.0027121305465698242, -0.002366304397583008, -0.0020204782485961914, -0.001674652099609375, -0.0013288259506225586, -0.0009829998016357422, -0.0006371736526489258, -0.0002913475036621094, 5.447864532470703e-05, 0.00040030479431152344, 0.0007461309432983398, 0.0010919570922851562, 0.0014377832412719727, 0.001783609390258789, 0.0021294355392456055, 0.002475261688232422, 0.0028210878372192383, 0.0031669139862060547, 0.003512740135192871, 0.0038585662841796875, 0.004204392433166504, 0.00455021858215332, 0.004896044731140137, 0.005241870880126953, 0.0055876970291137695, 0.005933523178100586, 0.006279349327087402, 0.006625175476074219, 0.006971001625061035, 0.0073168277740478516, 0.007662653923034668, 0.008008480072021484, 0.0083543062210083, 0.008700132369995117, 0.009045958518981934, 0.00939178466796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 11.0, 41.0, 112.0, 281.0, 296.0, 156.0, 66.0, 22.0, 11.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08237071335315704, -0.08074934780597687, -0.07912798225879669, -0.07750660926103592, -0.07588524371385574, -0.07426387816667557, -0.07264251261949539, -0.07102114707231522, -0.06939977407455444, -0.06777840852737427, -0.06615704298019409, -0.06453566998243332, -0.06291430443525314, -0.06129293888807297, -0.05967157334089279, -0.05805020406842232, -0.05642884224653244, -0.054807476699352264, -0.05318610742688179, -0.051564741879701614, -0.04994337260723114, -0.048322007060050964, -0.04670064151287079, -0.045079272240400314, -0.04345790296792984, -0.041836537420749664, -0.04021516814827919, -0.038593802601099014, -0.03697243332862854, -0.035351067781448364, -0.03372970223426819, -0.032108332961797714, -0.03048696555197239, -0.028865598142147064, -0.02724423073232174, -0.025622863322496414, -0.02400149777531624, -0.022380130365490913, -0.02075876295566559, -0.019137397408485413, -0.01751602813601494, -0.015894660726189613, -0.014273294247686863, -0.012651926837861538, -0.011030560359358788, -0.009409192949533463, -0.0077878255397081375, -0.006166459061205387, -0.004545092582702637, -0.002923725638538599, -0.0013023584615439177, 0.0003190087154507637, 0.0019403756596148014, 0.003561742603778839, 0.005183110013604164, 0.0068044764921069145, 0.00842584390193224, 0.010047211311757565, 0.011668577790260315, 0.01328994520008564, 0.014911312609910965, 0.01653267815709114, 0.018154047429561615, 0.01977541297674179, 0.021396780386567116]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 6.0, 9.0, 13.0, 17.0, 15.0, 20.0, 21.0, 27.0, 23.0, 24.0, 21.0, 34.0, 30.0, 40.0, 35.0, 34.0, 42.0, 36.0, 35.0, 40.0, 30.0, 44.0, 32.0, 34.0, 35.0, 37.0, 21.0, 21.0, 20.0, 32.0, 21.0, 24.0, 14.0, 16.0, 16.0, 10.0, 9.0, 6.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-0.013236522674560547, -0.01282115001231432, -0.012405777350068092, -0.011990404687821865, -0.011575032025575638, -0.01115965936332941, -0.010744286701083183, -0.010328914038836956, -0.009913541376590729, -0.009498168714344501, -0.009082796052098274, -0.008667423389852047, -0.00825205072760582, -0.007836678065359592, -0.007421305403113365, -0.007005932740867138, -0.006590560078620911, -0.006175187416374683, -0.005759814754128456, -0.005344442091882229, -0.004929069429636002, -0.004513696767389774, -0.004098324105143547, -0.00368295144289732, -0.0032675787806510925, -0.0028522061184048653, -0.002436833456158638, -0.0020214607939124107, -0.0016060881316661835, -0.0011907154694199562, -0.0007753428071737289, -0.0003599701449275017, 5.5402517318725586e-05, 0.00047077517956495285, 0.0008861478418111801, 0.0013015205040574074, 0.0017168931663036346, 0.002132265828549862, 0.002547638490796089, 0.0029630111530423164, 0.0033783838152885437, 0.003793756477534771, 0.004209129139780998, 0.0046245018020272255, 0.005039874464273453, 0.00545524712651968, 0.005870619788765907, 0.0062859924510121346, 0.006701365113258362, 0.007116737775504589, 0.007532110437750816, 0.007947483099997044, 0.008362855762243271, 0.008778228424489498, 0.009193601086735725, 0.009608973748981953, 0.01002434641122818, 0.010439719073474407, 0.010855091735720634, 0.011270464397966862, 0.011685837060213089, 0.012101209722459316, 0.012516582384705544, 0.01293195504695177, 0.013347327709197998]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 15.0, 11.0, 17.0, 21.0, 55.0, 67.0, 109.0, 155.0, 276.0, 377.0, 603.0, 1207.0, 3739.0, 45668.0, 924372.0, 64456.0, 4296.0, 1326.0, 658.0, 432.0, 217.0, 170.0, 83.0, 53.0, 40.0, 43.0, 15.0, 12.0, 11.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257720947265625, -0.024899721145629883, -0.024027347564697266, -0.02315497398376465, -0.02228260040283203, -0.021410226821899414, -0.020537853240966797, -0.01966547966003418, -0.018793106079101562, -0.017920732498168945, -0.017048358917236328, -0.01617598533630371, -0.015303611755371094, -0.014431238174438477, -0.01355886459350586, -0.012686491012573242, -0.011814117431640625, -0.010941743850708008, -0.01006937026977539, -0.009196996688842773, -0.008324623107910156, -0.007452249526977539, -0.006579875946044922, -0.005707502365112305, -0.0048351287841796875, -0.00396275520324707, -0.003090381622314453, -0.002218008041381836, -0.0013456344604492188, -0.00047326087951660156, 0.0003991127014160156, 0.0012714862823486328, 0.00214385986328125, 0.003016233444213867, 0.0038886070251464844, 0.0047609806060791016, 0.005633354187011719, 0.006505727767944336, 0.007378101348876953, 0.00825047492980957, 0.009122848510742188, 0.009995222091674805, 0.010867595672607422, 0.011739969253540039, 0.012612342834472656, 0.013484716415405273, 0.01435708999633789, 0.015229463577270508, 0.016101837158203125, 0.016974210739135742, 0.01784658432006836, 0.018718957901000977, 0.019591331481933594, 0.02046370506286621, 0.021336078643798828, 0.022208452224731445, 0.023080825805664062, 0.02395319938659668, 0.024825572967529297, 0.025697946548461914, 0.02657032012939453, 0.02744269371032715, 0.028315067291259766, 0.029187440872192383, 0.030059814453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 18.0, 76.0, 134.0, 236.0, 220.0, 174.0, 98.0, 24.0, 16.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01904296875, -0.018390178680419922, -0.017737388610839844, -0.017084598541259766, -0.016431808471679688, -0.01577901840209961, -0.015126228332519531, -0.014473438262939453, -0.013820648193359375, -0.013167858123779297, -0.012515068054199219, -0.01186227798461914, -0.011209487915039062, -0.010556697845458984, -0.009903907775878906, -0.009251117706298828, -0.00859832763671875, -0.007945537567138672, -0.007292747497558594, -0.006639957427978516, -0.0059871673583984375, -0.005334377288818359, -0.004681587219238281, -0.004028797149658203, -0.003376007080078125, -0.002723217010498047, -0.0020704269409179688, -0.0014176368713378906, -0.0007648468017578125, -0.00011205673217773438, 0.0005407333374023438, 0.0011935234069824219, 0.0018463134765625, 0.002499103546142578, 0.0031518936157226562, 0.0038046836853027344, 0.0044574737548828125, 0.005110263824462891, 0.005763053894042969, 0.006415843963623047, 0.007068634033203125, 0.007721424102783203, 0.008374214172363281, 0.00902700424194336, 0.009679794311523438, 0.010332584381103516, 0.010985374450683594, 0.011638164520263672, 0.01229095458984375, 0.012943744659423828, 0.013596534729003906, 0.014249324798583984, 0.014902114868164062, 0.01555490493774414, 0.01620769500732422, 0.016860485076904297, 0.017513275146484375, 0.018166065216064453, 0.01881885528564453, 0.01947164535522461, 0.020124435424804688, 0.020777225494384766, 0.021430015563964844, 0.022082805633544922, 0.022735595703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 15.0, 20.0, 31.0, 38.0, 52.0, 85.0, 109.0, 188.0, 318.0, 529.0, 1278.0, 3397.0, 13561.0, 116275.0, 718530.0, 169468.0, 17559.0, 4084.0, 1461.0, 631.0, 321.0, 185.0, 109.0, 82.0, 56.0, 45.0, 31.0, 20.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010773420333862305, -0.01031637191772461, -0.009859323501586914, -0.009402275085449219, -0.008945226669311523, -0.008488178253173828, -0.008031129837036133, -0.0075740814208984375, -0.007117033004760742, -0.006659984588623047, -0.0062029361724853516, -0.005745887756347656, -0.005288839340209961, -0.004831790924072266, -0.00437474250793457, -0.003917694091796875, -0.0034606456756591797, -0.0030035972595214844, -0.002546548843383789, -0.0020895004272460938, -0.0016324520111083984, -0.0011754035949707031, -0.0007183551788330078, -0.0002613067626953125, 0.0001957416534423828, 0.0006527900695800781, 0.0011098384857177734, 0.0015668869018554688, 0.002023935317993164, 0.0024809837341308594, 0.0029380321502685547, 0.00339508056640625, 0.0038521289825439453, 0.004309177398681641, 0.004766225814819336, 0.005223274230957031, 0.0056803226470947266, 0.006137371063232422, 0.006594419479370117, 0.0070514678955078125, 0.007508516311645508, 0.007965564727783203, 0.008422613143920898, 0.008879661560058594, 0.009336709976196289, 0.009793758392333984, 0.01025080680847168, 0.010707855224609375, 0.01116490364074707, 0.011621952056884766, 0.012079000473022461, 0.012536048889160156, 0.012993097305297852, 0.013450145721435547, 0.013907194137573242, 0.014364242553710938, 0.014821290969848633, 0.015278339385986328, 0.015735387802124023, 0.01619243621826172, 0.016649484634399414, 0.01710653305053711, 0.017563581466674805, 0.0180206298828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 7.0, 8.0, 19.0, 21.0, 28.0, 37.0, 29.0, 45.0, 36.0, 50.0, 55.0, 74.0, 61.0, 48.0, 62.0, 66.0, 54.0, 39.0, 47.0, 49.0, 39.0, 34.0, 18.0, 28.0, 10.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01873779296875, -0.018262267112731934, -0.017786741256713867, -0.0173112154006958, -0.016835689544677734, -0.016360163688659668, -0.0158846378326416, -0.015409111976623535, -0.014933586120605469, -0.014458060264587402, -0.013982534408569336, -0.01350700855255127, -0.013031482696533203, -0.012555956840515137, -0.01208043098449707, -0.011604905128479004, -0.011129379272460938, -0.010653853416442871, -0.010178327560424805, -0.009702801704406738, -0.009227275848388672, -0.008751749992370605, -0.008276224136352539, -0.007800698280334473, -0.007325172424316406, -0.00684964656829834, -0.0063741207122802734, -0.005898594856262207, -0.005423069000244141, -0.004947543144226074, -0.004472017288208008, -0.003996491432189941, -0.003520965576171875, -0.0030454397201538086, -0.002569913864135742, -0.0020943880081176758, -0.0016188621520996094, -0.001143336296081543, -0.0006678104400634766, -0.00019228458404541016, 0.00028324127197265625, 0.0007587671279907227, 0.001234292984008789, 0.0017098188400268555, 0.002185344696044922, 0.0026608705520629883, 0.0031363964080810547, 0.003611922264099121, 0.0040874481201171875, 0.004562973976135254, 0.00503849983215332, 0.005514025688171387, 0.005989551544189453, 0.0064650774002075195, 0.006940603256225586, 0.007416129112243652, 0.007891654968261719, 0.008367180824279785, 0.008842706680297852, 0.009318232536315918, 0.009793758392333984, 0.01026928424835205, 0.010744810104370117, 0.011220335960388184, 0.01169586181640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 13.0, 22.0, 18.0, 29.0, 44.0, 59.0, 99.0, 111.0, 233.0, 344.0, 510.0, 861.0, 1483.0, 2530.0, 4647.0, 8596.0, 17737.0, 38730.0, 93972.0, 238820.0, 342374.0, 172664.0, 66896.0, 28355.0, 13397.0, 6956.0, 3730.0, 2042.0, 1268.0, 734.0, 431.0, 295.0, 171.0, 121.0, 69.0, 51.0, 33.0, 29.0, 26.0, 16.0, 8.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0016489028930664062, -0.0015885382890701294, -0.0015281736850738525, -0.0014678090810775757, -0.0014074444770812988, -0.001347079873085022, -0.0012867152690887451, -0.0012263506650924683, -0.0011659860610961914, -0.0011056214570999146, -0.0010452568531036377, -0.0009848922491073608, -0.000924527645111084, -0.0008641630411148071, -0.0008037984371185303, -0.0007434338331222534, -0.0006830692291259766, -0.0006227046251296997, -0.0005623400211334229, -0.000501975417137146, -0.00044161081314086914, -0.0003812462091445923, -0.00032088160514831543, -0.0002605170011520386, -0.00020015239715576172, -0.00013978779315948486, -7.942318916320801e-05, -1.9058585166931152e-05, 4.13060188293457e-05, 0.00010167062282562256, 0.00016203522682189941, 0.00022239983081817627, 0.0002827644348144531, 0.00034312903881073, 0.00040349364280700684, 0.0004638582468032837, 0.0005242228507995605, 0.0005845874547958374, 0.0006449520587921143, 0.0007053166627883911, 0.000765681266784668, 0.0008260458707809448, 0.0008864104747772217, 0.0009467750787734985, 0.0010071396827697754, 0.0010675042867660522, 0.001127868890762329, 0.001188233494758606, 0.0012485980987548828, 0.0013089627027511597, 0.0013693273067474365, 0.0014296919107437134, 0.0014900565147399902, 0.001550421118736267, 0.001610785722732544, 0.0016711503267288208, 0.0017315149307250977, 0.0017918795347213745, 0.0018522441387176514, 0.0019126087427139282, 0.001972973346710205, 0.002033337950706482, 0.002093702554702759, 0.0021540671586990356, 0.0022144317626953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 3.0, 6.0, 8.0, 4.0, 11.0, 10.0, 15.0, 30.0, 43.0, 60.0, 102.0, 117.0, 139.0, 141.0, 110.0, 46.0, 52.0, 32.0, 25.0, 16.0, 9.0, 4.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001500844955444336, -0.00014518573880195618, -0.00014028698205947876, -0.00013538822531700134, -0.00013048946857452393, -0.0001255907118320465, -0.00012069195508956909, -0.00011579319834709167, -0.00011089444160461426, -0.00010599568486213684, -0.00010109692811965942, -9.619817137718201e-05, -9.129941463470459e-05, -8.640065789222717e-05, -8.150190114974976e-05, -7.660314440727234e-05, -7.170438766479492e-05, -6.68056309223175e-05, -6.190687417984009e-05, -5.700811743736267e-05, -5.2109360694885254e-05, -4.721060395240784e-05, -4.231184720993042e-05, -3.7413090467453e-05, -3.2514333724975586e-05, -2.761557698249817e-05, -2.2716820240020752e-05, -1.7818063497543335e-05, -1.2919306755065918e-05, -8.020550012588501e-06, -3.121793270111084e-06, 1.776963472366333e-06, 6.67572021484375e-06, 1.1574476957321167e-05, 1.6473233699798584e-05, 2.1371990442276e-05, 2.6270747184753418e-05, 3.1169503927230835e-05, 3.606826066970825e-05, 4.096701741218567e-05, 4.5865774154663086e-05, 5.07645308971405e-05, 5.566328763961792e-05, 6.056204438209534e-05, 6.546080112457275e-05, 7.035955786705017e-05, 7.525831460952759e-05, 8.0157071352005e-05, 8.505582809448242e-05, 8.995458483695984e-05, 9.485334157943726e-05, 9.975209832191467e-05, 0.00010465085506439209, 0.00010954961180686951, 0.00011444836854934692, 0.00011934712529182434, 0.00012424588203430176, 0.00012914463877677917, 0.0001340433955192566, 0.000138942152261734, 0.00014384090900421143, 0.00014873966574668884, 0.00015363842248916626, 0.00015853717923164368, 0.0001634359359741211]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 11.0, 17.0, 18.0, 44.0, 58.0, 117.0, 226.0, 537.0, 1652.0, 7849.0, 61094.0, 699339.0, 250288.0, 21942.0, 3668.0, 925.0, 381.0, 159.0, 68.0, 58.0, 43.0, 18.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0058441162109375, -0.005647778511047363, -0.0054514408111572266, -0.00525510311126709, -0.005058765411376953, -0.004862427711486816, -0.00466609001159668, -0.004469752311706543, -0.004273414611816406, -0.0040770769119262695, -0.003880739212036133, -0.003684401512145996, -0.0034880638122558594, -0.0032917261123657227, -0.003095388412475586, -0.0028990507125854492, -0.0027027130126953125, -0.0025063753128051758, -0.002310037612915039, -0.0021136999130249023, -0.0019173622131347656, -0.001721024513244629, -0.0015246868133544922, -0.0013283491134643555, -0.0011320114135742188, -0.000935673713684082, -0.0007393360137939453, -0.0005429983139038086, -0.0003466606140136719, -0.00015032291412353516, 4.601478576660156e-05, 0.00024235248565673828, 0.000438690185546875, 0.0006350278854370117, 0.0008313655853271484, 0.0010277032852172852, 0.0012240409851074219, 0.0014203786849975586, 0.0016167163848876953, 0.001813054084777832, 0.0020093917846679688, 0.0022057294845581055, 0.002402067184448242, 0.002598404884338379, 0.0027947425842285156, 0.0029910802841186523, 0.003187417984008789, 0.0033837556838989258, 0.0035800933837890625, 0.0037764310836791992, 0.003972768783569336, 0.004169106483459473, 0.004365444183349609, 0.004561781883239746, 0.004758119583129883, 0.0049544572830200195, 0.005150794982910156, 0.005347132682800293, 0.00554347038269043, 0.005739808082580566, 0.005936145782470703, 0.00613248348236084, 0.0063288211822509766, 0.006525158882141113, 0.00672149658203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 11.0, 12.0, 29.0, 38.0, 40.0, 62.0, 97.0, 113.0, 147.0, 121.0, 91.0, 63.0, 40.0, 22.0, 18.0, 16.0, 15.0, 12.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00559234619140625, -0.00544700026512146, -0.00530165433883667, -0.00515630841255188, -0.00501096248626709, -0.0048656165599823, -0.00472027063369751, -0.00457492470741272, -0.00442957878112793, -0.00428423285484314, -0.00413888692855835, -0.00399354100227356, -0.0038481950759887695, -0.0037028491497039795, -0.0035575032234191895, -0.0034121572971343994, -0.0032668113708496094, -0.0031214654445648193, -0.0029761195182800293, -0.0028307735919952393, -0.0026854276657104492, -0.002540081739425659, -0.002394735813140869, -0.002249389886856079, -0.002104043960571289, -0.001958698034286499, -0.001813352108001709, -0.001668006181716919, -0.001522660255432129, -0.0013773143291473389, -0.0012319684028625488, -0.0010866224765777588, -0.0009412765502929688, -0.0007959306240081787, -0.0006505846977233887, -0.0005052387714385986, -0.0003598928451538086, -0.00021454691886901855, -6.920099258422852e-05, 7.614493370056152e-05, 0.00022149085998535156, 0.0003668367862701416, 0.0005121827125549316, 0.0006575286388397217, 0.0008028745651245117, 0.0009482204914093018, 0.0010935664176940918, 0.0012389123439788818, 0.0013842582702636719, 0.001529604196548462, 0.001674950122833252, 0.001820296049118042, 0.001965641975402832, 0.002110987901687622, 0.002256333827972412, 0.002401679754257202, 0.002547025680541992, 0.0026923716068267822, 0.0028377175331115723, 0.0029830634593963623, 0.0031284093856811523, 0.0032737553119659424, 0.0034191012382507324, 0.0035644471645355225, 0.0037097930908203125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 12.0, 607.0, 384.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05807831138372421, -0.046206049621105194, -0.034333787858486176, -0.022461526095867157, -0.010589264333248138, 0.0012829974293708801, 0.013155259191989899, 0.025027520954608917, 0.036899782717227936, 0.048772044479846954, 0.06064430624246597, 0.07251656800508499, 0.08438882976770401, 0.09626109153032303, 0.10813335329294205, 0.12000561505556107, 0.1318778693675995, 0.1437501311302185, 0.15562239289283752, 0.16749465465545654, 0.17936691641807556, 0.19123917818069458, 0.2031114399433136, 0.21498370170593262, 0.22685596346855164, 0.23872822523117065, 0.2506004869937897, 0.2624727487564087, 0.2743450105190277, 0.28621727228164673, 0.29808953404426575, 0.30996179580688477, 0.32183408737182617, 0.3337063491344452, 0.3455786108970642, 0.3574508726596832, 0.36932313442230225, 0.38119539618492126, 0.3930676579475403, 0.4049399197101593, 0.4168121814727783, 0.42868444323539734, 0.44055670499801636, 0.4524289667606354, 0.4643012285232544, 0.4761734902858734, 0.48804575204849243, 0.49991801381111145, 0.5117902755737305, 0.5236625671386719, 0.5355347990989685, 0.5474070310592651, 0.5592793226242065, 0.571151614189148, 0.5830238461494446, 0.5948960781097412, 0.6067683696746826, 0.618640661239624, 0.6305128931999207, 0.6423851251602173, 0.6542574167251587, 0.6661297082901001, 0.6780019402503967, 0.6898741722106934, 0.7017464637756348]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 16.0, 16.0, 19.0, 17.0, 36.0, 35.0, 42.0, 43.0, 43.0, 56.0, 49.0, 66.0, 71.0, 61.0, 66.0, 65.0, 42.0, 40.0, 41.0, 30.0, 25.0, 26.0, 23.0, 22.0, 12.0, 7.0, 7.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.05944877862930298, -0.05809399485588074, -0.0567392073571682, -0.05538441985845566, -0.05402963608503342, -0.052674852311611176, -0.051320064812898636, -0.049965277314186096, -0.048610493540763855, -0.047255709767341614, -0.045900922268629074, -0.044546134769916534, -0.04319135099649429, -0.04183656722307205, -0.04048177972435951, -0.03912699222564697, -0.03777220845222473, -0.03641742467880249, -0.03506263718008995, -0.03370784968137741, -0.03235306590795517, -0.03099828027188778, -0.02964349463582039, -0.028288708999753, -0.026933923363685608, -0.025579137727618217, -0.024224352091550827, -0.022869566455483437, -0.021514780819416046, -0.020159995183348656, -0.018805209547281265, -0.017450423911213875, -0.016095638275146484, -0.014740852639079094, -0.013386067003011703, -0.012031281366944313, -0.010676495730876923, -0.009321710094809532, -0.007966924458742142, -0.006612138822674751, -0.005257353186607361, -0.0039025675505399704, -0.00254778191447258, -0.0011929962784051895, 0.00016178935766220093, 0.0015165749937295914, 0.002871360629796982, 0.004226146265864372, 0.005580931901931763, 0.006935717537999153, 0.008290503174066544, 0.009645288810133934, 0.011000074446201324, 0.012354860082268715, 0.013709645718336105, 0.015064431354403496, 0.016419216990470886, 0.017774002626538277, 0.019128788262605667, 0.020483573898673058, 0.021838359534740448, 0.02319314517080784, 0.02454793080687523, 0.02590271644294262, 0.02725750207901001]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 6.0, 4.0, 7.0, 17.0, 12.0, 32.0, 39.0, 45.0, 77.0, 99.0, 134.0, 263.0, 594.0, 1441.0, 2700.0, 9671.0, 270738.0, 3872777.0, 27790.0, 4953.0, 1515.0, 601.0, 278.0, 148.0, 97.0, 61.0, 41.0, 30.0, 24.0, 17.0, 14.0, 8.0, 11.0, 2.0, 3.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021636962890625, -0.020870208740234375, -0.02010345458984375, -0.019336700439453125, -0.0185699462890625, -0.017803192138671875, -0.01703643798828125, -0.016269683837890625, -0.0155029296875, -0.014736175537109375, -0.01396942138671875, -0.013202667236328125, -0.0124359130859375, -0.011669158935546875, -0.01090240478515625, -0.010135650634765625, -0.009368896484375, -0.008602142333984375, -0.00783538818359375, -0.007068634033203125, -0.0063018798828125, -0.005535125732421875, -0.00476837158203125, -0.004001617431640625, -0.00323486328125, -0.002468109130859375, -0.00170135498046875, -0.000934600830078125, -0.0001678466796875, 0.000598907470703125, 0.00136566162109375, 0.002132415771484375, 0.002899169921875, 0.003665924072265625, 0.00443267822265625, 0.005199432373046875, 0.0059661865234375, 0.006732940673828125, 0.00749969482421875, 0.008266448974609375, 0.009033203125, 0.009799957275390625, 0.01056671142578125, 0.011333465576171875, 0.0121002197265625, 0.012866973876953125, 0.01363372802734375, 0.014400482177734375, 0.015167236328125, 0.015933990478515625, 0.01670074462890625, 0.017467498779296875, 0.0182342529296875, 0.019001007080078125, 0.01976776123046875, 0.020534515380859375, 0.02130126953125, 0.022068023681640625, 0.02283477783203125, 0.023601531982421875, 0.0243682861328125, 0.025135040283203125, 0.02590179443359375, 0.026668548583984375, 0.027435302734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 25.0, 90.0, 171.0, 228.0, 220.0, 163.0, 67.0, 19.0, 11.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0196990966796875, -0.019040584564208984, -0.01838207244873047, -0.017723560333251953, -0.017065048217773438, -0.016406536102294922, -0.015748023986816406, -0.01508951187133789, -0.014430999755859375, -0.01377248764038086, -0.013113975524902344, -0.012455463409423828, -0.011796951293945312, -0.011138439178466797, -0.010479927062988281, -0.009821414947509766, -0.00916290283203125, -0.008504390716552734, -0.007845878601074219, -0.007187366485595703, -0.0065288543701171875, -0.005870342254638672, -0.005211830139160156, -0.004553318023681641, -0.003894805908203125, -0.0032362937927246094, -0.0025777816772460938, -0.0019192695617675781, -0.0012607574462890625, -0.0006022453308105469, 5.626678466796875e-05, 0.0007147789001464844, 0.001373291015625, 0.0020318031311035156, 0.0026903152465820312, 0.003348827362060547, 0.0040073394775390625, 0.004665851593017578, 0.005324363708496094, 0.005982875823974609, 0.006641387939453125, 0.007299900054931641, 0.007958412170410156, 0.008616924285888672, 0.009275436401367188, 0.009933948516845703, 0.010592460632324219, 0.011250972747802734, 0.01190948486328125, 0.012567996978759766, 0.013226509094238281, 0.013885021209716797, 0.014543533325195312, 0.015202045440673828, 0.015860557556152344, 0.01651906967163086, 0.017177581787109375, 0.01783609390258789, 0.018494606018066406, 0.019153118133544922, 0.019811630249023438, 0.020470142364501953, 0.02112865447998047, 0.021787166595458984, 0.0224456787109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 3.0, 6.0, 5.0, 7.0, 14.0, 15.0, 17.0, 10.0, 30.0, 40.0, 50.0, 68.0, 109.0, 146.0, 258.0, 449.0, 823.0, 1716.0, 3777.0, 11465.0, 54002.0, 968960.0, 3046578.0, 81199.0, 15533.0, 4837.0, 1902.0, 974.0, 511.0, 271.0, 155.0, 96.0, 71.0, 48.0, 32.0, 29.0, 22.0, 11.0, 14.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0106658935546875, -0.010333657264709473, -0.010001420974731445, -0.009669184684753418, -0.00933694839477539, -0.009004712104797363, -0.008672475814819336, -0.008340239524841309, -0.008008003234863281, -0.007675766944885254, -0.0073435306549072266, -0.007011294364929199, -0.006679058074951172, -0.0063468217849731445, -0.006014585494995117, -0.00568234920501709, -0.0053501129150390625, -0.005017876625061035, -0.004685640335083008, -0.0043534040451049805, -0.004021167755126953, -0.0036889314651489258, -0.0033566951751708984, -0.003024458885192871, -0.0026922225952148438, -0.0023599863052368164, -0.002027750015258789, -0.0016955137252807617, -0.0013632774353027344, -0.001031041145324707, -0.0006988048553466797, -0.00036656856536865234, -3.4332275390625e-05, 0.00029790401458740234, 0.0006301403045654297, 0.000962376594543457, 0.0012946128845214844, 0.0016268491744995117, 0.001959085464477539, 0.0022913217544555664, 0.0026235580444335938, 0.002955794334411621, 0.0032880306243896484, 0.0036202669143676758, 0.003952503204345703, 0.0042847394943237305, 0.004616975784301758, 0.004949212074279785, 0.0052814483642578125, 0.00561368465423584, 0.005945920944213867, 0.0062781572341918945, 0.006610393524169922, 0.006942629814147949, 0.0072748661041259766, 0.007607102394104004, 0.007939338684082031, 0.008271574974060059, 0.008603811264038086, 0.008936047554016113, 0.00926828384399414, 0.009600520133972168, 0.009932756423950195, 0.010264992713928223, 0.01059722900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 30.0, 75.0, 109.0, 505.0, 2020.0, 876.0, 202.0, 95.0, 45.0, 20.0, 28.0, 14.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.01666438579559326, -0.016254186630249023, -0.015843987464904785, -0.015433788299560547, -0.015023589134216309, -0.01461338996887207, -0.014203190803527832, -0.013792991638183594, -0.013382792472839355, -0.012972593307495117, -0.012562394142150879, -0.01215219497680664, -0.011741995811462402, -0.011331796646118164, -0.010921597480773926, -0.010511398315429688, -0.01010119915008545, -0.009690999984741211, -0.009280800819396973, -0.008870601654052734, -0.008460402488708496, -0.008050203323364258, -0.0076400041580200195, -0.007229804992675781, -0.006819605827331543, -0.006409406661987305, -0.005999207496643066, -0.005589008331298828, -0.00517880916595459, -0.0047686100006103516, -0.004358410835266113, -0.003948211669921875, -0.0035380125045776367, -0.0031278133392333984, -0.00271761417388916, -0.002307415008544922, -0.0018972158432006836, -0.0014870166778564453, -0.001076817512512207, -0.0006666183471679688, -0.00025641918182373047, 0.0001537799835205078, 0.0005639791488647461, 0.0009741783142089844, 0.0013843774795532227, 0.001794576644897461, 0.0022047758102416992, 0.0026149749755859375, 0.0030251741409301758, 0.003435373306274414, 0.0038455724716186523, 0.004255771636962891, 0.004665970802307129, 0.005076169967651367, 0.0054863691329956055, 0.005896568298339844, 0.006306767463684082, 0.00671696662902832, 0.007127165794372559, 0.007537364959716797, 0.007947564125061035, 0.008357763290405273, 0.008767962455749512, 0.00917816162109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 27.0, 47.0, 161.0, 362.0, 261.0, 96.0, 27.0, 13.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1007395014166832, -0.0984795019030571, -0.0962194949388504, -0.0939594954252243, -0.0916994959115982, -0.0894394963979721, -0.08717949688434601, -0.08491948992013931, -0.08265949040651321, -0.08039949089288712, -0.07813948392868042, -0.07587948441505432, -0.07361948490142822, -0.07135948538780212, -0.06909948587417603, -0.06683947890996933, -0.06457947939634323, -0.06231947988271713, -0.060059476643800735, -0.05779947340488434, -0.05553947389125824, -0.05327947437763214, -0.051019471138715744, -0.04875946789979935, -0.04649946838617325, -0.04423946887254715, -0.04197946563363075, -0.039719462394714355, -0.03745946288108826, -0.03519946336746216, -0.03293946012854576, -0.030679458752274513, -0.028419457376003265, -0.026159455999732018, -0.02389945462346077, -0.021639453247189522, -0.019379451870918274, -0.017119450494647026, -0.014859449118375778, -0.01259944774210453, -0.010339446365833282, -0.008079444989562035, -0.005819443613290787, -0.003559442237019539, -0.001299440860748291, 0.0009605605155229568, 0.0032205618917942047, 0.005480563268065453, 0.0077405646443367004, 0.010000566020607948, 0.012260567396879196, 0.014520568773150444, 0.016780570149421692, 0.01904057152569294, 0.021300572901964188, 0.023560574278235435, 0.025820575654506683, 0.02808057703077793, 0.03034057840704918, 0.032600581645965576, 0.034860581159591675, 0.03712058067321777, 0.03938058391213417, 0.04164058715105057, 0.043900586664676666]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 17.0, 16.0, 19.0, 24.0, 21.0, 29.0, 39.0, 33.0, 39.0, 30.0, 41.0, 34.0, 39.0, 42.0, 39.0, 61.0, 46.0, 34.0, 40.0, 44.0, 33.0, 36.0, 40.0, 36.0, 22.0, 26.0, 15.0, 22.0, 9.0, 10.0, 8.0, 3.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.020525634288787842, -0.019929347559809685, -0.019333060830831528, -0.01873677410185337, -0.018140487372875214, -0.017544200643897057, -0.0169479139149189, -0.016351627185940742, -0.015755340456962585, -0.015159053727984428, -0.014562766999006271, -0.013966480270028114, -0.013370193541049957, -0.0127739068120718, -0.012177620083093643, -0.011581333354115486, -0.010985046625137329, -0.010388759896159172, -0.009792473167181015, -0.009196186438202858, -0.008599899709224701, -0.008003612980246544, -0.007407326251268387, -0.00681103952229023, -0.006214752793312073, -0.005618466064333916, -0.005022179335355759, -0.004425892606377602, -0.0038296058773994446, -0.0032333191484212875, -0.0026370324194431305, -0.0020407456904649734, -0.0014444589614868164, -0.0008481722325086594, -0.0002518855035305023, 0.0003444012254476547, 0.0009406879544258118, 0.0015369746834039688, 0.002133261412382126, 0.002729548141360283, 0.00332583487033844, 0.003922121599316597, 0.004518408328294754, 0.005114695057272911, 0.005710981786251068, 0.006307268515229225, 0.006903555244207382, 0.007499841973185539, 0.008096128702163696, 0.008692415431141853, 0.00928870216012001, 0.009884988889098167, 0.010481275618076324, 0.011077562347054482, 0.011673849076032639, 0.012270135805010796, 0.012866422533988953, 0.01346270926296711, 0.014058995991945267, 0.014655282720923424, 0.01525156944990158, 0.015847856178879738, 0.016444142907857895, 0.017040429636836052, 0.01763671636581421]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 10.0, 13.0, 19.0, 24.0, 39.0, 76.0, 118.0, 191.0, 349.0, 609.0, 1354.0, 4803.0, 87034.0, 929523.0, 19418.0, 2770.0, 990.0, 493.0, 277.0, 155.0, 86.0, 68.0, 33.0, 21.0, 13.0, 8.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041412353515625, -0.04004621505737305, -0.038680076599121094, -0.03731393814086914, -0.03594779968261719, -0.034581661224365234, -0.03321552276611328, -0.03184938430786133, -0.030483245849609375, -0.029117107391357422, -0.02775096893310547, -0.026384830474853516, -0.025018692016601562, -0.02365255355834961, -0.022286415100097656, -0.020920276641845703, -0.01955413818359375, -0.018187999725341797, -0.016821861267089844, -0.01545572280883789, -0.014089584350585938, -0.012723445892333984, -0.011357307434082031, -0.009991168975830078, -0.008625030517578125, -0.007258892059326172, -0.005892753601074219, -0.004526615142822266, -0.0031604766845703125, -0.0017943382263183594, -0.00042819976806640625, 0.0009379386901855469, 0.0023040771484375, 0.003670215606689453, 0.005036354064941406, 0.006402492523193359, 0.0077686309814453125, 0.009134769439697266, 0.010500907897949219, 0.011867046356201172, 0.013233184814453125, 0.014599323272705078, 0.01596546173095703, 0.017331600189208984, 0.018697738647460938, 0.02006387710571289, 0.021430015563964844, 0.022796154022216797, 0.02416229248046875, 0.025528430938720703, 0.026894569396972656, 0.02826070785522461, 0.029626846313476562, 0.030992984771728516, 0.03235912322998047, 0.03372526168823242, 0.035091400146484375, 0.03645753860473633, 0.03782367706298828, 0.039189815521240234, 0.04055595397949219, 0.04192209243774414, 0.043288230895996094, 0.04465436935424805, 0.0460205078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 43.0, 113.0, 194.0, 244.0, 208.0, 120.0, 47.0, 12.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02069091796875, -0.020014047622680664, -0.019337177276611328, -0.018660306930541992, -0.017983436584472656, -0.01730656623840332, -0.016629695892333984, -0.01595282554626465, -0.015275955200195312, -0.014599084854125977, -0.01392221450805664, -0.013245344161987305, -0.012568473815917969, -0.011891603469848633, -0.011214733123779297, -0.010537862777709961, -0.009860992431640625, -0.009184122085571289, -0.008507251739501953, -0.007830381393432617, -0.007153511047363281, -0.006476640701293945, -0.005799770355224609, -0.0051229000091552734, -0.0044460296630859375, -0.0037691593170166016, -0.0030922889709472656, -0.0024154186248779297, -0.0017385482788085938, -0.0010616779327392578, -0.0003848075866699219, 0.00029206275939941406, 0.00096893310546875, 0.001645803451538086, 0.002322673797607422, 0.002999544143676758, 0.0036764144897460938, 0.00435328483581543, 0.005030155181884766, 0.0057070255279541016, 0.0063838958740234375, 0.0070607662200927734, 0.007737636566162109, 0.008414506912231445, 0.009091377258300781, 0.009768247604370117, 0.010445117950439453, 0.011121988296508789, 0.011798858642578125, 0.012475728988647461, 0.013152599334716797, 0.013829469680786133, 0.014506340026855469, 0.015183210372924805, 0.01586008071899414, 0.016536951065063477, 0.017213821411132812, 0.01789069175720215, 0.018567562103271484, 0.01924443244934082, 0.019921302795410156, 0.020598173141479492, 0.021275043487548828, 0.021951913833618164, 0.0226287841796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 7.0, 13.0, 19.0, 21.0, 30.0, 50.0, 70.0, 106.0, 178.0, 335.0, 598.0, 1024.0, 2061.0, 5040.0, 17227.0, 98270.0, 585951.0, 283135.0, 38990.0, 8979.0, 3093.0, 1444.0, 769.0, 448.0, 247.0, 167.0, 94.0, 68.0, 37.0, 18.0, 12.0, 12.0, 10.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01526641845703125, -0.014800310134887695, -0.01433420181274414, -0.013868093490600586, -0.013401985168457031, -0.012935876846313477, -0.012469768524169922, -0.012003660202026367, -0.011537551879882812, -0.011071443557739258, -0.010605335235595703, -0.010139226913452148, -0.009673118591308594, -0.009207010269165039, -0.008740901947021484, -0.00827479362487793, -0.007808685302734375, -0.00734257698059082, -0.006876468658447266, -0.006410360336303711, -0.005944252014160156, -0.0054781436920166016, -0.005012035369873047, -0.004545927047729492, -0.0040798187255859375, -0.003613710403442383, -0.003147602081298828, -0.0026814937591552734, -0.0022153854370117188, -0.001749277114868164, -0.0012831687927246094, -0.0008170604705810547, -0.0003509521484375, 0.00011515617370605469, 0.0005812644958496094, 0.001047372817993164, 0.0015134811401367188, 0.0019795894622802734, 0.002445697784423828, 0.002911806106567383, 0.0033779144287109375, 0.003844022750854492, 0.004310131072998047, 0.0047762393951416016, 0.005242347717285156, 0.005708456039428711, 0.006174564361572266, 0.00664067268371582, 0.007106781005859375, 0.00757288932800293, 0.008038997650146484, 0.008505105972290039, 0.008971214294433594, 0.009437322616577148, 0.009903430938720703, 0.010369539260864258, 0.010835647583007812, 0.011301755905151367, 0.011767864227294922, 0.012233972549438477, 0.012700080871582031, 0.013166189193725586, 0.01363229751586914, 0.014098405838012695, 0.01456451416015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 6.0, 8.0, 5.0, 11.0, 11.0, 12.0, 18.0, 20.0, 33.0, 32.0, 32.0, 57.0, 43.0, 58.0, 69.0, 73.0, 60.0, 82.0, 51.0, 41.0, 48.0, 58.0, 34.0, 29.0, 19.0, 23.0, 16.0, 17.0, 10.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176239013671875, -0.017091989517211914, -0.016560077667236328, -0.016028165817260742, -0.015496253967285156, -0.01496434211730957, -0.014432430267333984, -0.013900518417358398, -0.013368606567382812, -0.012836694717407227, -0.01230478286743164, -0.011772871017456055, -0.011240959167480469, -0.010709047317504883, -0.010177135467529297, -0.009645223617553711, -0.009113311767578125, -0.008581399917602539, -0.008049488067626953, -0.007517576217651367, -0.006985664367675781, -0.006453752517700195, -0.005921840667724609, -0.0053899288177490234, -0.0048580169677734375, -0.0043261051177978516, -0.0037941932678222656, -0.0032622814178466797, -0.0027303695678710938, -0.002198457717895508, -0.0016665458679199219, -0.001134634017944336, -0.00060272216796875, -7.081031799316406e-05, 0.0004611015319824219, 0.0009930133819580078, 0.0015249252319335938, 0.0020568370819091797, 0.0025887489318847656, 0.0031206607818603516, 0.0036525726318359375, 0.0041844844818115234, 0.004716396331787109, 0.005248308181762695, 0.005780220031738281, 0.006312131881713867, 0.006844043731689453, 0.007375955581665039, 0.007907867431640625, 0.008439779281616211, 0.008971691131591797, 0.009503602981567383, 0.010035514831542969, 0.010567426681518555, 0.01109933853149414, 0.011631250381469727, 0.012163162231445312, 0.012695074081420898, 0.013226985931396484, 0.01375889778137207, 0.014290809631347656, 0.014822721481323242, 0.015354633331298828, 0.015886545181274414, 0.01641845703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 1.0, 7.0, 8.0, 12.0, 12.0, 20.0, 22.0, 36.0, 58.0, 87.0, 143.0, 181.0, 309.0, 408.0, 573.0, 865.0, 1374.0, 2114.0, 3449.0, 6337.0, 12124.0, 26700.0, 74310.0, 317933.0, 433749.0, 101564.0, 33314.0, 14416.0, 7304.0, 4108.0, 2429.0, 1481.0, 1012.0, 662.0, 431.0, 298.0, 213.0, 164.0, 102.0, 66.0, 58.0, 25.0, 25.0, 9.0, 10.0, 7.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.0029735565185546875, -0.002880990505218506, -0.0027884244918823242, -0.0026958584785461426, -0.002603292465209961, -0.0025107264518737793, -0.0024181604385375977, -0.002325594425201416, -0.0022330284118652344, -0.0021404623985290527, -0.002047896385192871, -0.0019553303718566895, -0.0018627643585205078, -0.0017701983451843262, -0.0016776323318481445, -0.0015850663185119629, -0.0014925003051757812, -0.0013999342918395996, -0.001307368278503418, -0.0012148022651672363, -0.0011222362518310547, -0.001029670238494873, -0.0009371042251586914, -0.0008445382118225098, -0.0007519721984863281, -0.0006594061851501465, -0.0005668401718139648, -0.0004742741584777832, -0.00038170814514160156, -0.0002891421318054199, -0.00019657611846923828, -0.00010401010513305664, -1.1444091796875e-05, 8.112192153930664e-05, 0.00017368793487548828, 0.0002662539482116699, 0.00035881996154785156, 0.0004513859748840332, 0.0005439519882202148, 0.0006365180015563965, 0.0007290840148925781, 0.0008216500282287598, 0.0009142160415649414, 0.001006782054901123, 0.0010993480682373047, 0.0011919140815734863, 0.001284480094909668, 0.0013770461082458496, 0.0014696121215820312, 0.0015621781349182129, 0.0016547441482543945, 0.0017473101615905762, 0.0018398761749267578, 0.0019324421882629395, 0.002025008201599121, 0.0021175742149353027, 0.0022101402282714844, 0.002302706241607666, 0.0023952722549438477, 0.0024878382682800293, 0.002580404281616211, 0.0026729702949523926, 0.0027655363082885742, 0.002858102321624756, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 7.0, 6.0, 11.0, 13.0, 22.0, 30.0, 26.0, 43.0, 80.0, 114.0, 124.0, 112.0, 119.0, 85.0, 45.0, 44.0, 17.0, 21.0, 20.0, 19.0, 3.0, 7.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.936094284057617e-05, -9.62642952799797e-05, -9.316764771938324e-05, -9.007100015878677e-05, -8.697435259819031e-05, -8.387770503759384e-05, -8.078105747699738e-05, -7.768440991640091e-05, -7.458776235580444e-05, -7.149111479520798e-05, -6.839446723461151e-05, -6.529781967401505e-05, -6.220117211341858e-05, -5.910452455282211e-05, -5.600787699222565e-05, -5.291122943162918e-05, -4.9814581871032715e-05, -4.671793431043625e-05, -4.362128674983978e-05, -4.052463918924332e-05, -3.742799162864685e-05, -3.4331344068050385e-05, -3.123469650745392e-05, -2.8138048946857452e-05, -2.5041401386260986e-05, -2.194475382566452e-05, -1.8848106265068054e-05, -1.5751458704471588e-05, -1.2654811143875122e-05, -9.558163583278656e-06, -6.46151602268219e-06, -3.364868462085724e-06, -2.682209014892578e-07, 2.8284266591072083e-06, 5.925074219703674e-06, 9.02172178030014e-06, 1.2118369340896606e-05, 1.5215016901493073e-05, 1.831166446208954e-05, 2.1408312022686005e-05, 2.450495958328247e-05, 2.7601607143878937e-05, 3.06982547044754e-05, 3.379490226507187e-05, 3.6891549825668335e-05, 3.99881973862648e-05, 4.308484494686127e-05, 4.618149250745773e-05, 4.92781400680542e-05, 5.2374787628650665e-05, 5.547143518924713e-05, 5.85680827498436e-05, 6.166473031044006e-05, 6.476137787103653e-05, 6.7858025431633e-05, 7.095467299222946e-05, 7.405132055282593e-05, 7.71479681134224e-05, 8.024461567401886e-05, 8.334126323461533e-05, 8.643791079521179e-05, 8.953455835580826e-05, 9.263120591640472e-05, 9.572785347700119e-05, 9.882450103759766e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 9.0, 13.0, 16.0, 21.0, 28.0, 37.0, 66.0, 124.0, 244.0, 455.0, 873.0, 1955.0, 4469.0, 12323.0, 40247.0, 221186.0, 626766.0, 101532.0, 24098.0, 8058.0, 3083.0, 1451.0, 700.0, 323.0, 206.0, 100.0, 61.0, 33.0, 16.0, 15.0, 12.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.005031585693359375, -0.00488048791885376, -0.0047293901443481445, -0.004578292369842529, -0.004427194595336914, -0.004276096820831299, -0.004124999046325684, -0.003973901271820068, -0.003822803497314453, -0.003671705722808838, -0.0035206079483032227, -0.0033695101737976074, -0.003218412399291992, -0.003067314624786377, -0.0029162168502807617, -0.0027651190757751465, -0.0026140213012695312, -0.002462923526763916, -0.0023118257522583008, -0.0021607279777526855, -0.0020096302032470703, -0.001858532428741455, -0.0017074346542358398, -0.0015563368797302246, -0.0014052391052246094, -0.0012541413307189941, -0.001103043556213379, -0.0009519457817077637, -0.0008008480072021484, -0.0006497502326965332, -0.000498652458190918, -0.00034755468368530273, -0.0001964569091796875, -4.5359134674072266e-05, 0.00010573863983154297, 0.0002568364143371582, 0.00040793418884277344, 0.0005590319633483887, 0.0007101297378540039, 0.0008612275123596191, 0.0010123252868652344, 0.0011634230613708496, 0.0013145208358764648, 0.00146561861038208, 0.0016167163848876953, 0.0017678141593933105, 0.0019189119338989258, 0.002070009708404541, 0.0022211074829101562, 0.0023722052574157715, 0.0025233030319213867, 0.002674400806427002, 0.002825498580932617, 0.0029765963554382324, 0.0031276941299438477, 0.003278791904449463, 0.003429889678955078, 0.0035809874534606934, 0.0037320852279663086, 0.003883183002471924, 0.004034280776977539, 0.004185378551483154, 0.0043364763259887695, 0.004487574100494385, 0.004638671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 9.0, 17.0, 21.0, 29.0, 37.0, 47.0, 70.0, 106.0, 136.0, 123.0, 103.0, 83.0, 63.0, 41.0, 26.0, 21.0, 15.0, 12.0, 4.0, 3.0, 9.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034809112548828125, -0.003347426652908325, -0.003213942050933838, -0.0030804574489593506, -0.0029469728469848633, -0.002813488245010376, -0.0026800036430358887, -0.0025465190410614014, -0.002413034439086914, -0.0022795498371124268, -0.0021460652351379395, -0.002012580633163452, -0.0018790960311889648, -0.0017456114292144775, -0.0016121268272399902, -0.001478642225265503, -0.0013451576232910156, -0.0012116730213165283, -0.001078188419342041, -0.0009447038173675537, -0.0008112192153930664, -0.0006777346134185791, -0.0005442500114440918, -0.0004107654094696045, -0.0002772808074951172, -0.00014379620552062988, -1.0311603546142578e-05, 0.00012317299842834473, 0.00025665760040283203, 0.00039014220237731934, 0.0005236268043518066, 0.0006571114063262939, 0.0007905960083007812, 0.0009240806102752686, 0.0010575652122497559, 0.0011910498142242432, 0.0013245344161987305, 0.0014580190181732178, 0.001591503620147705, 0.0017249882221221924, 0.0018584728240966797, 0.001991957426071167, 0.0021254420280456543, 0.0022589266300201416, 0.002392411231994629, 0.002525895833969116, 0.0026593804359436035, 0.002792865037918091, 0.002926349639892578, 0.0030598342418670654, 0.0031933188438415527, 0.00332680344581604, 0.0034602880477905273, 0.0035937726497650146, 0.003727257251739502, 0.0038607418537139893, 0.0039942264556884766, 0.004127711057662964, 0.004261195659637451, 0.0043946802616119385, 0.004528164863586426, 0.004661649465560913, 0.0047951340675354, 0.004928618669509888, 0.005062103271484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 20.0, 49.0, 117.0, 202.0, 273.0, 162.0, 76.0, 60.0, 17.0, 11.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08436357975006104, -0.08147940039634705, -0.07859522104263306, -0.07571104168891907, -0.07282686233520508, -0.06994268298149109, -0.0670585036277771, -0.06417432427406311, -0.06129014864563942, -0.05840596929192543, -0.05552178993821144, -0.05263761430978775, -0.04975343495607376, -0.04686925560235977, -0.04398507624864578, -0.04110089689493179, -0.038216717541217804, -0.035332538187503815, -0.032448358833789825, -0.029564181342720985, -0.026680001989006996, -0.023795822635293007, -0.020911645144224167, -0.018027465790510178, -0.015143286436796188, -0.012259107083082199, -0.009374928660690784, -0.00649075023829937, -0.0036065708845853806, -0.0007223915308713913, 0.0021617859601974487, 0.005045965313911438, 0.007930144667625427, 0.010814324021339417, 0.013698502443730831, 0.016582680866122246, 0.019466860219836235, 0.022351039573550224, 0.025235217064619064, 0.028119396418333054, 0.031003575772047043, 0.03388775512576103, 0.03677193447947502, 0.03965611010789871, 0.0425402894616127, 0.04542446881532669, 0.04830864816904068, 0.05119282752275467, 0.05407700687646866, 0.05696118623018265, 0.05984536558389664, 0.06272954493761063, 0.06561372429132462, 0.0684979036450386, 0.071382075548172, 0.07426625490188599, 0.07715043425559998, 0.08003461360931396, 0.08291879296302795, 0.08580297231674194, 0.08868715167045593, 0.09157133102416992, 0.09445551037788391, 0.0973396897315979, 0.10022386908531189]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 4.0, 11.0, 10.0, 5.0, 12.0, 15.0, 17.0, 18.0, 18.0, 15.0, 14.0, 18.0, 42.0, 32.0, 40.0, 30.0, 28.0, 53.0, 32.0, 42.0, 46.0, 44.0, 39.0, 44.0, 38.0, 53.0, 35.0, 37.0, 33.0, 26.0, 18.0, 18.0, 14.0, 11.0, 18.0, 10.0, 13.0, 6.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033133864402770996, -0.032058119773864746, -0.030982377007603645, -0.029906634241342545, -0.028830889612436295, -0.027755144983530045, -0.026679402217268944, -0.025603659451007843, -0.024527914822101593, -0.023452170193195343, -0.022376427426934242, -0.02130068466067314, -0.02022494003176689, -0.01914919540286064, -0.01807345263659954, -0.01699770987033844, -0.01592196524143219, -0.014846221543848515, -0.01377047784626484, -0.012694734148681164, -0.011618990451097488, -0.010543246753513813, -0.009467503055930138, -0.008391759358346462, -0.007316015660762787, -0.0062402719631791115, -0.005164528265595436, -0.004088784568011761, -0.0030130408704280853, -0.00193729717284441, -0.0008615534752607346, 0.00021419022232294083, 0.0012899339199066162, 0.0023656776174902916, 0.003441421315073967, 0.004517165012657642, 0.005592908710241318, 0.006668652407824993, 0.0077443961054086685, 0.008820139802992344, 0.00989588350057602, 0.010971627198159695, 0.01204737089574337, 0.013123114593327045, 0.01419885829091072, 0.015274601988494396, 0.01635034568607807, 0.017426088452339172, 0.018501833081245422, 0.019577577710151672, 0.020653320476412773, 0.021729063242673874, 0.022804807871580124, 0.023880552500486374, 0.024956295266747475, 0.026032038033008575, 0.027107782661914825, 0.028183527290821075, 0.029259270057082176, 0.030335012823343277, 0.03141075745224953, 0.03248650208115578, 0.03356224298477173, 0.03463798761367798, 0.03571373224258423]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 6.0, 0.0, 6.0, 5.0, 9.0, 16.0, 20.0, 24.0, 27.0, 45.0, 91.0, 99.0, 158.0, 222.0, 521.0, 1240.0, 2800.0, 8611.0, 122197.0, 4002190.0, 45941.0, 6566.0, 1902.0, 713.0, 287.0, 178.0, 120.0, 75.0, 57.0, 48.0, 25.0, 21.0, 15.0, 12.0, 12.0, 5.0, 3.0, 5.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02362060546875, -0.022787809371948242, -0.021955013275146484, -0.021122217178344727, -0.02028942108154297, -0.01945662498474121, -0.018623828887939453, -0.017791032791137695, -0.016958236694335938, -0.01612544059753418, -0.015292644500732422, -0.014459848403930664, -0.013627052307128906, -0.012794256210327148, -0.01196146011352539, -0.011128664016723633, -0.010295867919921875, -0.009463071823120117, -0.00863027572631836, -0.0077974796295166016, -0.006964683532714844, -0.006131887435913086, -0.005299091339111328, -0.00446629524230957, -0.0036334991455078125, -0.0028007030487060547, -0.001967906951904297, -0.001135110855102539, -0.00030231475830078125, 0.0005304813385009766, 0.0013632774353027344, 0.002196073532104492, 0.00302886962890625, 0.003861665725708008, 0.004694461822509766, 0.0055272579193115234, 0.006360054016113281, 0.007192850112915039, 0.008025646209716797, 0.008858442306518555, 0.009691238403320312, 0.01052403450012207, 0.011356830596923828, 0.012189626693725586, 0.013022422790527344, 0.013855218887329102, 0.01468801498413086, 0.015520811080932617, 0.016353607177734375, 0.017186403274536133, 0.01801919937133789, 0.01885199546813965, 0.019684791564941406, 0.020517587661743164, 0.021350383758544922, 0.02218317985534668, 0.023015975952148438, 0.023848772048950195, 0.024681568145751953, 0.02551436424255371, 0.02634716033935547, 0.027179956436157227, 0.028012752532958984, 0.028845548629760742, 0.0296783447265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 20.0, 85.0, 155.0, 202.0, 246.0, 168.0, 87.0, 19.0, 12.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0213775634765625, -0.020689725875854492, -0.020001888275146484, -0.019314050674438477, -0.01862621307373047, -0.01793837547302246, -0.017250537872314453, -0.016562700271606445, -0.015874862670898438, -0.01518702507019043, -0.014499187469482422, -0.013811349868774414, -0.013123512268066406, -0.012435674667358398, -0.01174783706665039, -0.011059999465942383, -0.010372161865234375, -0.009684324264526367, -0.00899648666381836, -0.008308649063110352, -0.007620811462402344, -0.006932973861694336, -0.006245136260986328, -0.00555729866027832, -0.0048694610595703125, -0.004181623458862305, -0.003493785858154297, -0.002805948257446289, -0.0021181106567382812, -0.0014302730560302734, -0.0007424354553222656, -5.459785461425781e-05, 0.00063323974609375, 0.0013210773468017578, 0.0020089149475097656, 0.0026967525482177734, 0.0033845901489257812, 0.004072427749633789, 0.004760265350341797, 0.005448102951049805, 0.0061359405517578125, 0.00682377815246582, 0.007511615753173828, 0.008199453353881836, 0.008887290954589844, 0.009575128555297852, 0.01026296615600586, 0.010950803756713867, 0.011638641357421875, 0.012326478958129883, 0.01301431655883789, 0.013702154159545898, 0.014389991760253906, 0.015077829360961914, 0.015765666961669922, 0.01645350456237793, 0.017141342163085938, 0.017829179763793945, 0.018517017364501953, 0.01920485496520996, 0.01989269256591797, 0.020580530166625977, 0.021268367767333984, 0.021956205368041992, 0.02264404296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 8.0, 11.0, 8.0, 19.0, 38.0, 59.0, 87.0, 185.0, 310.0, 534.0, 995.0, 1870.0, 3937.0, 9984.0, 34574.0, 223639.0, 3609495.0, 251562.0, 37799.0, 10791.0, 4154.0, 1966.0, 1028.0, 529.0, 311.0, 156.0, 99.0, 61.0, 29.0, 28.0, 10.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01122283935546875, -0.010877728462219238, -0.010532617568969727, -0.010187506675720215, -0.009842395782470703, -0.009497284889221191, -0.00915217399597168, -0.008807063102722168, -0.008461952209472656, -0.008116841316223145, -0.007771730422973633, -0.007426619529724121, -0.007081508636474609, -0.006736397743225098, -0.006391286849975586, -0.006046175956726074, -0.0057010650634765625, -0.005355954170227051, -0.005010843276977539, -0.004665732383728027, -0.004320621490478516, -0.003975510597229004, -0.003630399703979492, -0.0032852888107299805, -0.0029401779174804688, -0.002595067024230957, -0.0022499561309814453, -0.0019048452377319336, -0.0015597343444824219, -0.0012146234512329102, -0.0008695125579833984, -0.0005244016647338867, -0.000179290771484375, 0.00016582012176513672, 0.0005109310150146484, 0.0008560419082641602, 0.0012011528015136719, 0.0015462636947631836, 0.0018913745880126953, 0.002236485481262207, 0.0025815963745117188, 0.0029267072677612305, 0.003271818161010742, 0.003616929054260254, 0.003962039947509766, 0.004307150840759277, 0.004652261734008789, 0.004997372627258301, 0.0053424835205078125, 0.005687594413757324, 0.006032705307006836, 0.006377816200256348, 0.006722927093505859, 0.007068037986755371, 0.007413148880004883, 0.0077582597732543945, 0.008103370666503906, 0.008448481559753418, 0.00879359245300293, 0.009138703346252441, 0.009483814239501953, 0.009828925132751465, 0.010174036026000977, 0.010519146919250488, 0.0108642578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 20.0, 28.0, 47.0, 87.0, 164.0, 547.0, 1425.0, 991.0, 324.0, 125.0, 80.0, 63.0, 42.0, 36.0, 20.0, 11.0, 8.0, 6.0, 8.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0121002197265625, -0.011770963668823242, -0.011441707611083984, -0.011112451553344727, -0.010783195495605469, -0.010453939437866211, -0.010124683380126953, -0.009795427322387695, -0.009466171264648438, -0.00913691520690918, -0.008807659149169922, -0.008478403091430664, -0.008149147033691406, -0.007819890975952148, -0.007490634918212891, -0.007161378860473633, -0.006832122802734375, -0.006502866744995117, -0.006173610687255859, -0.0058443546295166016, -0.005515098571777344, -0.005185842514038086, -0.004856586456298828, -0.00452733039855957, -0.0041980743408203125, -0.0038688182830810547, -0.003539562225341797, -0.003210306167602539, -0.0028810501098632812, -0.0025517940521240234, -0.0022225379943847656, -0.0018932819366455078, -0.00156402587890625, -0.0012347698211669922, -0.0009055137634277344, -0.0005762577056884766, -0.00024700164794921875, 8.225440979003906e-05, 0.0004115104675292969, 0.0007407665252685547, 0.0010700225830078125, 0.0013992786407470703, 0.0017285346984863281, 0.002057790756225586, 0.0023870468139648438, 0.0027163028717041016, 0.0030455589294433594, 0.003374814987182617, 0.003704071044921875, 0.004033327102661133, 0.004362583160400391, 0.0046918392181396484, 0.005021095275878906, 0.005350351333618164, 0.005679607391357422, 0.00600886344909668, 0.0063381195068359375, 0.006667375564575195, 0.006996631622314453, 0.007325887680053711, 0.007655143737792969, 0.007984399795532227, 0.008313655853271484, 0.008642911911010742, 0.00897216796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 103.0, 369.0, 380.0, 107.0, 27.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13586591184139252, -0.13217034935951233, -0.12847478687763214, -0.12477922439575195, -0.12108366191387177, -0.11738809943199158, -0.11369254440069199, -0.1099969819188118, -0.10630141943693161, -0.10260585695505142, -0.09891029447317123, -0.09521473199129105, -0.09151917695999146, -0.08782361447811127, -0.08412805199623108, -0.08043248951435089, -0.0767369270324707, -0.07304136455059052, -0.06934580206871033, -0.06565023958683014, -0.06195468083024025, -0.05825911834836006, -0.05456355959177017, -0.050867997109889984, -0.047172434628009796, -0.04347687214612961, -0.03978130966424942, -0.03608575090765953, -0.03239018842577934, -0.028694625943899155, -0.024999065324664116, -0.021303504705429077, -0.01760794222354889, -0.013912380672991276, -0.010216819122433662, -0.006521257571876049, -0.0028256960213184357, 0.0008698664605617523, 0.004565427079796791, 0.00826098769903183, 0.011956550180912018, 0.015652112662792206, 0.019347673282027245, 0.023043233901262283, 0.02673879638314247, 0.03043435886502266, 0.03412991762161255, 0.03782548010349274, 0.041521042585372925, 0.04521660506725311, 0.0489121675491333, 0.05260772630572319, 0.05630328878760338, 0.059998851269483566, 0.06369441002607346, 0.06738997250795364, 0.07108553498983383, 0.07478109747171402, 0.07847665995359421, 0.0821722224354744, 0.08586777746677399, 0.08956333994865417, 0.09325890243053436, 0.09695446491241455, 0.10065002739429474]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 10.0, 13.0, 18.0, 15.0, 20.0, 24.0, 27.0, 30.0, 40.0, 42.0, 35.0, 46.0, 47.0, 37.0, 51.0, 48.0, 47.0, 48.0, 38.0, 42.0, 30.0, 29.0, 35.0, 23.0, 28.0, 22.0, 16.0, 15.0, 16.0, 12.0, 14.0, 10.0, 10.0, 13.0, 2.0, 1.0, 4.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021767079830169678, -0.021027568727731705, -0.02028805762529373, -0.01954854652285576, -0.018809035420417786, -0.018069524317979813, -0.01733001321554184, -0.016590502113103867, -0.015850991010665894, -0.01511147990822792, -0.014371968805789948, -0.013632457703351974, -0.012892946600914001, -0.012153435498476028, -0.011413924396038055, -0.010674413293600082, -0.00993490219116211, -0.009195391088724136, -0.008455879986286163, -0.00771636888384819, -0.006976857781410217, -0.006237346678972244, -0.005497835576534271, -0.004758324474096298, -0.004018813371658325, -0.003279302269220352, -0.002539791166782379, -0.0018002800643444061, -0.001060768961906433, -0.0003212578594684601, 0.00041825324296951294, 0.001157764345407486, 0.001897275447845459, 0.002636786550283432, 0.003376297652721405, 0.004115808755159378, 0.004855319857597351, 0.005594830960035324, 0.006334342062473297, 0.00707385316491127, 0.007813364267349243, 0.008552875369787216, 0.00929238647222519, 0.010031897574663162, 0.010771408677101135, 0.011510919779539108, 0.012250430881977081, 0.012989941984415054, 0.013729453086853027, 0.014468964189291, 0.015208475291728973, 0.015947986394166946, 0.01668749749660492, 0.017427008599042892, 0.018166519701480865, 0.01890603080391884, 0.01964554190635681, 0.020385053008794785, 0.021124564111232758, 0.02186407521367073, 0.022603586316108704, 0.023343097418546677, 0.02408260852098465, 0.024822119623422623, 0.025561630725860596]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 15.0, 11.0, 26.0, 40.0, 40.0, 63.0, 98.0, 123.0, 161.0, 195.0, 331.0, 454.0, 797.0, 1613.0, 5223.0, 44350.0, 818456.0, 161439.0, 9970.0, 2325.0, 954.0, 585.0, 365.0, 270.0, 182.0, 131.0, 85.0, 80.0, 48.0, 28.0, 28.0, 20.0, 12.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0274200439453125, -0.026581287384033203, -0.025742530822753906, -0.02490377426147461, -0.024065017700195312, -0.023226261138916016, -0.02238750457763672, -0.021548748016357422, -0.020709991455078125, -0.019871234893798828, -0.01903247833251953, -0.018193721771240234, -0.017354965209960938, -0.01651620864868164, -0.015677452087402344, -0.014838695526123047, -0.01399993896484375, -0.013161182403564453, -0.012322425842285156, -0.01148366928100586, -0.010644912719726562, -0.009806156158447266, -0.008967399597167969, -0.008128643035888672, -0.007289886474609375, -0.006451129913330078, -0.005612373352050781, -0.004773616790771484, -0.0039348602294921875, -0.0030961036682128906, -0.0022573471069335938, -0.0014185905456542969, -0.000579833984375, 0.0002589225769042969, 0.0010976791381835938, 0.0019364356994628906, 0.0027751922607421875, 0.0036139488220214844, 0.004452705383300781, 0.005291461944580078, 0.006130218505859375, 0.006968975067138672, 0.007807731628417969, 0.008646488189697266, 0.009485244750976562, 0.01032400131225586, 0.011162757873535156, 0.012001514434814453, 0.01284027099609375, 0.013679027557373047, 0.014517784118652344, 0.01535654067993164, 0.016195297241210938, 0.017034053802490234, 0.01787281036376953, 0.018711566925048828, 0.019550323486328125, 0.020389080047607422, 0.02122783660888672, 0.022066593170166016, 0.022905349731445312, 0.02374410629272461, 0.024582862854003906, 0.025421619415283203, 0.0262603759765625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 31.0, 87.0, 159.0, 215.0, 223.0, 166.0, 73.0, 25.0, 13.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021270751953125, -0.020583629608154297, -0.019896507263183594, -0.01920938491821289, -0.018522262573242188, -0.017835140228271484, -0.01714801788330078, -0.016460895538330078, -0.015773773193359375, -0.015086650848388672, -0.014399528503417969, -0.013712406158447266, -0.013025283813476562, -0.01233816146850586, -0.011651039123535156, -0.010963916778564453, -0.01027679443359375, -0.009589672088623047, -0.008902549743652344, -0.00821542739868164, -0.0075283050537109375, -0.006841182708740234, -0.006154060363769531, -0.005466938018798828, -0.004779815673828125, -0.004092693328857422, -0.0034055709838867188, -0.0027184486389160156, -0.0020313262939453125, -0.0013442039489746094, -0.0006570816040039062, 3.0040740966796875e-05, 0.0007171630859375, 0.0014042854309082031, 0.0020914077758789062, 0.0027785301208496094, 0.0034656524658203125, 0.004152774810791016, 0.004839897155761719, 0.005527019500732422, 0.006214141845703125, 0.006901264190673828, 0.007588386535644531, 0.008275508880615234, 0.008962631225585938, 0.00964975357055664, 0.010336875915527344, 0.011023998260498047, 0.01171112060546875, 0.012398242950439453, 0.013085365295410156, 0.01377248764038086, 0.014459609985351562, 0.015146732330322266, 0.01583385467529297, 0.016520977020263672, 0.017208099365234375, 0.017895221710205078, 0.01858234405517578, 0.019269466400146484, 0.019956588745117188, 0.02064371109008789, 0.021330833435058594, 0.022017955780029297, 0.022705078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 20.0, 25.0, 52.0, 59.0, 97.0, 149.0, 235.0, 420.0, 678.0, 1394.0, 2722.0, 6078.0, 14114.0, 42606.0, 172000.0, 495871.0, 227357.0, 53795.0, 17143.0, 6846.0, 3271.0, 1606.0, 809.0, 434.0, 286.0, 139.0, 105.0, 73.0, 34.0, 23.0, 16.0, 13.0, 13.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0104827880859375, -0.010161161422729492, -0.009839534759521484, -0.009517908096313477, -0.009196281433105469, -0.008874654769897461, -0.008553028106689453, -0.008231401443481445, -0.007909774780273438, -0.00758814811706543, -0.007266521453857422, -0.006944894790649414, -0.006623268127441406, -0.0063016414642333984, -0.005980014801025391, -0.005658388137817383, -0.005336761474609375, -0.005015134811401367, -0.004693508148193359, -0.0043718814849853516, -0.004050254821777344, -0.003728628158569336, -0.003407001495361328, -0.0030853748321533203, -0.0027637481689453125, -0.0024421215057373047, -0.002120494842529297, -0.001798868179321289, -0.0014772415161132812, -0.0011556148529052734, -0.0008339881896972656, -0.0005123615264892578, -0.00019073486328125, 0.0001308917999267578, 0.0004525184631347656, 0.0007741451263427734, 0.0010957717895507812, 0.001417398452758789, 0.0017390251159667969, 0.0020606517791748047, 0.0023822784423828125, 0.0027039051055908203, 0.003025531768798828, 0.003347158432006836, 0.0036687850952148438, 0.0039904117584228516, 0.004312038421630859, 0.004633665084838867, 0.004955291748046875, 0.005276918411254883, 0.005598545074462891, 0.0059201717376708984, 0.006241798400878906, 0.006563425064086914, 0.006885051727294922, 0.00720667839050293, 0.0075283050537109375, 0.007849931716918945, 0.008171558380126953, 0.008493185043334961, 0.008814811706542969, 0.009136438369750977, 0.009458065032958984, 0.009779691696166992, 0.010101318359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 4.0, 7.0, 11.0, 16.0, 15.0, 13.0, 13.0, 19.0, 32.0, 24.0, 34.0, 37.0, 57.0, 47.0, 55.0, 59.0, 62.0, 51.0, 50.0, 50.0, 34.0, 51.0, 41.0, 36.0, 25.0, 32.0, 28.0, 15.0, 19.0, 8.0, 7.0, 11.0, 10.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0156707763671875, -0.015208601951599121, -0.014746427536010742, -0.014284253120422363, -0.013822078704833984, -0.013359904289245605, -0.012897729873657227, -0.012435555458068848, -0.011973381042480469, -0.01151120662689209, -0.011049032211303711, -0.010586857795715332, -0.010124683380126953, -0.009662508964538574, -0.009200334548950195, -0.008738160133361816, -0.008275985717773438, -0.007813811302185059, -0.00735163688659668, -0.006889462471008301, -0.006427288055419922, -0.005965113639831543, -0.005502939224243164, -0.005040764808654785, -0.004578590393066406, -0.004116415977478027, -0.0036542415618896484, -0.0031920671463012695, -0.0027298927307128906, -0.0022677183151245117, -0.0018055438995361328, -0.001343369483947754, -0.000881195068359375, -0.0004190206527709961, 4.315376281738281e-05, 0.0005053281784057617, 0.0009675025939941406, 0.0014296770095825195, 0.0018918514251708984, 0.0023540258407592773, 0.0028162002563476562, 0.003278374671936035, 0.003740549087524414, 0.004202723503112793, 0.004664897918701172, 0.005127072334289551, 0.00558924674987793, 0.006051421165466309, 0.0065135955810546875, 0.006975769996643066, 0.007437944412231445, 0.007900118827819824, 0.008362293243408203, 0.008824467658996582, 0.009286642074584961, 0.00974881649017334, 0.010210990905761719, 0.010673165321350098, 0.011135339736938477, 0.011597514152526855, 0.012059688568115234, 0.012521862983703613, 0.012984037399291992, 0.013446211814880371, 0.01390838623046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 8.0, 22.0, 23.0, 32.0, 55.0, 62.0, 161.0, 213.0, 387.0, 646.0, 1274.0, 2394.0, 4585.0, 10083.0, 31761.0, 267382.0, 643935.0, 58421.0, 14586.0, 5963.0, 2935.0, 1563.0, 797.0, 521.0, 282.0, 158.0, 91.0, 60.0, 40.0, 31.0, 19.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00710296630859375, -0.0068416595458984375, -0.006580352783203125, -0.0063190460205078125, -0.0060577392578125, -0.0057964324951171875, -0.005535125732421875, -0.0052738189697265625, -0.00501251220703125, -0.0047512054443359375, -0.004489898681640625, -0.0042285919189453125, -0.00396728515625, -0.0037059783935546875, -0.003444671630859375, -0.0031833648681640625, -0.00292205810546875, -0.0026607513427734375, -0.002399444580078125, -0.0021381378173828125, -0.0018768310546875, -0.0016155242919921875, -0.001354217529296875, -0.0010929107666015625, -0.00083160400390625, -0.0005702972412109375, -0.000308990478515625, -4.76837158203125e-05, 0.000213623046875, 0.0004749298095703125, 0.000736236572265625, 0.0009975433349609375, 0.00125885009765625, 0.0015201568603515625, 0.001781463623046875, 0.0020427703857421875, 0.0023040771484375, 0.0025653839111328125, 0.002826690673828125, 0.0030879974365234375, 0.00334930419921875, 0.0036106109619140625, 0.003871917724609375, 0.0041332244873046875, 0.00439453125, 0.0046558380126953125, 0.004917144775390625, 0.0051784515380859375, 0.00543975830078125, 0.0057010650634765625, 0.005962371826171875, 0.0062236785888671875, 0.0064849853515625, 0.0067462921142578125, 0.007007598876953125, 0.0072689056396484375, 0.00753021240234375, 0.0077915191650390625, 0.008052825927734375, 0.008314132690429688, 0.008575439453125, 0.008836746215820312, 0.009098052978515625, 0.009359359741210938, 0.00962066650390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 1.0, 10.0, 4.0, 10.0, 18.0, 16.0, 19.0, 35.0, 43.0, 40.0, 58.0, 78.0, 97.0, 103.0, 92.0, 66.0, 71.0, 55.0, 42.0, 30.0, 27.0, 25.0, 11.0, 15.0, 10.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.88453796505928e-05, -8.536316454410553e-05, -8.188094943761826e-05, -7.839873433113098e-05, -7.491651922464371e-05, -7.143430411815643e-05, -6.795208901166916e-05, -6.446987390518188e-05, -6.098765879869461e-05, -5.7505443692207336e-05, -5.402322858572006e-05, -5.054101347923279e-05, -4.7058798372745514e-05, -4.357658326625824e-05, -4.0094368159770966e-05, -3.661215305328369e-05, -3.312993794679642e-05, -2.9647722840309143e-05, -2.616550773382187e-05, -2.2683292627334595e-05, -1.920107752084732e-05, -1.5718862414360046e-05, -1.2236647307872772e-05, -8.754432201385498e-06, -5.272217094898224e-06, -1.7900019884109497e-06, 1.6922131180763245e-06, 5.174428224563599e-06, 8.656643331050873e-06, 1.2138858437538147e-05, 1.562107354402542e-05, 1.9103288650512695e-05, 2.258550375699997e-05, 2.6067718863487244e-05, 2.9549933969974518e-05, 3.303214907646179e-05, 3.6514364182949066e-05, 3.999657928943634e-05, 4.3478794395923615e-05, 4.696100950241089e-05, 5.044322460889816e-05, 5.392543971538544e-05, 5.740765482187271e-05, 6.0889869928359985e-05, 6.437208503484726e-05, 6.785430014133453e-05, 7.133651524782181e-05, 7.481873035430908e-05, 7.830094546079636e-05, 8.178316056728363e-05, 8.52653756737709e-05, 8.874759078025818e-05, 9.222980588674545e-05, 9.571202099323273e-05, 9.919423609972e-05, 0.00010267645120620728, 0.00010615866631269455, 0.00010964088141918182, 0.0001131230965256691, 0.00011660531163215637, 0.00012008752673864365, 0.00012356974184513092, 0.0001270519569516182, 0.00013053417205810547]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 14.0, 26.0, 44.0, 55.0, 90.0, 165.0, 276.0, 397.0, 763.0, 1505.0, 3187.0, 8295.0, 33752.0, 564664.0, 393983.0, 27728.0, 7478.0, 2977.0, 1350.0, 687.0, 411.0, 255.0, 161.0, 103.0, 64.0, 38.0, 23.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0092926025390625, -0.008971571922302246, -0.008650541305541992, -0.008329510688781738, -0.008008480072021484, -0.0076874494552612305, -0.0073664188385009766, -0.007045388221740723, -0.006724357604980469, -0.006403326988220215, -0.006082296371459961, -0.005761265754699707, -0.005440235137939453, -0.005119204521179199, -0.004798173904418945, -0.004477143287658691, -0.0041561126708984375, -0.0038350820541381836, -0.0035140514373779297, -0.0031930208206176758, -0.002871990203857422, -0.002550959587097168, -0.002229928970336914, -0.0019088983535766602, -0.0015878677368164062, -0.0012668371200561523, -0.0009458065032958984, -0.0006247758865356445, -0.0003037452697753906, 1.728534698486328e-05, 0.0003383159637451172, 0.0006593465805053711, 0.000980377197265625, 0.001301407814025879, 0.0016224384307861328, 0.0019434690475463867, 0.0022644996643066406, 0.0025855302810668945, 0.0029065608978271484, 0.0032275915145874023, 0.0035486221313476562, 0.00386965274810791, 0.004190683364868164, 0.004511713981628418, 0.004832744598388672, 0.005153775215148926, 0.00547480583190918, 0.005795836448669434, 0.0061168670654296875, 0.006437897682189941, 0.006758928298950195, 0.007079958915710449, 0.007400989532470703, 0.007722020149230957, 0.008043050765991211, 0.008364081382751465, 0.008685111999511719, 0.009006142616271973, 0.009327173233032227, 0.00964820384979248, 0.009969234466552734, 0.010290265083312988, 0.010611295700073242, 0.010932326316833496, 0.01125335693359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 11.0, 5.0, 3.0, 14.0, 23.0, 38.0, 88.0, 177.0, 305.0, 143.0, 72.0, 41.0, 14.0, 14.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0105133056640625, -0.010216474533081055, -0.00991964340209961, -0.009622812271118164, -0.009325981140136719, -0.009029150009155273, -0.008732318878173828, -0.008435487747192383, -0.008138656616210938, -0.007841825485229492, -0.007544994354248047, -0.0072481632232666016, -0.006951332092285156, -0.006654500961303711, -0.006357669830322266, -0.00606083869934082, -0.005764007568359375, -0.00546717643737793, -0.005170345306396484, -0.004873514175415039, -0.004576683044433594, -0.0042798519134521484, -0.003983020782470703, -0.003686189651489258, -0.0033893585205078125, -0.003092527389526367, -0.002795696258544922, -0.0024988651275634766, -0.0022020339965820312, -0.001905202865600586, -0.0016083717346191406, -0.0013115406036376953, -0.00101470947265625, -0.0007178783416748047, -0.0004210472106933594, -0.00012421607971191406, 0.00017261505126953125, 0.00046944618225097656, 0.0007662773132324219, 0.0010631084442138672, 0.0013599395751953125, 0.0016567707061767578, 0.001953601837158203, 0.0022504329681396484, 0.0025472640991210938, 0.002844095230102539, 0.0031409263610839844, 0.0034377574920654297, 0.003734588623046875, 0.00403141975402832, 0.004328250885009766, 0.004625082015991211, 0.004921913146972656, 0.0052187442779541016, 0.005515575408935547, 0.005812406539916992, 0.0061092376708984375, 0.006406068801879883, 0.006702899932861328, 0.0069997310638427734, 0.007296562194824219, 0.007593393325805664, 0.00789022445678711, 0.008187055587768555, 0.00848388671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 25.0, 111.0, 525.0, 288.0, 52.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07419072836637497, -0.06646933406591415, -0.05874794349074364, -0.05102655291557312, -0.043305158615112305, -0.03558376803994179, -0.02786237746477127, -0.020140983164310455, -0.012419592589139938, -0.0046982006169855595, 0.0030231913551688194, 0.010744582861661911, 0.018465975299477577, 0.026187367737293243, 0.03390875831246376, 0.041630152612924576, 0.04935154318809509, 0.05707293376326561, 0.06479432433843613, 0.07251571863889694, 0.08023711293935776, 0.08795849978923798, 0.09567989408969879, 0.1034012883901596, 0.11112268269062042, 0.11884407699108124, 0.12656547129154205, 0.13428685069084167, 0.1420082449913025, 0.1497296392917633, 0.15745103359222412, 0.16517242789268494, 0.17289380729198456, 0.18061520159244537, 0.1883365958929062, 0.1960579752922058, 0.20377936959266663, 0.21150076389312744, 0.21922215819358826, 0.22694355249404907, 0.2346649467945099, 0.2423863410949707, 0.2501077353954315, 0.25782912969589233, 0.26555052399635315, 0.27327191829681396, 0.2809932827949524, 0.2887147068977356, 0.296436071395874, 0.30415746569633484, 0.31187885999679565, 0.31960025429725647, 0.3273216485977173, 0.3350430428981781, 0.3427644371986389, 0.35048580169677734, 0.35820722579956055, 0.36592862010002136, 0.3736500144004822, 0.381371408700943, 0.3890928030014038, 0.3968141973018646, 0.40453559160232544, 0.41225695610046387, 0.4199783504009247]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 6.0, 10.0, 3.0, 16.0, 11.0, 23.0, 15.0, 19.0, 37.0, 35.0, 40.0, 35.0, 45.0, 45.0, 66.0, 47.0, 60.0, 52.0, 59.0, 60.0, 61.0, 48.0, 41.0, 36.0, 27.0, 23.0, 25.0, 16.0, 12.0, 13.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0664941668510437, -0.06496723741292953, -0.06344031542539597, -0.0619133859872818, -0.06038646027445793, -0.058859534561634064, -0.0573326051235199, -0.05580567941069603, -0.05427875369787216, -0.052751827985048294, -0.051224902272224426, -0.04969797283411026, -0.04817104712128639, -0.046644121408462524, -0.04511719197034836, -0.04359026625752449, -0.04206334054470062, -0.040536414831876755, -0.03900948911905289, -0.03748255968093872, -0.03595563396811485, -0.034428708255290985, -0.03290177881717682, -0.03137485310435295, -0.029847927391529083, -0.028321001678705215, -0.0267940741032362, -0.02526714652776718, -0.023740220814943314, -0.022213295102119446, -0.02068636752665043, -0.019159439951181412, -0.017632514238357544, -0.016105588525533676, -0.014578660950064659, -0.013051734305918217, -0.011524807661771774, -0.009997881017625332, -0.00847095437347889, -0.006944027729332447, -0.005417101085186005, -0.0038901744410395622, -0.00236324779689312, -0.0008363211527466774, 0.000690605491399765, 0.0022175321355462074, 0.00374445877969265, 0.005271385423839092, 0.006798312067985535, 0.008325238712131977, 0.00985216535627842, 0.011379092000424862, 0.012906018644571304, 0.014432945288717747, 0.01595987193286419, 0.017486799508333206, 0.019013725221157074, 0.020540650933980942, 0.02206757850944996, 0.023594506084918976, 0.025121431797742844, 0.02664835751056671, 0.02817528508603573, 0.029702212661504745, 0.031229138374328613]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 14.0, 25.0, 36.0, 53.0, 125.0, 215.0, 527.0, 1987.0, 9753.0, 3838778.0, 335227.0, 5724.0, 1130.0, 337.0, 147.0, 75.0, 48.0, 28.0, 18.0, 17.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.03751373291015625, -0.0361175537109375, -0.03472137451171875, -0.0333251953125, -0.03192901611328125, -0.0305328369140625, -0.02913665771484375, -0.027740478515625, -0.02634429931640625, -0.0249481201171875, -0.02355194091796875, -0.02215576171875, -0.02075958251953125, -0.0193634033203125, -0.01796722412109375, -0.016571044921875, -0.01517486572265625, -0.0137786865234375, -0.01238250732421875, -0.010986328125, -0.00959014892578125, -0.0081939697265625, -0.00679779052734375, -0.005401611328125, -0.00400543212890625, -0.0026092529296875, -0.00121307373046875, 0.00018310546875, 0.00157928466796875, 0.0029754638671875, 0.00437164306640625, 0.005767822265625, 0.00716400146484375, 0.0085601806640625, 0.00995635986328125, 0.0113525390625, 0.01274871826171875, 0.0141448974609375, 0.01554107666015625, 0.016937255859375, 0.01833343505859375, 0.0197296142578125, 0.02112579345703125, 0.02252197265625, 0.02391815185546875, 0.0253143310546875, 0.02671051025390625, 0.028106689453125, 0.02950286865234375, 0.0308990478515625, 0.03229522705078125, 0.03369140625, 0.03508758544921875, 0.0364837646484375, 0.03787994384765625, 0.039276123046875, 0.04067230224609375, 0.0420684814453125, 0.04346466064453125, 0.04486083984375, 0.04625701904296875, 0.0476531982421875, 0.04904937744140625, 0.050445556640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 41.0, 74.0, 163.0, 210.0, 243.0, 149.0, 74.0, 20.0, 13.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213775634765625, -0.020686864852905273, -0.019996166229248047, -0.01930546760559082, -0.018614768981933594, -0.017924070358276367, -0.01723337173461914, -0.016542673110961914, -0.015851974487304688, -0.015161275863647461, -0.014470577239990234, -0.013779878616333008, -0.013089179992675781, -0.012398481369018555, -0.011707782745361328, -0.011017084121704102, -0.010326385498046875, -0.009635686874389648, -0.008944988250732422, -0.008254289627075195, -0.007563591003417969, -0.006872892379760742, -0.006182193756103516, -0.005491495132446289, -0.0048007965087890625, -0.004110097885131836, -0.0034193992614746094, -0.002728700637817383, -0.0020380020141601562, -0.0013473033905029297, -0.0006566047668457031, 3.409385681152344e-05, 0.00072479248046875, 0.0014154911041259766, 0.002106189727783203, 0.0027968883514404297, 0.0034875869750976562, 0.004178285598754883, 0.004868984222412109, 0.005559682846069336, 0.0062503814697265625, 0.006941080093383789, 0.007631778717041016, 0.008322477340698242, 0.009013175964355469, 0.009703874588012695, 0.010394573211669922, 0.011085271835327148, 0.011775970458984375, 0.012466669082641602, 0.013157367706298828, 0.013848066329956055, 0.014538764953613281, 0.015229463577270508, 0.015920162200927734, 0.01661086082458496, 0.017301559448242188, 0.017992258071899414, 0.01868295669555664, 0.019373655319213867, 0.020064353942871094, 0.02075505256652832, 0.021445751190185547, 0.022136449813842773, 0.0228271484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 9.0, 11.0, 18.0, 21.0, 22.0, 37.0, 64.0, 74.0, 106.0, 179.0, 274.0, 512.0, 990.0, 2571.0, 8595.0, 50704.0, 3526844.0, 566906.0, 26932.0, 5580.0, 1860.0, 816.0, 441.0, 215.0, 140.0, 90.0, 56.0, 50.0, 48.0, 24.0, 14.0, 13.0, 10.0, 5.0, 8.0, 7.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0223236083984375, -0.02170085906982422, -0.021078109741210938, -0.020455360412597656, -0.019832611083984375, -0.019209861755371094, -0.018587112426757812, -0.01796436309814453, -0.01734161376953125, -0.01671886444091797, -0.016096115112304688, -0.015473365783691406, -0.014850616455078125, -0.014227867126464844, -0.013605117797851562, -0.012982368469238281, -0.012359619140625, -0.011736869812011719, -0.011114120483398438, -0.010491371154785156, -0.009868621826171875, -0.009245872497558594, -0.008623123168945312, -0.008000373840332031, -0.00737762451171875, -0.006754875183105469, -0.0061321258544921875, -0.005509376525878906, -0.004886627197265625, -0.004263877868652344, -0.0036411285400390625, -0.0030183792114257812, -0.0023956298828125, -0.0017728805541992188, -0.0011501312255859375, -0.0005273818969726562, 9.5367431640625e-05, 0.0007181167602539062, 0.0013408660888671875, 0.0019636154174804688, 0.00258636474609375, 0.0032091140747070312, 0.0038318634033203125, 0.004454612731933594, 0.005077362060546875, 0.005700111389160156, 0.0063228607177734375, 0.006945610046386719, 0.007568359375, 0.008191108703613281, 0.008813858032226562, 0.009436607360839844, 0.010059356689453125, 0.010682106018066406, 0.011304855346679688, 0.011927604675292969, 0.01255035400390625, 0.013173103332519531, 0.013795852661132812, 0.014418601989746094, 0.015041351318359375, 0.015664100646972656, 0.016286849975585938, 0.01690959930419922, 0.0175323486328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 12.0, 25.0, 60.0, 192.0, 1130.0, 2154.0, 303.0, 99.0, 36.0, 25.0, 14.0, 11.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.029846906661987305, -0.02908468246459961, -0.028322458267211914, -0.02756023406982422, -0.026798009872436523, -0.026035785675048828, -0.025273561477661133, -0.024511337280273438, -0.023749113082885742, -0.022986888885498047, -0.02222466468811035, -0.021462440490722656, -0.02070021629333496, -0.019937992095947266, -0.01917576789855957, -0.018413543701171875, -0.01765131950378418, -0.016889095306396484, -0.01612687110900879, -0.015364646911621094, -0.014602422714233398, -0.013840198516845703, -0.013077974319458008, -0.012315750122070312, -0.011553525924682617, -0.010791301727294922, -0.010029077529907227, -0.009266853332519531, -0.008504629135131836, -0.007742404937744141, -0.006980180740356445, -0.00621795654296875, -0.005455732345581055, -0.004693508148193359, -0.003931283950805664, -0.0031690597534179688, -0.0024068355560302734, -0.0016446113586425781, -0.0008823871612548828, -0.0001201629638671875, 0.0006420612335205078, 0.0014042854309082031, 0.0021665096282958984, 0.0029287338256835938, 0.003690958023071289, 0.004453182220458984, 0.00521540641784668, 0.005977630615234375, 0.00673985481262207, 0.007502079010009766, 0.008264303207397461, 0.009026527404785156, 0.009788751602172852, 0.010550975799560547, 0.011313199996948242, 0.012075424194335938, 0.012837648391723633, 0.013599872589111328, 0.014362096786499023, 0.015124320983886719, 0.015886545181274414, 0.01664876937866211, 0.017410993576049805, 0.0181732177734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 33.0, 93.0, 240.0, 354.0, 191.0, 53.0, 24.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15923556685447693, -0.15571248531341553, -0.15218941867351532, -0.14866633713245392, -0.1451432704925537, -0.1416201889514923, -0.1380971223115921, -0.1345740407705307, -0.1310509741306305, -0.1275278925895691, -0.12400482594966888, -0.12048175185918808, -0.11695867776870728, -0.11343559622764587, -0.10991252213716507, -0.10638944804668427, -0.10286636650562286, -0.09934329241514206, -0.09582021832466125, -0.09229714423418045, -0.08877407014369965, -0.08525098860263824, -0.08172791451215744, -0.07820484042167664, -0.07468176633119583, -0.07115869224071503, -0.06763561815023422, -0.06411254405975342, -0.060589466243982315, -0.05706639215350151, -0.05354331433773041, -0.0500202402472496, -0.0464971587061882, -0.0429740846157074, -0.03945101052522659, -0.03592793270945549, -0.032404858618974686, -0.02888178452849388, -0.025358708575367928, -0.021835632622241974, -0.01831255853176117, -0.01478948350995779, -0.011266408488154411, -0.007743333466351032, -0.004220258444547653, -0.0006971843540668488, 0.002825891599059105, 0.006348967552185059, 0.009872041642665863, 0.013395116664469242, 0.01691819168627262, 0.020441267639398575, 0.02396434172987938, 0.027487415820360184, 0.031010491773486137, 0.03453356772661209, 0.038056641817092896, 0.0415797159075737, 0.045102789998054504, 0.04862586781382561, 0.05214894190430641, 0.055672015994787216, 0.05919509381055832, 0.06271816790103912, 0.06624124199151993]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 10.0, 10.0, 10.0, 16.0, 21.0, 20.0, 32.0, 34.0, 34.0, 38.0, 49.0, 54.0, 55.0, 50.0, 51.0, 52.0, 61.0, 46.0, 33.0, 43.0, 46.0, 38.0, 22.0, 26.0, 24.0, 21.0, 19.0, 11.0, 14.0, 6.0, 11.0, 3.0, 2.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030446171760559082, -0.029427191242575645, -0.02840821072459221, -0.027389230206608772, -0.026370249688625336, -0.0253512691706419, -0.024332288652658463, -0.023313308134675026, -0.02229432761669159, -0.021275347098708153, -0.020256366580724716, -0.01923738606274128, -0.018218405544757843, -0.017199425026774406, -0.01618044450879097, -0.015161463990807533, -0.014142483472824097, -0.01312350295484066, -0.012104522436857224, -0.011085541918873787, -0.01006656140089035, -0.009047580882906914, -0.008028600364923477, -0.007009619846940041, -0.005990639328956604, -0.004971658810973167, -0.003952678292989731, -0.0029336977750062943, -0.0019147172570228577, -0.0008957367390394211, 0.0001232437789440155, 0.001142224296927452, 0.0021612048149108887, 0.0031801853328943253, 0.004199165850877762, 0.005218146368861198, 0.006237126886844635, 0.007256107404828072, 0.008275087922811508, 0.009294068440794945, 0.010313048958778381, 0.011332029476761818, 0.012351009994745255, 0.013369990512728691, 0.014388971030712128, 0.015407951548695564, 0.016426932066679, 0.017445912584662437, 0.018464893102645874, 0.01948387362062931, 0.020502854138612747, 0.021521834656596184, 0.02254081517457962, 0.023559795692563057, 0.024578776210546494, 0.02559775672852993, 0.026616737246513367, 0.027635717764496803, 0.02865469828248024, 0.029673678800463676, 0.030692659318447113, 0.0317116379737854, 0.032730620354413986, 0.03374960273504257, 0.03476858139038086]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 10.0, 9.0, 19.0, 21.0, 30.0, 42.0, 61.0, 86.0, 119.0, 191.0, 265.0, 395.0, 634.0, 1226.0, 3076.0, 14872.0, 336185.0, 656943.0, 26592.0, 4144.0, 1468.0, 708.0, 465.0, 293.0, 224.0, 141.0, 71.0, 72.0, 47.0, 39.0, 29.0, 13.0, 13.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024261474609375, -0.023366928100585938, -0.022472381591796875, -0.021577835083007812, -0.02068328857421875, -0.019788742065429688, -0.018894195556640625, -0.017999649047851562, -0.0171051025390625, -0.016210556030273438, -0.015316009521484375, -0.014421463012695312, -0.01352691650390625, -0.012632369995117188, -0.011737823486328125, -0.010843276977539062, -0.00994873046875, -0.009054183959960938, -0.008159637451171875, -0.0072650909423828125, -0.00637054443359375, -0.0054759979248046875, -0.004581451416015625, -0.0036869049072265625, -0.0027923583984375, -0.0018978118896484375, -0.001003265380859375, -0.0001087188720703125, 0.00078582763671875, 0.0016803741455078125, 0.002574920654296875, 0.0034694671630859375, 0.004364013671875, 0.0052585601806640625, 0.006153106689453125, 0.0070476531982421875, 0.00794219970703125, 0.008836746215820312, 0.009731292724609375, 0.010625839233398438, 0.0115203857421875, 0.012414932250976562, 0.013309478759765625, 0.014204025268554688, 0.01509857177734375, 0.015993118286132812, 0.016887664794921875, 0.017782211303710938, 0.0186767578125, 0.019571304321289062, 0.020465850830078125, 0.021360397338867188, 0.02225494384765625, 0.023149490356445312, 0.024044036865234375, 0.024938583374023438, 0.0258331298828125, 0.026727676391601562, 0.027622222900390625, 0.028516769409179688, 0.02941131591796875, 0.030305862426757812, 0.031200408935546875, 0.03209495544433594, 0.032989501953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 28.0, 85.0, 170.0, 227.0, 224.0, 149.0, 70.0, 21.0, 16.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02288818359375, -0.022147417068481445, -0.02140665054321289, -0.020665884017944336, -0.01992511749267578, -0.019184350967407227, -0.018443584442138672, -0.017702817916870117, -0.016962051391601562, -0.016221284866333008, -0.015480518341064453, -0.014739751815795898, -0.013998985290527344, -0.013258218765258789, -0.012517452239990234, -0.01177668571472168, -0.011035919189453125, -0.01029515266418457, -0.009554386138916016, -0.008813619613647461, -0.008072853088378906, -0.0073320865631103516, -0.006591320037841797, -0.005850553512573242, -0.0051097869873046875, -0.004369020462036133, -0.003628253936767578, -0.0028874874114990234, -0.0021467208862304688, -0.001405954360961914, -0.0006651878356933594, 7.557868957519531e-05, 0.00081634521484375, 0.0015571117401123047, 0.0022978782653808594, 0.003038644790649414, 0.0037794113159179688, 0.0045201778411865234, 0.005260944366455078, 0.006001710891723633, 0.0067424774169921875, 0.007483243942260742, 0.008224010467529297, 0.008964776992797852, 0.009705543518066406, 0.010446310043334961, 0.011187076568603516, 0.01192784309387207, 0.012668609619140625, 0.01340937614440918, 0.014150142669677734, 0.014890909194946289, 0.015631675720214844, 0.0163724422454834, 0.017113208770751953, 0.017853975296020508, 0.018594741821289062, 0.019335508346557617, 0.020076274871826172, 0.020817041397094727, 0.02155780792236328, 0.022298574447631836, 0.02303934097290039, 0.023780107498168945, 0.0245208740234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 15.0, 24.0, 20.0, 31.0, 49.0, 62.0, 121.0, 201.0, 383.0, 742.0, 1494.0, 3302.0, 7800.0, 21052.0, 66192.0, 238427.0, 448168.0, 180973.0, 50781.0, 16766.0, 6365.0, 2882.0, 1229.0, 621.0, 315.0, 189.0, 95.0, 58.0, 43.0, 28.0, 22.0, 20.0, 16.0, 12.0, 13.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.01198577880859375, -0.0116652250289917, -0.011344671249389648, -0.011024117469787598, -0.010703563690185547, -0.010383009910583496, -0.010062456130981445, -0.009741902351379395, -0.009421348571777344, -0.009100794792175293, -0.008780241012573242, -0.008459687232971191, -0.00813913345336914, -0.00781857967376709, -0.007498025894165039, -0.007177472114562988, -0.0068569183349609375, -0.006536364555358887, -0.006215810775756836, -0.005895256996154785, -0.005574703216552734, -0.005254149436950684, -0.004933595657348633, -0.004613041877746582, -0.004292488098144531, -0.0039719343185424805, -0.0036513805389404297, -0.003330826759338379, -0.003010272979736328, -0.0026897192001342773, -0.0023691654205322266, -0.0020486116409301758, -0.001728057861328125, -0.0014075040817260742, -0.0010869503021240234, -0.0007663965225219727, -0.0004458427429199219, -0.0001252889633178711, 0.0001952648162841797, 0.0005158185958862305, 0.0008363723754882812, 0.001156926155090332, 0.0014774799346923828, 0.0017980337142944336, 0.0021185874938964844, 0.002439141273498535, 0.002759695053100586, 0.0030802488327026367, 0.0034008026123046875, 0.0037213563919067383, 0.004041910171508789, 0.00436246395111084, 0.004683017730712891, 0.005003571510314941, 0.005324125289916992, 0.005644679069519043, 0.005965232849121094, 0.0062857866287231445, 0.006606340408325195, 0.006926894187927246, 0.007247447967529297, 0.007568001747131348, 0.007888555526733398, 0.00820910930633545, 0.0085296630859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 8.0, 10.0, 9.0, 12.0, 10.0, 13.0, 22.0, 27.0, 25.0, 24.0, 18.0, 25.0, 40.0, 51.0, 38.0, 52.0, 53.0, 54.0, 52.0, 36.0, 41.0, 49.0, 44.0, 31.0, 28.0, 38.0, 25.0, 25.0, 24.0, 25.0, 17.0, 18.0, 12.0, 8.0, 9.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01180267333984375, -0.011354565620422363, -0.010906457901000977, -0.01045835018157959, -0.010010242462158203, -0.009562134742736816, -0.00911402702331543, -0.008665919303894043, -0.008217811584472656, -0.0077697038650512695, -0.007321596145629883, -0.006873488426208496, -0.006425380706787109, -0.005977272987365723, -0.005529165267944336, -0.005081057548522949, -0.0046329498291015625, -0.004184842109680176, -0.003736734390258789, -0.0032886266708374023, -0.0028405189514160156, -0.002392411231994629, -0.0019443035125732422, -0.0014961957931518555, -0.0010480880737304688, -0.000599980354309082, -0.0001518726348876953, 0.0002962350845336914, 0.0007443428039550781, 0.0011924505233764648, 0.0016405582427978516, 0.0020886659622192383, 0.002536773681640625, 0.0029848814010620117, 0.0034329891204833984, 0.003881096839904785, 0.004329204559326172, 0.004777312278747559, 0.005225419998168945, 0.005673527717590332, 0.006121635437011719, 0.0065697431564331055, 0.007017850875854492, 0.007465958595275879, 0.007914066314697266, 0.008362174034118652, 0.008810281753540039, 0.009258389472961426, 0.009706497192382812, 0.0101546049118042, 0.010602712631225586, 0.011050820350646973, 0.01149892807006836, 0.011947035789489746, 0.012395143508911133, 0.01284325122833252, 0.013291358947753906, 0.013739466667175293, 0.01418757438659668, 0.014635682106018066, 0.015083789825439453, 0.01553189754486084, 0.015980005264282227, 0.016428112983703613, 0.016876220703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 11.0, 10.0, 8.0, 15.0, 28.0, 24.0, 43.0, 78.0, 118.0, 202.0, 378.0, 749.0, 1541.0, 3494.0, 8261.0, 21647.0, 67530.0, 279241.0, 470954.0, 134020.0, 37216.0, 13029.0, 5278.0, 2364.0, 1080.0, 537.0, 264.0, 160.0, 99.0, 44.0, 33.0, 27.0, 11.0, 16.0, 15.0, 7.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035610198974609375, -0.003439277410507202, -0.003317534923553467, -0.0031957924365997314, -0.003074049949645996, -0.0029523074626922607, -0.0028305649757385254, -0.00270882248878479, -0.0025870800018310547, -0.0024653375148773193, -0.002343595027923584, -0.0022218525409698486, -0.0021001100540161133, -0.001978367567062378, -0.0018566250801086426, -0.0017348825931549072, -0.0016131401062011719, -0.0014913976192474365, -0.0013696551322937012, -0.0012479126453399658, -0.0011261701583862305, -0.0010044276714324951, -0.0008826851844787598, -0.0007609426975250244, -0.0006392002105712891, -0.0005174577236175537, -0.00039571523666381836, -0.000273972749710083, -0.00015223026275634766, -3.0487775802612305e-05, 9.125471115112305e-05, 0.0002129971981048584, 0.00033473968505859375, 0.0004564821720123291, 0.0005782246589660645, 0.0006999671459197998, 0.0008217096328735352, 0.0009434521198272705, 0.0010651946067810059, 0.0011869370937347412, 0.0013086795806884766, 0.001430422067642212, 0.0015521645545959473, 0.0016739070415496826, 0.001795649528503418, 0.0019173920154571533, 0.0020391345024108887, 0.002160876989364624, 0.0022826194763183594, 0.0024043619632720947, 0.00252610445022583, 0.0026478469371795654, 0.0027695894241333008, 0.002891331911087036, 0.0030130743980407715, 0.003134816884994507, 0.003256559371948242, 0.0033783018589019775, 0.003500044345855713, 0.0036217868328094482, 0.0037435293197631836, 0.003865271806716919, 0.003987014293670654, 0.00410875678062439, 0.004230499267578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 11.0, 16.0, 15.0, 10.0, 21.0, 20.0, 16.0, 21.0, 23.0, 43.0, 51.0, 45.0, 66.0, 97.0, 96.0, 74.0, 69.0, 48.0, 26.0, 42.0, 28.0, 25.0, 17.0, 20.0, 11.0, 15.0, 6.0, 7.0, 9.0, 9.0, 3.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.744529724121094e-05, -4.574749618768692e-05, -4.40496951341629e-05, -4.2351894080638885e-05, -4.065409302711487e-05, -3.895629197359085e-05, -3.7258490920066833e-05, -3.5560689866542816e-05, -3.38628888130188e-05, -3.216508775949478e-05, -3.0467286705970764e-05, -2.8769485652446747e-05, -2.707168459892273e-05, -2.5373883545398712e-05, -2.3676082491874695e-05, -2.1978281438350677e-05, -2.028048038482666e-05, -1.8582679331302643e-05, -1.6884878277778625e-05, -1.5187077224254608e-05, -1.348927617073059e-05, -1.1791475117206573e-05, -1.0093674063682556e-05, -8.395873010158539e-06, -6.6980719566345215e-06, -5.000270903110504e-06, -3.302469849586487e-06, -1.6046687960624695e-06, 9.313225746154785e-08, 1.7909333109855652e-06, 3.4887343645095825e-06, 5.1865354180336e-06, 6.884336471557617e-06, 8.582137525081635e-06, 1.0279938578605652e-05, 1.197773963212967e-05, 1.3675540685653687e-05, 1.5373341739177704e-05, 1.707114279270172e-05, 1.876894384622574e-05, 2.0466744899749756e-05, 2.2164545953273773e-05, 2.386234700679779e-05, 2.5560148060321808e-05, 2.7257949113845825e-05, 2.8955750167369843e-05, 3.065355122089386e-05, 3.235135227441788e-05, 3.4049153327941895e-05, 3.574695438146591e-05, 3.744475543498993e-05, 3.9142556488513947e-05, 4.0840357542037964e-05, 4.253815859556198e-05, 4.4235959649086e-05, 4.5933760702610016e-05, 4.763156175613403e-05, 4.932936280965805e-05, 5.102716386318207e-05, 5.2724964916706085e-05, 5.44227659702301e-05, 5.612056702375412e-05, 5.781836807727814e-05, 5.9516169130802155e-05, 6.121397018432617e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 3.0, 7.0, 6.0, 3.0, 15.0, 11.0, 29.0, 45.0, 87.0, 101.0, 190.0, 394.0, 719.0, 1527.0, 3031.0, 6624.0, 15961.0, 42908.0, 144984.0, 469889.0, 254254.0, 67363.0, 22933.0, 9296.0, 4157.0, 1994.0, 886.0, 466.0, 280.0, 134.0, 97.0, 58.0, 29.0, 25.0, 13.0, 13.0, 12.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004207611083984375, -0.004086345434188843, -0.0039650797843933105, -0.0038438141345977783, -0.003722548484802246, -0.003601282835006714, -0.0034800171852111816, -0.0033587515354156494, -0.003237485885620117, -0.003116220235824585, -0.0029949545860290527, -0.0028736889362335205, -0.0027524232864379883, -0.002631157636642456, -0.002509891986846924, -0.0023886263370513916, -0.0022673606872558594, -0.002146095037460327, -0.002024829387664795, -0.0019035637378692627, -0.0017822980880737305, -0.0016610324382781982, -0.001539766788482666, -0.0014185011386871338, -0.0012972354888916016, -0.0011759698390960693, -0.0010547041893005371, -0.0009334385395050049, -0.0008121728897094727, -0.0006909072399139404, -0.0005696415901184082, -0.000448375940322876, -0.00032711029052734375, -0.00020584464073181152, -8.45789909362793e-05, 3.668665885925293e-05, 0.00015795230865478516, 0.0002792179584503174, 0.0004004836082458496, 0.0005217492580413818, 0.0006430149078369141, 0.0007642805576324463, 0.0008855462074279785, 0.0010068118572235107, 0.001128077507019043, 0.0012493431568145752, 0.0013706088066101074, 0.0014918744564056396, 0.0016131401062011719, 0.001734405755996704, 0.0018556714057922363, 0.0019769370555877686, 0.0020982027053833008, 0.002219468355178833, 0.0023407340049743652, 0.0024619996547698975, 0.0025832653045654297, 0.002704530954360962, 0.002825796604156494, 0.0029470622539520264, 0.0030683279037475586, 0.003189593553543091, 0.003310859203338623, 0.0034321248531341553, 0.0035533905029296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 6.0, 14.0, 22.0, 23.0, 23.0, 22.0, 38.0, 36.0, 56.0, 55.0, 79.0, 104.0, 73.0, 76.0, 67.0, 62.0, 43.0, 28.0, 25.0, 21.0, 12.0, 18.0, 14.0, 10.0, 8.0, 6.0, 5.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.0037441253662109375, -0.003643631935119629, -0.0035431385040283203, -0.0034426450729370117, -0.003342151641845703, -0.0032416582107543945, -0.003141164779663086, -0.0030406713485717773, -0.0029401779174804688, -0.00283968448638916, -0.0027391910552978516, -0.002638697624206543, -0.0025382041931152344, -0.0024377107620239258, -0.002337217330932617, -0.0022367238998413086, -0.00213623046875, -0.0020357370376586914, -0.0019352436065673828, -0.0018347501754760742, -0.0017342567443847656, -0.001633763313293457, -0.0015332698822021484, -0.0014327764511108398, -0.0013322830200195312, -0.0012317895889282227, -0.001131296157836914, -0.0010308027267456055, -0.0009303092956542969, -0.0008298158645629883, -0.0007293224334716797, -0.0006288290023803711, -0.0005283355712890625, -0.0004278421401977539, -0.0003273487091064453, -0.00022685527801513672, -0.00012636184692382812, -2.586841583251953e-05, 7.462501525878906e-05, 0.00017511844635009766, 0.00027561187744140625, 0.00037610530853271484, 0.00047659873962402344, 0.000577092170715332, 0.0006775856018066406, 0.0007780790328979492, 0.0008785724639892578, 0.0009790658950805664, 0.001079559326171875, 0.0011800527572631836, 0.0012805461883544922, 0.0013810396194458008, 0.0014815330505371094, 0.001582026481628418, 0.0016825199127197266, 0.0017830133438110352, 0.0018835067749023438, 0.0019840002059936523, 0.002084493637084961, 0.0021849870681762695, 0.002285480499267578, 0.0023859739303588867, 0.0024864673614501953, 0.002586960792541504, 0.0026874542236328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 25.0, 61.0, 113.0, 180.0, 214.0, 164.0, 96.0, 55.0, 31.0, 16.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06902939081192017, -0.06695427745580673, -0.0648791640996933, -0.06280405074357986, -0.06072893366217613, -0.0586538203060627, -0.056578706949949265, -0.05450359359383583, -0.0524284765124321, -0.050353363156318665, -0.04827824980020523, -0.0462031364440918, -0.044128019362688065, -0.04205290600657463, -0.0399777926504612, -0.03790267929434776, -0.03582756593823433, -0.033752452582120895, -0.03167733922600746, -0.02960222400724888, -0.027527108788490295, -0.02545199543237686, -0.023376882076263428, -0.021301768720149994, -0.01922665350139141, -0.017151540145277977, -0.015076424926519394, -0.01300131157040596, -0.010926197282969952, -0.008851082995533943, -0.006775969639420509, -0.004700855351984501, -0.0026257410645484924, -0.0005506270099431276, 0.0015244870446622372, 0.0035996008664369583, 0.005674715153872967, 0.007749829441308975, 0.009824942797422409, 0.011900057084858418, 0.013975171372294426, 0.01605028472840786, 0.018125399947166443, 0.020200513303279877, 0.02227562665939331, 0.024350741878151894, 0.026425855234265327, 0.02850097045302391, 0.030576083809137344, 0.03265119716525078, 0.03472631052136421, 0.036801427602767944, 0.03887654095888138, 0.04095165431499481, 0.043026767671108246, 0.04510188102722168, 0.047176994383335114, 0.04925210773944855, 0.05132722109556198, 0.053402334451675415, 0.05547745153307915, 0.05755256488919258, 0.059627678245306015, 0.06170279160141945, 0.06377790868282318]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 4.0, 7.0, 4.0, 3.0, 10.0, 11.0, 12.0, 14.0, 18.0, 14.0, 17.0, 16.0, 26.0, 29.0, 24.0, 27.0, 37.0, 37.0, 36.0, 29.0, 39.0, 32.0, 43.0, 40.0, 36.0, 29.0, 37.0, 28.0, 34.0, 29.0, 33.0, 31.0, 30.0, 21.0, 26.0, 26.0, 12.0, 12.0, 13.0, 11.0, 8.0, 7.0, 8.0, 7.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.030870914459228516, -0.02988198772072792, -0.028893062844872475, -0.02790413796901703, -0.026915211230516434, -0.02592628449201584, -0.024937359616160393, -0.023948434740304947, -0.022959508001804352, -0.021970581263303757, -0.02098165638744831, -0.019992731511592865, -0.01900380477309227, -0.018014878034591675, -0.01702595315873623, -0.016037028282880783, -0.015048101544380188, -0.014059175737202168, -0.013070249930024147, -0.012081324122846127, -0.011092398315668106, -0.010103472508490086, -0.009114546701312065, -0.008125620894134045, -0.007136695086956024, -0.006147769279778004, -0.005158843472599983, -0.004169917665421963, -0.0031809918582439423, -0.002192066051065922, -0.0012031402438879013, -0.00021421443670988083, 0.0007747113704681396, 0.0017636371776461601, 0.0027525629848241806, 0.003741488792002201, 0.0047304145991802216, 0.005719340406358242, 0.0067082662135362625, 0.007697192020714283, 0.008686117827892303, 0.009675043635070324, 0.010663969442248344, 0.011652895249426365, 0.012641821056604385, 0.013630746863782406, 0.014619672670960426, 0.015608598478138447, 0.016597524285316467, 0.017586451023817062, 0.018575375899672508, 0.019564300775527954, 0.02055322751402855, 0.021542154252529144, 0.02253107912838459, 0.023520004004240036, 0.02450893074274063, 0.025497857481241226, 0.026486782357096672, 0.027475707232952118, 0.028464633971452713, 0.029453560709953308, 0.030442485585808754, 0.0314314104616642, 0.032420337200164795]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 19.0, 23.0, 54.0, 121.0, 336.0, 780.0, 4251.0, 51193.0, 4116289.0, 18251.0, 2009.0, 523.0, 207.0, 115.0, 32.0, 25.0, 17.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052398681640625, -0.0506134033203125, -0.048828125, -0.0470428466796875, -0.045257568359375, -0.0434722900390625, -0.04168701171875, -0.0399017333984375, -0.038116455078125, -0.0363311767578125, -0.0345458984375, -0.0327606201171875, -0.030975341796875, -0.0291900634765625, -0.02740478515625, -0.0256195068359375, -0.023834228515625, -0.0220489501953125, -0.020263671875, -0.0184783935546875, -0.016693115234375, -0.0149078369140625, -0.01312255859375, -0.0113372802734375, -0.009552001953125, -0.0077667236328125, -0.0059814453125, -0.0041961669921875, -0.002410888671875, -0.0006256103515625, 0.00115966796875, 0.0029449462890625, 0.004730224609375, 0.0065155029296875, 0.00830078125, 0.0100860595703125, 0.011871337890625, 0.0136566162109375, 0.01544189453125, 0.0172271728515625, 0.019012451171875, 0.0207977294921875, 0.0225830078125, 0.0243682861328125, 0.026153564453125, 0.0279388427734375, 0.02972412109375, 0.0315093994140625, 0.033294677734375, 0.0350799560546875, 0.036865234375, 0.0386505126953125, 0.040435791015625, 0.0422210693359375, 0.04400634765625, 0.0457916259765625, 0.047576904296875, 0.0493621826171875, 0.0511474609375, 0.0529327392578125, 0.054718017578125, 0.0565032958984375, 0.05828857421875, 0.0600738525390625, 0.061859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 24.0, 75.0, 155.0, 198.0, 233.0, 176.0, 84.0, 39.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224456787109375, -0.021700620651245117, -0.020955562591552734, -0.02021050453186035, -0.01946544647216797, -0.018720388412475586, -0.017975330352783203, -0.01723027229309082, -0.016485214233398438, -0.015740156173706055, -0.014995098114013672, -0.014250040054321289, -0.013504981994628906, -0.012759923934936523, -0.01201486587524414, -0.011269807815551758, -0.010524749755859375, -0.009779691696166992, -0.00903463363647461, -0.008289575576782227, -0.007544517517089844, -0.006799459457397461, -0.006054401397705078, -0.005309343338012695, -0.0045642852783203125, -0.0038192272186279297, -0.003074169158935547, -0.002329111099243164, -0.0015840530395507812, -0.0008389949798583984, -9.393692016601562e-05, 0.0006511211395263672, 0.00139617919921875, 0.002141237258911133, 0.0028862953186035156, 0.0036313533782958984, 0.004376411437988281, 0.005121469497680664, 0.005866527557373047, 0.00661158561706543, 0.0073566436767578125, 0.008101701736450195, 0.008846759796142578, 0.009591817855834961, 0.010336875915527344, 0.011081933975219727, 0.01182699203491211, 0.012572050094604492, 0.013317108154296875, 0.014062166213989258, 0.01480722427368164, 0.015552282333374023, 0.016297340393066406, 0.01704239845275879, 0.017787456512451172, 0.018532514572143555, 0.019277572631835938, 0.02002263069152832, 0.020767688751220703, 0.021512746810913086, 0.02225780487060547, 0.02300286293029785, 0.023747920989990234, 0.024492979049682617, 0.025238037109375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 10.0, 17.0, 23.0, 42.0, 51.0, 92.0, 141.0, 227.0, 326.0, 510.0, 922.0, 1647.0, 3293.0, 7966.0, 25473.0, 130696.0, 3162229.0, 767582.0, 65780.0, 15811.0, 5537.0, 2516.0, 1350.0, 740.0, 445.0, 291.0, 182.0, 124.0, 87.0, 46.0, 28.0, 17.0, 20.0, 11.0, 8.0, 12.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119781494140625, -0.011576414108276367, -0.011174678802490234, -0.010772943496704102, -0.010371208190917969, -0.009969472885131836, -0.009567737579345703, -0.00916600227355957, -0.008764266967773438, -0.008362531661987305, -0.007960796356201172, -0.007559061050415039, -0.007157325744628906, -0.0067555904388427734, -0.006353855133056641, -0.005952119827270508, -0.005550384521484375, -0.005148649215698242, -0.004746913909912109, -0.0043451786041259766, -0.003943443298339844, -0.003541707992553711, -0.003139972686767578, -0.0027382373809814453, -0.0023365020751953125, -0.0019347667694091797, -0.0015330314636230469, -0.001131296157836914, -0.0007295608520507812, -0.00032782554626464844, 7.390975952148438e-05, 0.0004756450653076172, 0.00087738037109375, 0.0012791156768798828, 0.0016808509826660156, 0.0020825862884521484, 0.0024843215942382812, 0.002886056900024414, 0.003287792205810547, 0.0036895275115966797, 0.0040912628173828125, 0.004492998123168945, 0.004894733428955078, 0.005296468734741211, 0.005698204040527344, 0.0060999393463134766, 0.006501674652099609, 0.006903409957885742, 0.007305145263671875, 0.007706880569458008, 0.00810861587524414, 0.008510351181030273, 0.008912086486816406, 0.009313821792602539, 0.009715557098388672, 0.010117292404174805, 0.010519027709960938, 0.01092076301574707, 0.011322498321533203, 0.011724233627319336, 0.012125968933105469, 0.012527704238891602, 0.012929439544677734, 0.013331174850463867, 0.01373291015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 23.0, 30.0, 52.0, 94.0, 169.0, 510.0, 1635.0, 987.0, 255.0, 119.0, 74.0, 40.0, 14.0, 15.0, 11.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014495849609375, -0.013932943344116211, -0.013370037078857422, -0.012807130813598633, -0.012244224548339844, -0.011681318283081055, -0.011118412017822266, -0.010555505752563477, -0.009992599487304688, -0.009429693222045898, -0.00886678695678711, -0.00830388069152832, -0.007740974426269531, -0.007178068161010742, -0.006615161895751953, -0.006052255630493164, -0.005489349365234375, -0.004926443099975586, -0.004363536834716797, -0.003800630569458008, -0.0032377243041992188, -0.0026748180389404297, -0.0021119117736816406, -0.0015490055084228516, -0.0009860992431640625, -0.00042319297790527344, 0.00013971328735351562, 0.0007026195526123047, 0.0012655258178710938, 0.0018284320831298828, 0.002391338348388672, 0.002954244613647461, 0.00351715087890625, 0.004080057144165039, 0.004642963409423828, 0.005205869674682617, 0.005768775939941406, 0.006331682205200195, 0.006894588470458984, 0.0074574947357177734, 0.008020401000976562, 0.008583307266235352, 0.00914621353149414, 0.00970911979675293, 0.010272026062011719, 0.010834932327270508, 0.011397838592529297, 0.011960744857788086, 0.012523651123046875, 0.013086557388305664, 0.013649463653564453, 0.014212369918823242, 0.014775276184082031, 0.01533818244934082, 0.01590108871459961, 0.0164639949798584, 0.017026901245117188, 0.017589807510375977, 0.018152713775634766, 0.018715620040893555, 0.019278526306152344, 0.019841432571411133, 0.020404338836669922, 0.02096724510192871, 0.0215301513671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 17.0, 30.0, 76.0, 138.0, 241.0, 213.0, 134.0, 73.0, 40.0, 17.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05832286924123764, -0.055631037801504135, -0.05293920636177063, -0.050247374922037125, -0.04755554348230362, -0.044863712042570114, -0.04217188060283661, -0.039480045437812805, -0.0367882177233696, -0.03409638628363609, -0.03140455484390259, -0.028712723404169083, -0.026020891964435577, -0.023329060524702072, -0.020637227222323418, -0.017945395782589912, -0.015253562480211258, -0.012561731040477753, -0.009869899600744247, -0.007178067229688168, -0.004486235789954662, -0.001794404350221157, 0.0008974280208349228, 0.003589259460568428, 0.006281090900301933, 0.008972922340035439, 0.011664753779768944, 0.014356586150825024, 0.017048418521881104, 0.01974024996161461, 0.022432081401348114, 0.02512391284108162, 0.027815744280815125, 0.03050757572054863, 0.033199407160282135, 0.03589123860001564, 0.038583070039749146, 0.04127490147948265, 0.043966732919216156, 0.04665856808423996, 0.049350395798683167, 0.05204222723841667, 0.05473405867815018, 0.05742589011788368, 0.06011772155761719, 0.06280955672264099, 0.0655013844370842, 0.068193219602108, 0.07088504731655121, 0.07357688248157501, 0.07626871019601822, 0.07896054536104202, 0.08165237307548523, 0.08434420824050903, 0.08703603595495224, 0.08972787111997604, 0.09241970628499985, 0.09511154145002365, 0.09780336916446686, 0.10049520432949066, 0.10318703204393387, 0.10587886720895767, 0.10857069492340088, 0.11126253008842468, 0.11395435780286789]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 11.0, 8.0, 11.0, 9.0, 17.0, 17.0, 28.0, 22.0, 25.0, 26.0, 36.0, 39.0, 30.0, 49.0, 41.0, 43.0, 50.0, 54.0, 39.0, 63.0, 44.0, 59.0, 29.0, 32.0, 34.0, 25.0, 34.0, 17.0, 20.0, 23.0, 13.0, 16.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04069274663925171, -0.039581507444381714, -0.03847026452422142, -0.03735902160406113, -0.03624778240919113, -0.035136543214321136, -0.03402530029416084, -0.03291405737400055, -0.031802818179130554, -0.03069157712161541, -0.029580336064100266, -0.02846909500658512, -0.027357853949069977, -0.026246612891554832, -0.025135371834039688, -0.024024130776524544, -0.0229128897190094, -0.021801648661494255, -0.02069040760397911, -0.019579166546463966, -0.018467925488948822, -0.017356684431433678, -0.016245443373918533, -0.015134202316403389, -0.014022961258888245, -0.0129117202013731, -0.011800479143857956, -0.010689238086342812, -0.009577997028827667, -0.008466755971312523, -0.0073555149137973785, -0.006244273856282234, -0.00513303279876709, -0.0040217917412519455, -0.002910550683736801, -0.0017993096262216568, -0.0006880685687065125, 0.0004231724888086319, 0.0015344135463237762, 0.0026456546038389206, 0.003756895661354065, 0.004868136718869209, 0.005979377776384354, 0.007090618833899498, 0.008201859891414642, 0.009313100948929787, 0.010424342006444931, 0.011535583063960075, 0.01264682412147522, 0.013758065178990364, 0.014869306236505508, 0.015980547294020653, 0.017091788351535797, 0.01820302940905094, 0.019314270466566086, 0.02042551152408123, 0.021536752581596375, 0.02264799363911152, 0.023759234696626663, 0.024870475754141808, 0.025981716811656952, 0.027092957869172096, 0.02820419892668724, 0.029315439984202385, 0.03042668104171753]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 11.0, 15.0, 22.0, 21.0, 30.0, 35.0, 51.0, 90.0, 77.0, 140.0, 170.0, 243.0, 378.0, 611.0, 1162.0, 3244.0, 15635.0, 238326.0, 734470.0, 43670.0, 6099.0, 1755.0, 778.0, 452.0, 258.0, 200.0, 148.0, 93.0, 74.0, 70.0, 49.0, 41.0, 15.0, 21.0, 17.0, 11.0, 9.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0347900390625, -0.03374290466308594, -0.032695770263671875, -0.03164863586425781, -0.03060150146484375, -0.029554367065429688, -0.028507232666015625, -0.027460098266601562, -0.0264129638671875, -0.025365829467773438, -0.024318695068359375, -0.023271560668945312, -0.02222442626953125, -0.021177291870117188, -0.020130157470703125, -0.019083023071289062, -0.018035888671875, -0.016988754272460938, -0.015941619873046875, -0.014894485473632812, -0.01384735107421875, -0.012800216674804688, -0.011753082275390625, -0.010705947875976562, -0.0096588134765625, -0.008611679077148438, -0.007564544677734375, -0.0065174102783203125, -0.00547027587890625, -0.0044231414794921875, -0.003376007080078125, -0.0023288726806640625, -0.00128173828125, -0.0002346038818359375, 0.000812530517578125, 0.0018596649169921875, 0.00290679931640625, 0.0039539337158203125, 0.005001068115234375, 0.0060482025146484375, 0.0070953369140625, 0.008142471313476562, 0.009189605712890625, 0.010236740112304688, 0.01128387451171875, 0.012331008911132812, 0.013378143310546875, 0.014425277709960938, 0.015472412109375, 0.016519546508789062, 0.017566680908203125, 0.018613815307617188, 0.01966094970703125, 0.020708084106445312, 0.021755218505859375, 0.022802352905273438, 0.0238494873046875, 0.024896621704101562, 0.025943756103515625, 0.026990890502929688, 0.02803802490234375, 0.029085159301757812, 0.030132293701171875, 0.031179428100585938, 0.0322265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 35.0, 68.0, 146.0, 188.0, 202.0, 169.0, 111.0, 44.0, 24.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.020316600799560547, -0.019621849060058594, -0.01892709732055664, -0.018232345581054688, -0.017537593841552734, -0.01684284210205078, -0.016148090362548828, -0.015453338623046875, -0.014758586883544922, -0.014063835144042969, -0.013369083404541016, -0.012674331665039062, -0.01197957992553711, -0.011284828186035156, -0.010590076446533203, -0.00989532470703125, -0.009200572967529297, -0.008505821228027344, -0.007811069488525391, -0.0071163177490234375, -0.006421566009521484, -0.005726814270019531, -0.005032062530517578, -0.004337310791015625, -0.003642559051513672, -0.0029478073120117188, -0.0022530555725097656, -0.0015583038330078125, -0.0008635520935058594, -0.00016880035400390625, 0.0005259513854980469, 0.001220703125, 0.0019154548645019531, 0.0026102066040039062, 0.0033049583435058594, 0.0039997100830078125, 0.004694461822509766, 0.005389213562011719, 0.006083965301513672, 0.006778717041015625, 0.007473468780517578, 0.008168220520019531, 0.008862972259521484, 0.009557723999023438, 0.01025247573852539, 0.010947227478027344, 0.011641979217529297, 0.01233673095703125, 0.013031482696533203, 0.013726234436035156, 0.01442098617553711, 0.015115737915039062, 0.015810489654541016, 0.01650524139404297, 0.017199993133544922, 0.017894744873046875, 0.018589496612548828, 0.01928424835205078, 0.019979000091552734, 0.020673751831054688, 0.02136850357055664, 0.022063255310058594, 0.022758007049560547, 0.0234527587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 13.0, 14.0, 17.0, 34.0, 36.0, 60.0, 81.0, 148.0, 260.0, 406.0, 820.0, 1622.0, 3749.0, 10417.0, 33717.0, 135550.0, 495573.0, 274823.0, 62592.0, 17707.0, 6021.0, 2423.0, 1073.0, 561.0, 281.0, 157.0, 125.0, 68.0, 49.0, 43.0, 20.0, 18.0, 13.0, 15.0, 6.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.016937255859375, -0.01643514633178711, -0.01593303680419922, -0.015430927276611328, -0.014928817749023438, -0.014426708221435547, -0.013924598693847656, -0.013422489166259766, -0.012920379638671875, -0.012418270111083984, -0.011916160583496094, -0.011414051055908203, -0.010911941528320312, -0.010409832000732422, -0.009907722473144531, -0.00940561294555664, -0.00890350341796875, -0.00840139389038086, -0.007899284362792969, -0.007397174835205078, -0.0068950653076171875, -0.006392955780029297, -0.005890846252441406, -0.005388736724853516, -0.004886627197265625, -0.004384517669677734, -0.0038824081420898438, -0.003380298614501953, -0.0028781890869140625, -0.002376079559326172, -0.0018739700317382812, -0.0013718605041503906, -0.0008697509765625, -0.0003676414489746094, 0.00013446807861328125, 0.0006365776062011719, 0.0011386871337890625, 0.0016407966613769531, 0.0021429061889648438, 0.0026450157165527344, 0.003147125244140625, 0.0036492347717285156, 0.004151344299316406, 0.004653453826904297, 0.0051555633544921875, 0.005657672882080078, 0.006159782409667969, 0.006661891937255859, 0.00716400146484375, 0.007666110992431641, 0.008168220520019531, 0.008670330047607422, 0.009172439575195312, 0.009674549102783203, 0.010176658630371094, 0.010678768157958984, 0.011180877685546875, 0.011682987213134766, 0.012185096740722656, 0.012687206268310547, 0.013189315795898438, 0.013691425323486328, 0.014193534851074219, 0.01469564437866211, 0.01519775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 6.0, 4.0, 6.0, 3.0, 12.0, 9.0, 17.0, 14.0, 14.0, 20.0, 25.0, 26.0, 30.0, 45.0, 47.0, 44.0, 27.0, 49.0, 43.0, 52.0, 30.0, 51.0, 37.0, 25.0, 49.0, 41.0, 26.0, 36.0, 30.0, 37.0, 24.0, 16.0, 19.0, 16.0, 18.0, 8.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.014789342880249023, -0.014304637908935547, -0.01381993293762207, -0.013335227966308594, -0.012850522994995117, -0.01236581802368164, -0.011881113052368164, -0.011396408081054688, -0.010911703109741211, -0.010426998138427734, -0.009942293167114258, -0.009457588195800781, -0.008972883224487305, -0.008488178253173828, -0.008003473281860352, -0.007518768310546875, -0.0070340633392333984, -0.006549358367919922, -0.006064653396606445, -0.005579948425292969, -0.005095243453979492, -0.004610538482666016, -0.004125833511352539, -0.0036411285400390625, -0.003156423568725586, -0.0026717185974121094, -0.002187013626098633, -0.0017023086547851562, -0.0012176036834716797, -0.0007328987121582031, -0.00024819374084472656, 0.00023651123046875, 0.0007212162017822266, 0.0012059211730957031, 0.0016906261444091797, 0.0021753311157226562, 0.002660036087036133, 0.0031447410583496094, 0.003629446029663086, 0.0041141510009765625, 0.004598855972290039, 0.005083560943603516, 0.005568265914916992, 0.006052970886230469, 0.006537675857543945, 0.007022380828857422, 0.0075070858001708984, 0.007991790771484375, 0.008476495742797852, 0.008961200714111328, 0.009445905685424805, 0.009930610656738281, 0.010415315628051758, 0.010900020599365234, 0.011384725570678711, 0.011869430541992188, 0.012354135513305664, 0.01283884048461914, 0.013323545455932617, 0.013808250427246094, 0.01429295539855957, 0.014777660369873047, 0.015262365341186523, 0.0157470703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 11.0, 5.0, 16.0, 12.0, 24.0, 46.0, 57.0, 85.0, 154.0, 232.0, 383.0, 785.0, 1462.0, 3226.0, 7610.0, 21042.0, 66557.0, 239735.0, 460548.0, 170848.0, 48274.0, 16042.0, 5964.0, 2676.0, 1232.0, 593.0, 353.0, 202.0, 111.0, 72.0, 63.0, 35.0, 27.0, 8.0, 18.0, 12.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004596710205078125, -0.004440188407897949, -0.0042836666107177734, -0.004127144813537598, -0.003970623016357422, -0.003814101219177246, -0.0036575794219970703, -0.0035010576248168945, -0.0033445358276367188, -0.003188014030456543, -0.003031492233276367, -0.0028749704360961914, -0.0027184486389160156, -0.00256192684173584, -0.002405405044555664, -0.0022488832473754883, -0.0020923614501953125, -0.0019358396530151367, -0.001779317855834961, -0.0016227960586547852, -0.0014662742614746094, -0.0013097524642944336, -0.0011532306671142578, -0.000996708869934082, -0.0008401870727539062, -0.0006836652755737305, -0.0005271434783935547, -0.0003706216812133789, -0.00021409988403320312, -5.7578086853027344e-05, 9.894371032714844e-05, 0.0002554655075073242, 0.0004119873046875, 0.0005685091018676758, 0.0007250308990478516, 0.0008815526962280273, 0.0010380744934082031, 0.001194596290588379, 0.0013511180877685547, 0.0015076398849487305, 0.0016641616821289062, 0.001820683479309082, 0.001977205276489258, 0.0021337270736694336, 0.0022902488708496094, 0.002446770668029785, 0.002603292465209961, 0.0027598142623901367, 0.0029163360595703125, 0.0030728578567504883, 0.003229379653930664, 0.00338590145111084, 0.0035424232482910156, 0.0036989450454711914, 0.003855466842651367, 0.004011988639831543, 0.004168510437011719, 0.0043250322341918945, 0.00448155403137207, 0.004638075828552246, 0.004794597625732422, 0.004951119422912598, 0.0051076412200927734, 0.005264163017272949, 0.005420684814453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 4.0, 5.0, 7.0, 8.0, 8.0, 9.0, 13.0, 17.0, 20.0, 25.0, 42.0, 34.0, 46.0, 67.0, 78.0, 82.0, 84.0, 73.0, 57.0, 64.0, 57.0, 49.0, 30.0, 24.0, 10.0, 14.0, 15.0, 6.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.9787573516368866e-05, -4.813633859157562e-05, -4.648510366678238e-05, -4.4833868741989136e-05, -4.318263381719589e-05, -4.153139889240265e-05, -3.9880163967609406e-05, -3.822892904281616e-05, -3.657769411802292e-05, -3.4926459193229675e-05, -3.327522426843643e-05, -3.162398934364319e-05, -2.9972754418849945e-05, -2.83215194940567e-05, -2.6670284569263458e-05, -2.5019049644470215e-05, -2.336781471967697e-05, -2.1716579794883728e-05, -2.0065344870090485e-05, -1.841410994529724e-05, -1.6762875020503998e-05, -1.5111640095710754e-05, -1.3460405170917511e-05, -1.1809170246124268e-05, -1.0157935321331024e-05, -8.50670039653778e-06, -6.855465471744537e-06, -5.204230546951294e-06, -3.5529956221580505e-06, -1.9017606973648071e-06, -2.505257725715637e-07, 1.4007091522216797e-06, 3.051944077014923e-06, 4.7031790018081665e-06, 6.35441392660141e-06, 8.005648851394653e-06, 9.656883776187897e-06, 1.130811870098114e-05, 1.2959353625774384e-05, 1.4610588550567627e-05, 1.626182347536087e-05, 1.7913058400154114e-05, 1.9564293324947357e-05, 2.12155282497406e-05, 2.2866763174533844e-05, 2.4517998099327087e-05, 2.616923302412033e-05, 2.7820467948913574e-05, 2.9471702873706818e-05, 3.112293779850006e-05, 3.2774172723293304e-05, 3.442540764808655e-05, 3.607664257287979e-05, 3.7727877497673035e-05, 3.937911242246628e-05, 4.103034734725952e-05, 4.2681582272052765e-05, 4.433281719684601e-05, 4.598405212163925e-05, 4.7635287046432495e-05, 4.928652197122574e-05, 5.093775689601898e-05, 5.2588991820812225e-05, 5.424022674560547e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 17.0, 24.0, 37.0, 63.0, 77.0, 110.0, 201.0, 308.0, 647.0, 1334.0, 3020.0, 8552.0, 30185.0, 129849.0, 527542.0, 266769.0, 56517.0, 14753.0, 4769.0, 1830.0, 833.0, 423.0, 226.0, 149.0, 87.0, 64.0, 46.0, 19.0, 22.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00655364990234375, -0.006347060203552246, -0.006140470504760742, -0.005933880805969238, -0.005727291107177734, -0.0055207014083862305, -0.0053141117095947266, -0.005107522010803223, -0.004900932312011719, -0.004694342613220215, -0.004487752914428711, -0.004281163215637207, -0.004074573516845703, -0.0038679838180541992, -0.0036613941192626953, -0.0034548044204711914, -0.0032482147216796875, -0.0030416250228881836, -0.0028350353240966797, -0.0026284456253051758, -0.002421855926513672, -0.002215266227722168, -0.002008676528930664, -0.0018020868301391602, -0.0015954971313476562, -0.0013889074325561523, -0.0011823177337646484, -0.0009757280349731445, -0.0007691383361816406, -0.0005625486373901367, -0.0003559589385986328, -0.0001493692398071289, 5.7220458984375e-05, 0.0002638101577758789, 0.0004703998565673828, 0.0006769895553588867, 0.0008835792541503906, 0.0010901689529418945, 0.0012967586517333984, 0.0015033483505249023, 0.0017099380493164062, 0.0019165277481079102, 0.002123117446899414, 0.002329707145690918, 0.002536296844482422, 0.0027428865432739258, 0.0029494762420654297, 0.0031560659408569336, 0.0033626556396484375, 0.0035692453384399414, 0.0037758350372314453, 0.003982424736022949, 0.004189014434814453, 0.004395604133605957, 0.004602193832397461, 0.004808783531188965, 0.005015373229980469, 0.005221962928771973, 0.0054285526275634766, 0.0056351423263549805, 0.005841732025146484, 0.006048321723937988, 0.006254911422729492, 0.006461501121520996, 0.0066680908203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 10.0, 6.0, 9.0, 13.0, 10.0, 14.0, 9.0, 14.0, 27.0, 33.0, 40.0, 62.0, 63.0, 78.0, 103.0, 91.0, 76.0, 77.0, 61.0, 38.0, 44.0, 18.0, 17.0, 10.0, 9.0, 10.0, 10.0, 4.0, 11.0, 7.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004029631614685059, -0.003878355026245117, -0.0037270784378051758, -0.0035758018493652344, -0.003424525260925293, -0.0032732486724853516, -0.00312197208404541, -0.0029706954956054688, -0.0028194189071655273, -0.002668142318725586, -0.0025168657302856445, -0.002365589141845703, -0.0022143125534057617, -0.0020630359649658203, -0.001911759376525879, -0.0017604827880859375, -0.001609206199645996, -0.0014579296112060547, -0.0013066530227661133, -0.0011553764343261719, -0.0010040998458862305, -0.0008528232574462891, -0.0007015466690063477, -0.0005502700805664062, -0.00039899349212646484, -0.00024771690368652344, -9.644031524658203e-05, 5.4836273193359375e-05, 0.00020611286163330078, 0.0003573894500732422, 0.0005086660385131836, 0.000659942626953125, 0.0008112192153930664, 0.0009624958038330078, 0.0011137723922729492, 0.0012650489807128906, 0.001416325569152832, 0.0015676021575927734, 0.0017188787460327148, 0.0018701553344726562, 0.0020214319229125977, 0.002172708511352539, 0.0023239850997924805, 0.002475261688232422, 0.0026265382766723633, 0.0027778148651123047, 0.002929091453552246, 0.0030803680419921875, 0.003231644630432129, 0.0033829212188720703, 0.0035341978073120117, 0.003685474395751953, 0.0038367509841918945, 0.003988027572631836, 0.004139304161071777, 0.004290580749511719, 0.00444185733795166, 0.0045931339263916016, 0.004744410514831543, 0.004895687103271484, 0.005046963691711426, 0.005198240280151367, 0.005349516868591309, 0.00550079345703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 37.0, 66.0, 165.0, 254.0, 258.0, 122.0, 57.0, 16.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11946487426757812, -0.11543509364128113, -0.11140531301498413, -0.10737553238868713, -0.10334575176239014, -0.09931597113609314, -0.09528619050979614, -0.09125640988349915, -0.08722662925720215, -0.08319684863090515, -0.07916706800460815, -0.07513728737831116, -0.07110750675201416, -0.06707772612571716, -0.06304794549942017, -0.05901816114783287, -0.054988376796245575, -0.05095859616994858, -0.04692881554365158, -0.042899034917354584, -0.03886925429105759, -0.03483947366476059, -0.030809689313173294, -0.026779908686876297, -0.0227501280605793, -0.018720347434282303, -0.014690565876662731, -0.01066078431904316, -0.006631003692746162, -0.0026012230664491653, 0.001428559422492981, 0.005458340048789978, 0.009488120675086975, 0.013517901301383972, 0.01754768192768097, 0.021577464416623116, 0.025607245042920113, 0.02963702566921711, 0.033666808158159256, 0.03769658878445625, 0.04172636941075325, 0.04575615003705025, 0.049785930663347244, 0.05381571501493454, 0.05784549564123154, 0.061875276267528534, 0.06590505689382553, 0.06993483752012253, 0.07396461814641953, 0.07799439877271652, 0.08202417939901352, 0.08605396002531052, 0.09008374065160751, 0.09411352127790451, 0.0981433093547821, 0.1021730899810791, 0.1062028706073761, 0.1102326512336731, 0.11426243185997009, 0.11829221248626709, 0.12232199311256409, 0.12635177373886108, 0.13038155436515808, 0.13441133499145508, 0.13844111561775208]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 6.0, 10.0, 12.0, 7.0, 5.0, 9.0, 21.0, 20.0, 16.0, 31.0, 29.0, 24.0, 34.0, 32.0, 30.0, 24.0, 45.0, 49.0, 42.0, 40.0, 36.0, 30.0, 47.0, 39.0, 33.0, 32.0, 39.0, 35.0, 34.0, 24.0, 19.0, 20.0, 19.0, 18.0, 22.0, 13.0, 13.0, 9.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04824399948120117, -0.04679631069302559, -0.045348621904850006, -0.04390093684196472, -0.04245324805378914, -0.041005559265613556, -0.03955787420272827, -0.03811018541455269, -0.036662496626377106, -0.03521480783820152, -0.03376711905002594, -0.032319433987140656, -0.030871745198965073, -0.02942405641078949, -0.027976369485259056, -0.026528682559728622, -0.02508099377155304, -0.023633304983377457, -0.022185618057847023, -0.02073793113231659, -0.019290242344141006, -0.017842553555965424, -0.01639486663043499, -0.014947178773581982, -0.013499490916728973, -0.012051803059875965, -0.010604115203022957, -0.009156427346169949, -0.00770873948931694, -0.006261051632463932, -0.004813363775610924, -0.0033656759187579155, -0.0019179880619049072, -0.00047030020505189896, 0.0009773876518011093, 0.0024250755086541176, 0.003872763365507126, 0.005320451222360134, 0.006768139079213142, 0.00821582693606615, 0.009663514792919159, 0.011111202649772167, 0.012558890506625175, 0.014006578363478184, 0.015454266220331192, 0.016901955008506775, 0.01834964193403721, 0.019797328859567642, 0.021245017647743225, 0.022692706435918808, 0.02414039336144924, 0.025588080286979675, 0.027035769075155258, 0.02848345786333084, 0.029931144788861275, 0.03137883171439171, 0.03282652050256729, 0.034274209290742874, 0.03572189807891846, 0.03716958314180374, 0.038617271929979324, 0.04006496071815491, 0.04151264578104019, 0.042960334569215775, 0.04440802335739136]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 13.0, 15.0, 23.0, 64.0, 109.0, 246.0, 649.0, 2918.0, 16871.0, 4038820.0, 127585.0, 5306.0, 981.0, 330.0, 178.0, 84.0, 39.0, 32.0, 9.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.044742584228515625, -0.04312896728515625, -0.041515350341796875, -0.0399017333984375, -0.038288116455078125, -0.03667449951171875, -0.035060882568359375, -0.033447265625, -0.031833648681640625, -0.03022003173828125, -0.028606414794921875, -0.0269927978515625, -0.025379180908203125, -0.02376556396484375, -0.022151947021484375, -0.020538330078125, -0.018924713134765625, -0.01731109619140625, -0.015697479248046875, -0.0140838623046875, -0.012470245361328125, -0.01085662841796875, -0.009243011474609375, -0.00762939453125, -0.006015777587890625, -0.00440216064453125, -0.002788543701171875, -0.0011749267578125, 0.000438690185546875, 0.00205230712890625, 0.003665924072265625, 0.005279541015625, 0.006893157958984375, 0.00850677490234375, 0.010120391845703125, 0.0117340087890625, 0.013347625732421875, 0.01496124267578125, 0.016574859619140625, 0.0181884765625, 0.019802093505859375, 0.02141571044921875, 0.023029327392578125, 0.0246429443359375, 0.026256561279296875, 0.02787017822265625, 0.029483795166015625, 0.031097412109375, 0.032711029052734375, 0.03432464599609375, 0.035938262939453125, 0.0375518798828125, 0.039165496826171875, 0.04077911376953125, 0.042392730712890625, 0.04400634765625, 0.045619964599609375, 0.04723358154296875, 0.048847198486328125, 0.0504608154296875, 0.052074432373046875, 0.05368804931640625, 0.055301666259765625, 0.056915283203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 25.0, 90.0, 143.0, 157.0, 211.0, 163.0, 116.0, 63.0, 19.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211029052734375, -0.02040576934814453, -0.019708633422851562, -0.019011497497558594, -0.018314361572265625, -0.017617225646972656, -0.016920089721679688, -0.01622295379638672, -0.01552581787109375, -0.014828681945800781, -0.014131546020507812, -0.013434410095214844, -0.012737274169921875, -0.012040138244628906, -0.011343002319335938, -0.010645866394042969, -0.00994873046875, -0.009251594543457031, -0.008554458618164062, -0.007857322692871094, -0.007160186767578125, -0.006463050842285156, -0.0057659149169921875, -0.005068778991699219, -0.00437164306640625, -0.0036745071411132812, -0.0029773712158203125, -0.0022802352905273438, -0.001583099365234375, -0.0008859634399414062, -0.0001888275146484375, 0.0005083084106445312, 0.0012054443359375, 0.0019025802612304688, 0.0025997161865234375, 0.0032968521118164062, 0.003993988037109375, 0.004691123962402344, 0.0053882598876953125, 0.006085395812988281, 0.00678253173828125, 0.007479667663574219, 0.008176803588867188, 0.008873939514160156, 0.009571075439453125, 0.010268211364746094, 0.010965347290039062, 0.011662483215332031, 0.012359619140625, 0.013056755065917969, 0.013753890991210938, 0.014451026916503906, 0.015148162841796875, 0.015845298767089844, 0.016542434692382812, 0.01723957061767578, 0.01793670654296875, 0.01863384246826172, 0.019330978393554688, 0.020028114318847656, 0.020725250244140625, 0.021422386169433594, 0.022119522094726562, 0.02281665802001953, 0.0235137939453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 10.0, 7.0, 10.0, 15.0, 31.0, 48.0, 66.0, 90.0, 173.0, 279.0, 424.0, 735.0, 1225.0, 2469.0, 5838.0, 17978.0, 78009.0, 792114.0, 3081826.0, 165065.0, 31274.0, 9086.0, 3476.0, 1706.0, 894.0, 516.0, 336.0, 211.0, 120.0, 74.0, 48.0, 24.0, 33.0, 15.0, 10.0, 6.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01238250732421875, -0.011943459510803223, -0.011504411697387695, -0.011065363883972168, -0.01062631607055664, -0.010187268257141113, -0.009748220443725586, -0.009309172630310059, -0.008870124816894531, -0.008431077003479004, -0.007992029190063477, -0.007552981376647949, -0.007113933563232422, -0.0066748857498168945, -0.006235837936401367, -0.00579679012298584, -0.0053577423095703125, -0.004918694496154785, -0.004479646682739258, -0.0040405988693237305, -0.003601551055908203, -0.0031625032424926758, -0.0027234554290771484, -0.002284407615661621, -0.0018453598022460938, -0.0014063119888305664, -0.0009672641754150391, -0.0005282163619995117, -8.916854858398438e-05, 0.00034987926483154297, 0.0007889270782470703, 0.0012279748916625977, 0.001667022705078125, 0.0021060705184936523, 0.0025451183319091797, 0.002984166145324707, 0.0034232139587402344, 0.0038622617721557617, 0.004301309585571289, 0.004740357398986816, 0.005179405212402344, 0.005618453025817871, 0.0060575008392333984, 0.006496548652648926, 0.006935596466064453, 0.0073746442794799805, 0.007813692092895508, 0.008252739906311035, 0.008691787719726562, 0.00913083553314209, 0.009569883346557617, 0.010008931159973145, 0.010447978973388672, 0.0108870267868042, 0.011326074600219727, 0.011765122413635254, 0.012204170227050781, 0.012643218040466309, 0.013082265853881836, 0.013521313667297363, 0.01396036148071289, 0.014399409294128418, 0.014838457107543945, 0.015277504920959473, 0.015716552734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 8.0, 15.0, 32.0, 51.0, 95.0, 176.0, 364.0, 1173.0, 1297.0, 425.0, 172.0, 90.0, 71.0, 30.0, 28.0, 14.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0161285400390625, -0.015510320663452148, -0.014892101287841797, -0.014273881912231445, -0.013655662536621094, -0.013037443161010742, -0.01241922378540039, -0.011801004409790039, -0.011182785034179688, -0.010564565658569336, -0.009946346282958984, -0.009328126907348633, -0.008709907531738281, -0.00809168815612793, -0.007473468780517578, -0.0068552494049072266, -0.006237030029296875, -0.0056188106536865234, -0.005000591278076172, -0.00438237190246582, -0.0037641525268554688, -0.003145933151245117, -0.0025277137756347656, -0.001909494400024414, -0.0012912750244140625, -0.0006730556488037109, -5.4836273193359375e-05, 0.0005633831024169922, 0.0011816024780273438, 0.0017998218536376953, 0.002418041229248047, 0.0030362606048583984, 0.00365447998046875, 0.0042726993560791016, 0.004890918731689453, 0.005509138107299805, 0.006127357482910156, 0.006745576858520508, 0.007363796234130859, 0.007982015609741211, 0.008600234985351562, 0.009218454360961914, 0.009836673736572266, 0.010454893112182617, 0.011073112487792969, 0.01169133186340332, 0.012309551239013672, 0.012927770614624023, 0.013545989990234375, 0.014164209365844727, 0.014782428741455078, 0.01540064811706543, 0.01601886749267578, 0.016637086868286133, 0.017255306243896484, 0.017873525619506836, 0.018491744995117188, 0.01910996437072754, 0.01972818374633789, 0.020346403121948242, 0.020964622497558594, 0.021582841873168945, 0.022201061248779297, 0.02281928062438965, 0.0234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 13.0, 39.0, 78.0, 134.0, 195.0, 211.0, 158.0, 92.0, 41.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13335302472114563, -0.13037721812725067, -0.1274014115333557, -0.12442560493946075, -0.1214497983455658, -0.11847399175167084, -0.11549818515777588, -0.11252237111330032, -0.10954656451940536, -0.1065707579255104, -0.10359495133161545, -0.10061914473772049, -0.09764333814382553, -0.09466752409934998, -0.09169171750545502, -0.08871591091156006, -0.0857401043176651, -0.08276429772377014, -0.07978849112987518, -0.07681268453598022, -0.07383687794208527, -0.07086107134819031, -0.06788526475429535, -0.0649094507098198, -0.06193365156650543, -0.058957844972610474, -0.055982038378715515, -0.05300623178482056, -0.0500304214656353, -0.04705461487174034, -0.04407880827784538, -0.041102997958660126, -0.03812718763947487, -0.03515138104557991, -0.03217557445168495, -0.029199765995144844, -0.026223957538604736, -0.023248150944709778, -0.02027234435081482, -0.01729653589427471, -0.014320729300379753, -0.01134492177516222, -0.008369114249944687, -0.005393307656049728, -0.0024175001308321953, 0.0005583073943853378, 0.0035341139882802963, 0.006509922444820404, 0.009485729038715363, 0.012461536563932896, 0.015437344089150429, 0.018413150683045387, 0.021388959139585495, 0.024364765733480453, 0.027340572327375412, 0.03031638078391552, 0.03329218924045563, 0.036267995834350586, 0.039243802428245544, 0.0422196090221405, 0.04519541934132576, 0.04817122593522072, 0.05114703252911568, 0.054122842848300934, 0.057098645716905594]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 6.0, 6.0, 10.0, 18.0, 20.0, 25.0, 33.0, 36.0, 38.0, 38.0, 22.0, 38.0, 51.0, 41.0, 54.0, 53.0, 52.0, 45.0, 42.0, 53.0, 46.0, 58.0, 31.0, 29.0, 29.0, 29.0, 24.0, 14.0, 10.0, 10.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.046895623207092285, -0.04558660089969635, -0.04427757486701012, -0.04296854883432388, -0.04165952652692795, -0.04035050421953201, -0.03904147818684578, -0.037732452154159546, -0.03642342984676361, -0.035114407539367676, -0.03380538150668144, -0.03249635547399521, -0.031187333166599274, -0.02987830899655819, -0.028569284826517105, -0.02726026065647602, -0.025951236486434937, -0.024642212316393852, -0.023333188146352768, -0.022024163976311684, -0.0207151398062706, -0.019406115636229515, -0.01809709146618843, -0.016788067296147346, -0.015479043126106262, -0.014170018956065178, -0.012860994786024094, -0.01155197061598301, -0.010242946445941925, -0.00893392227590084, -0.0076248981058597565, -0.006315873935818672, -0.005006849765777588, -0.0036978255957365036, -0.0023888014256954193, -0.001079777255654335, 0.00022924691438674927, 0.0015382710844278336, 0.002847295254468918, 0.004156319424510002, 0.005465343594551086, 0.006774367764592171, 0.008083391934633255, 0.00939241610467434, 0.010701440274715424, 0.012010464444756508, 0.013319488614797592, 0.014628512784838676, 0.01593753695487976, 0.017246561124920845, 0.01855558529496193, 0.019864609465003014, 0.021173633635044098, 0.022482657805085182, 0.023791681975126266, 0.02510070614516735, 0.026409730315208435, 0.02771875448524952, 0.029027778655290604, 0.030336802825331688, 0.03164582699537277, 0.03295484930276871, 0.03426387533545494, 0.035572901368141174, 0.03688192367553711]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 8.0, 13.0, 22.0, 23.0, 37.0, 35.0, 63.0, 72.0, 110.0, 171.0, 246.0, 366.0, 560.0, 1213.0, 3118.0, 16789.0, 290099.0, 690403.0, 36581.0, 4984.0, 1513.0, 713.0, 442.0, 277.0, 199.0, 135.0, 90.0, 59.0, 55.0, 28.0, 28.0, 20.0, 16.0, 13.0, 8.0, 7.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.04009532928466797, -0.03880882263183594, -0.037522315979003906, -0.036235809326171875, -0.034949302673339844, -0.03366279602050781, -0.03237628936767578, -0.03108978271484375, -0.02980327606201172, -0.028516769409179688, -0.027230262756347656, -0.025943756103515625, -0.024657249450683594, -0.023370742797851562, -0.02208423614501953, -0.0207977294921875, -0.01951122283935547, -0.018224716186523438, -0.016938209533691406, -0.015651702880859375, -0.014365196228027344, -0.013078689575195312, -0.011792182922363281, -0.01050567626953125, -0.009219169616699219, -0.007932662963867188, -0.006646156311035156, -0.005359649658203125, -0.004073143005371094, -0.0027866363525390625, -0.0015001296997070312, -0.000213623046875, 0.0010728836059570312, 0.0023593902587890625, 0.0036458969116210938, 0.004932403564453125, 0.006218910217285156, 0.0075054168701171875, 0.008791923522949219, 0.01007843017578125, 0.011364936828613281, 0.012651443481445312, 0.013937950134277344, 0.015224456787109375, 0.016510963439941406, 0.017797470092773438, 0.01908397674560547, 0.0203704833984375, 0.02165699005126953, 0.022943496704101562, 0.024230003356933594, 0.025516510009765625, 0.026803016662597656, 0.028089523315429688, 0.02937602996826172, 0.03066253662109375, 0.03194904327392578, 0.03323554992675781, 0.034522056579589844, 0.035808563232421875, 0.037095069885253906, 0.03838157653808594, 0.03966808319091797, 0.04095458984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 44.0, 89.0, 149.0, 168.0, 207.0, 149.0, 111.0, 55.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226287841796875, -0.02190113067626953, -0.021173477172851562, -0.020445823669433594, -0.019718170166015625, -0.018990516662597656, -0.018262863159179688, -0.01753520965576172, -0.01680755615234375, -0.01607990264892578, -0.015352249145507812, -0.014624595642089844, -0.013896942138671875, -0.013169288635253906, -0.012441635131835938, -0.011713981628417969, -0.010986328125, -0.010258674621582031, -0.009531021118164062, -0.008803367614746094, -0.008075714111328125, -0.007348060607910156, -0.0066204071044921875, -0.005892753601074219, -0.00516510009765625, -0.004437446594238281, -0.0037097930908203125, -0.0029821395874023438, -0.002254486083984375, -0.0015268325805664062, -0.0007991790771484375, -7.152557373046875e-05, 0.0006561279296875, 0.0013837814331054688, 0.0021114349365234375, 0.0028390884399414062, 0.003566741943359375, 0.004294395446777344, 0.0050220489501953125, 0.005749702453613281, 0.00647735595703125, 0.007205009460449219, 0.007932662963867188, 0.008660316467285156, 0.009387969970703125, 0.010115623474121094, 0.010843276977539062, 0.011570930480957031, 0.012298583984375, 0.013026237487792969, 0.013753890991210938, 0.014481544494628906, 0.015209197998046875, 0.015936851501464844, 0.016664505004882812, 0.01739215850830078, 0.01811981201171875, 0.01884746551513672, 0.019575119018554688, 0.020302772521972656, 0.021030426025390625, 0.021758079528808594, 0.022485733032226562, 0.02321338653564453, 0.0239410400390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 12.0, 8.0, 11.0, 17.0, 29.0, 43.0, 68.0, 59.0, 131.0, 183.0, 334.0, 594.0, 1107.0, 2106.0, 4406.0, 9797.0, 26866.0, 96809.0, 414529.0, 366834.0, 83120.0, 23938.0, 9043.0, 4130.0, 1928.0, 1078.0, 557.0, 301.0, 177.0, 102.0, 70.0, 41.0, 39.0, 15.0, 24.0, 14.0, 7.0, 8.0, 4.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0216064453125, -0.02100539207458496, -0.020404338836669922, -0.019803285598754883, -0.019202232360839844, -0.018601179122924805, -0.018000125885009766, -0.017399072647094727, -0.016798019409179688, -0.01619696617126465, -0.01559591293334961, -0.01499485969543457, -0.014393806457519531, -0.013792753219604492, -0.013191699981689453, -0.012590646743774414, -0.011989593505859375, -0.011388540267944336, -0.010787487030029297, -0.010186433792114258, -0.009585380554199219, -0.00898432731628418, -0.00838327407836914, -0.0077822208404541016, -0.0071811676025390625, -0.0065801143646240234, -0.005979061126708984, -0.005378007888793945, -0.004776954650878906, -0.004175901412963867, -0.003574848175048828, -0.002973794937133789, -0.00237274169921875, -0.001771688461303711, -0.0011706352233886719, -0.0005695819854736328, 3.147125244140625e-05, 0.0006325244903564453, 0.0012335777282714844, 0.0018346309661865234, 0.0024356842041015625, 0.0030367374420166016, 0.0036377906799316406, 0.00423884391784668, 0.004839897155761719, 0.005440950393676758, 0.006042003631591797, 0.006643056869506836, 0.007244110107421875, 0.007845163345336914, 0.008446216583251953, 0.009047269821166992, 0.009648323059082031, 0.01024937629699707, 0.01085042953491211, 0.011451482772827148, 0.012052536010742188, 0.012653589248657227, 0.013254642486572266, 0.013855695724487305, 0.014456748962402344, 0.015057802200317383, 0.015658855438232422, 0.01625990867614746, 0.0168609619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 12.0, 8.0, 7.0, 13.0, 20.0, 19.0, 22.0, 33.0, 37.0, 40.0, 52.0, 51.0, 64.0, 75.0, 82.0, 58.0, 53.0, 49.0, 40.0, 45.0, 37.0, 33.0, 32.0, 26.0, 24.0, 9.0, 6.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.02414870262145996, -0.023379802703857422, -0.022610902786254883, -0.021842002868652344, -0.021073102951049805, -0.020304203033447266, -0.019535303115844727, -0.018766403198242188, -0.01799750328063965, -0.01722860336303711, -0.01645970344543457, -0.01569080352783203, -0.014921903610229492, -0.014153003692626953, -0.013384103775024414, -0.012615203857421875, -0.011846303939819336, -0.011077404022216797, -0.010308504104614258, -0.009539604187011719, -0.00877070426940918, -0.00800180435180664, -0.0072329044342041016, -0.0064640045166015625, -0.0056951045989990234, -0.004926204681396484, -0.004157304763793945, -0.0033884048461914062, -0.002619504928588867, -0.0018506050109863281, -0.001081705093383789, -0.00031280517578125, 0.00045609474182128906, 0.0012249946594238281, 0.001993894577026367, 0.0027627944946289062, 0.0035316944122314453, 0.004300594329833984, 0.0050694942474365234, 0.0058383941650390625, 0.0066072940826416016, 0.007376194000244141, 0.00814509391784668, 0.008913993835449219, 0.009682893753051758, 0.010451793670654297, 0.011220693588256836, 0.011989593505859375, 0.012758493423461914, 0.013527393341064453, 0.014296293258666992, 0.015065193176269531, 0.01583409309387207, 0.01660299301147461, 0.01737189292907715, 0.018140792846679688, 0.018909692764282227, 0.019678592681884766, 0.020447492599487305, 0.021216392517089844, 0.021985292434692383, 0.022754192352294922, 0.02352309226989746, 0.0242919921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 3.0, 4.0, 7.0, 14.0, 25.0, 32.0, 40.0, 62.0, 98.0, 163.0, 273.0, 513.0, 883.0, 1763.0, 3579.0, 7468.0, 16722.0, 41461.0, 134433.0, 514361.0, 224882.0, 59854.0, 22523.0, 9877.0, 4670.0, 2246.0, 1156.0, 619.0, 325.0, 174.0, 106.0, 67.0, 42.0, 34.0, 27.0, 16.0, 12.0, 5.0, 10.0, 5.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072021484375, -0.006959438323974609, -0.006716728210449219, -0.006474018096923828, -0.0062313079833984375, -0.005988597869873047, -0.005745887756347656, -0.005503177642822266, -0.005260467529296875, -0.005017757415771484, -0.004775047302246094, -0.004532337188720703, -0.0042896270751953125, -0.004046916961669922, -0.0038042068481445312, -0.0035614967346191406, -0.00331878662109375, -0.0030760765075683594, -0.0028333663940429688, -0.002590656280517578, -0.0023479461669921875, -0.002105236053466797, -0.0018625259399414062, -0.0016198158264160156, -0.001377105712890625, -0.0011343955993652344, -0.0008916854858398438, -0.0006489753723144531, -0.0004062652587890625, -0.00016355514526367188, 7.915496826171875e-05, 0.0003218650817871094, 0.0005645751953125, 0.0008072853088378906, 0.0010499954223632812, 0.0012927055358886719, 0.0015354156494140625, 0.0017781257629394531, 0.0020208358764648438, 0.0022635459899902344, 0.002506256103515625, 0.0027489662170410156, 0.0029916763305664062, 0.003234386444091797, 0.0034770965576171875, 0.003719806671142578, 0.003962516784667969, 0.004205226898193359, 0.00444793701171875, 0.004690647125244141, 0.004933357238769531, 0.005176067352294922, 0.0054187774658203125, 0.005661487579345703, 0.005904197692871094, 0.006146907806396484, 0.006389617919921875, 0.006632328033447266, 0.006875038146972656, 0.007117748260498047, 0.0073604583740234375, 0.007603168487548828, 0.007845878601074219, 0.00808858871459961, 0.008331298828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 12.0, 19.0, 23.0, 34.0, 49.0, 60.0, 67.0, 76.0, 88.0, 71.0, 93.0, 71.0, 81.0, 63.0, 54.0, 31.0, 25.0, 21.0, 9.0, 5.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.9664249420166016e-05, -5.7783909142017365e-05, -5.590356886386871e-05, -5.402322858572006e-05, -5.214288830757141e-05, -5.026254802942276e-05, -4.838220775127411e-05, -4.650186747312546e-05, -4.462152719497681e-05, -4.2741186916828156e-05, -4.0860846638679504e-05, -3.898050636053085e-05, -3.71001660823822e-05, -3.521982580423355e-05, -3.33394855260849e-05, -3.145914524793625e-05, -2.9578804969787598e-05, -2.7698464691638947e-05, -2.5818124413490295e-05, -2.3937784135341644e-05, -2.2057443857192993e-05, -2.0177103579044342e-05, -1.829676330089569e-05, -1.641642302274704e-05, -1.4536082744598389e-05, -1.2655742466449738e-05, -1.0775402188301086e-05, -8.895061910152435e-06, -7.014721632003784e-06, -5.134381353855133e-06, -3.254041075706482e-06, -1.3737007975578308e-06, 5.066394805908203e-07, 2.3869797587394714e-06, 4.2673200368881226e-06, 6.147660315036774e-06, 8.028000593185425e-06, 9.908340871334076e-06, 1.1788681149482727e-05, 1.3669021427631378e-05, 1.554936170578003e-05, 1.742970198392868e-05, 1.931004226207733e-05, 2.1190382540225983e-05, 2.3070722818374634e-05, 2.4951063096523285e-05, 2.6831403374671936e-05, 2.8711743652820587e-05, 3.059208393096924e-05, 3.247242420911789e-05, 3.435276448726654e-05, 3.623310476541519e-05, 3.811344504356384e-05, 3.9993785321712494e-05, 4.1874125599861145e-05, 4.3754465878009796e-05, 4.563480615615845e-05, 4.75151464343071e-05, 4.939548671245575e-05, 5.12758269906044e-05, 5.315616726875305e-05, 5.50365075469017e-05, 5.6916847825050354e-05, 5.8797188103199005e-05, 6.0677528381347656e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 16.0, 20.0, 22.0, 36.0, 55.0, 100.0, 153.0, 324.0, 687.0, 1454.0, 3527.0, 9388.0, 29239.0, 114672.0, 585012.0, 230291.0, 49610.0, 14770.0, 5127.0, 2077.0, 933.0, 450.0, 233.0, 130.0, 77.0, 46.0, 32.0, 14.0, 11.0, 3.0, 7.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.01105499267578125, -0.010736465454101562, -0.010417938232421875, -0.010099411010742188, -0.0097808837890625, -0.009462356567382812, -0.009143829345703125, -0.008825302124023438, -0.00850677490234375, -0.008188247680664062, -0.007869720458984375, -0.0075511932373046875, -0.007232666015625, -0.0069141387939453125, -0.006595611572265625, -0.0062770843505859375, -0.00595855712890625, -0.0056400299072265625, -0.005321502685546875, -0.0050029754638671875, -0.0046844482421875, -0.0043659210205078125, -0.004047393798828125, -0.0037288665771484375, -0.00341033935546875, -0.0030918121337890625, -0.002773284912109375, -0.0024547576904296875, -0.00213623046875, -0.0018177032470703125, -0.001499176025390625, -0.0011806488037109375, -0.00086212158203125, -0.0005435943603515625, -0.000225067138671875, 9.34600830078125e-05, 0.0004119873046875, 0.0007305145263671875, 0.001049041748046875, 0.0013675689697265625, 0.00168609619140625, 0.0020046234130859375, 0.002323150634765625, 0.0026416778564453125, 0.002960205078125, 0.0032787322998046875, 0.003597259521484375, 0.0039157867431640625, 0.00423431396484375, 0.0045528411865234375, 0.004871368408203125, 0.0051898956298828125, 0.0055084228515625, 0.0058269500732421875, 0.006145477294921875, 0.0064640045166015625, 0.00678253173828125, 0.0071010589599609375, 0.007419586181640625, 0.0077381134033203125, 0.008056640625, 0.008375167846679688, 0.008693695068359375, 0.009012222290039062, 0.00933074951171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 13.0, 16.0, 20.0, 24.0, 29.0, 23.0, 43.0, 57.0, 88.0, 158.0, 160.0, 80.0, 52.0, 46.0, 40.0, 26.0, 28.0, 17.0, 17.0, 11.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006984710693359375, -0.006715595722198486, -0.006446480751037598, -0.006177365779876709, -0.00590825080871582, -0.005639135837554932, -0.005370020866394043, -0.005100905895233154, -0.004831790924072266, -0.004562675952911377, -0.004293560981750488, -0.0040244460105896, -0.003755331039428711, -0.0034862160682678223, -0.0032171010971069336, -0.002947986125946045, -0.0026788711547851562, -0.0024097561836242676, -0.002140641212463379, -0.0018715262413024902, -0.0016024112701416016, -0.0013332962989807129, -0.0010641813278198242, -0.0007950663566589355, -0.0005259513854980469, -0.0002568364143371582, 1.2278556823730469e-05, 0.00028139352798461914, 0.0005505084991455078, 0.0008196234703063965, 0.0010887384414672852, 0.0013578534126281738, 0.0016269683837890625, 0.0018960833549499512, 0.00216519832611084, 0.0024343132972717285, 0.002703428268432617, 0.002972543239593506, 0.0032416582107543945, 0.003510773181915283, 0.003779888153076172, 0.0040490031242370605, 0.004318118095397949, 0.004587233066558838, 0.0048563480377197266, 0.005125463008880615, 0.005394577980041504, 0.005663692951202393, 0.005932807922363281, 0.00620192289352417, 0.006471037864685059, 0.006740152835845947, 0.007009267807006836, 0.007278382778167725, 0.007547497749328613, 0.007816612720489502, 0.00808572769165039, 0.00835484266281128, 0.008623957633972168, 0.008893072605133057, 0.009162187576293945, 0.009431302547454834, 0.009700417518615723, 0.009969532489776611, 0.0102386474609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 14.0, 42.0, 71.0, 133.0, 183.0, 170.0, 150.0, 99.0, 57.0, 31.0, 18.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09029798209667206, -0.0861680805683136, -0.08203817903995514, -0.07790827006101608, -0.07377836853265762, -0.06964846700429916, -0.06551855802536011, -0.06138865649700165, -0.05725875496864319, -0.05312885344028473, -0.04899894818663597, -0.04486904293298721, -0.040739141404628754, -0.036609239876270294, -0.032479334622621536, -0.028349431231617928, -0.02421952784061432, -0.02008962444961071, -0.0159597210586071, -0.011829817667603493, -0.007699914276599884, -0.0035700108855962753, 0.0005598925054073334, 0.004689795896410942, 0.00881969928741455, 0.01294960267841816, 0.017079506069421768, 0.021209409460425377, 0.025339312851428986, 0.029469216242432594, 0.0335991196334362, 0.03772902488708496, 0.04185891151428223, 0.045988813042640686, 0.050118718296289444, 0.0542486235499382, 0.05837852507829666, 0.06250842660665512, 0.06663833558559418, 0.07076823711395264, 0.0748981386423111, 0.07902804017066956, 0.08315794169902802, 0.08728785067796707, 0.09141775220632553, 0.09554765373468399, 0.09967756271362305, 0.1038074642419815, 0.10793736577033997, 0.11206726729869843, 0.11619716882705688, 0.12032707780599594, 0.1244569793343544, 0.12858688831329346, 0.13271678984165192, 0.13684669137001038, 0.14097659289836884, 0.1451064944267273, 0.14923639595508575, 0.1533662974834442, 0.15749621391296387, 0.16162611544132233, 0.1657560169696808, 0.16988591849803925, 0.1740158200263977]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 11.0, 12.0, 11.0, 14.0, 18.0, 33.0, 23.0, 36.0, 33.0, 33.0, 35.0, 38.0, 60.0, 59.0, 64.0, 52.0, 48.0, 48.0, 44.0, 41.0, 47.0, 52.0, 36.0, 24.0, 22.0, 22.0, 14.0, 18.0, 10.0, 5.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0652388334274292, -0.06305601447820663, -0.06087320297956467, -0.0586903840303421, -0.056507568806409836, -0.05432475358247757, -0.052141934633255005, -0.04995911940932274, -0.04777630418539047, -0.045593488961458206, -0.04341067373752594, -0.041227854788303375, -0.03904503956437111, -0.03686222434043884, -0.03467940539121628, -0.03249659016728401, -0.030313774943351746, -0.02813095971941948, -0.025948142632842064, -0.02376532554626465, -0.021582510322332382, -0.019399695098400116, -0.0172168780118227, -0.01503406185656786, -0.012851245701313019, -0.010668429546058178, -0.008485613390803337, -0.006302797235548496, -0.004119981080293655, -0.0019371649250388145, 0.0002456512302160263, 0.002428467385470867, 0.004611283540725708, 0.006794099695980549, 0.00897691585123539, 0.01115973200649023, 0.013342548161745071, 0.015525364316999912, 0.017708180472254753, 0.01989099755883217, 0.022073812782764435, 0.0242566280066967, 0.026439445093274117, 0.028622262179851532, 0.030805077403783798, 0.032987892627716064, 0.03517071157693863, 0.037353526800870895, 0.03953634202480316, 0.04171915724873543, 0.043901972472667694, 0.04608479142189026, 0.048267606645822525, 0.05045042186975479, 0.052633240818977356, 0.05481605604290962, 0.05699887126684189, 0.059181686490774155, 0.06136450171470642, 0.06354732066392899, 0.06573013961315155, 0.06791295111179352, 0.07009577006101608, 0.07227858155965805, 0.07446140050888062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 14.0, 8.0, 16.0, 14.0, 20.0, 28.0, 41.0, 51.0, 82.0, 99.0, 140.0, 223.0, 394.0, 702.0, 1701.0, 3612.0, 9481.0, 50049.0, 1706378.0, 2337990.0, 63763.0, 12140.0, 4017.0, 1526.0, 686.0, 352.0, 223.0, 140.0, 96.0, 66.0, 47.0, 32.0, 41.0, 24.0, 15.0, 17.0, 7.0, 6.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0244598388671875, -0.02371954917907715, -0.022979259490966797, -0.022238969802856445, -0.021498680114746094, -0.020758390426635742, -0.02001810073852539, -0.01927781105041504, -0.018537521362304688, -0.017797231674194336, -0.017056941986083984, -0.016316652297973633, -0.015576362609863281, -0.01483607292175293, -0.014095783233642578, -0.013355493545532227, -0.012615203857421875, -0.011874914169311523, -0.011134624481201172, -0.01039433479309082, -0.009654045104980469, -0.008913755416870117, -0.008173465728759766, -0.007433176040649414, -0.0066928863525390625, -0.005952596664428711, -0.005212306976318359, -0.004472017288208008, -0.0037317276000976562, -0.0029914379119873047, -0.002251148223876953, -0.0015108585357666016, -0.00077056884765625, -3.0279159545898438e-05, 0.0007100105285644531, 0.0014503002166748047, 0.0021905899047851562, 0.002930879592895508, 0.0036711692810058594, 0.004411458969116211, 0.0051517486572265625, 0.005892038345336914, 0.006632328033447266, 0.007372617721557617, 0.008112907409667969, 0.00885319709777832, 0.009593486785888672, 0.010333776473999023, 0.011074066162109375, 0.011814355850219727, 0.012554645538330078, 0.01329493522644043, 0.014035224914550781, 0.014775514602661133, 0.015515804290771484, 0.016256093978881836, 0.016996383666992188, 0.01773667335510254, 0.01847696304321289, 0.019217252731323242, 0.019957542419433594, 0.020697832107543945, 0.021438121795654297, 0.02217841148376465, 0.022918701171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 13.0, 50.0, 102.0, 184.0, 208.0, 185.0, 123.0, 95.0, 29.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.024368762969970703, -0.023575782775878906, -0.02278280258178711, -0.021989822387695312, -0.021196842193603516, -0.02040386199951172, -0.019610881805419922, -0.018817901611328125, -0.018024921417236328, -0.01723194122314453, -0.016438961029052734, -0.015645980834960938, -0.01485300064086914, -0.014060020446777344, -0.013267040252685547, -0.01247406005859375, -0.011681079864501953, -0.010888099670410156, -0.01009511947631836, -0.009302139282226562, -0.008509159088134766, -0.007716178894042969, -0.006923198699951172, -0.006130218505859375, -0.005337238311767578, -0.004544258117675781, -0.0037512779235839844, -0.0029582977294921875, -0.0021653175354003906, -0.0013723373413085938, -0.0005793571472167969, 0.000213623046875, 0.0010066032409667969, 0.0017995834350585938, 0.0025925636291503906, 0.0033855438232421875, 0.004178524017333984, 0.004971504211425781, 0.005764484405517578, 0.006557464599609375, 0.007350444793701172, 0.008143424987792969, 0.008936405181884766, 0.009729385375976562, 0.01052236557006836, 0.011315345764160156, 0.012108325958251953, 0.01290130615234375, 0.013694286346435547, 0.014487266540527344, 0.01528024673461914, 0.016073226928710938, 0.016866207122802734, 0.01765918731689453, 0.018452167510986328, 0.019245147705078125, 0.020038127899169922, 0.02083110809326172, 0.021624088287353516, 0.022417068481445312, 0.02321004867553711, 0.024003028869628906, 0.024796009063720703, 0.0255889892578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 5.0, 8.0, 8.0, 13.0, 20.0, 24.0, 39.0, 59.0, 84.0, 136.0, 235.0, 386.0, 632.0, 1273.0, 2630.0, 5976.0, 17067.0, 74445.0, 731695.0, 3115389.0, 192928.0, 33318.0, 9805.0, 3928.0, 1871.0, 934.0, 530.0, 291.0, 176.0, 123.0, 70.0, 60.0, 32.0, 26.0, 24.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0158233642578125, -0.015242576599121094, -0.014661788940429688, -0.014081001281738281, -0.013500213623046875, -0.012919425964355469, -0.012338638305664062, -0.011757850646972656, -0.01117706298828125, -0.010596275329589844, -0.010015487670898438, -0.009434700012207031, -0.008853912353515625, -0.008273124694824219, -0.0076923370361328125, -0.007111549377441406, -0.00653076171875, -0.005949974060058594, -0.0053691864013671875, -0.004788398742675781, -0.004207611083984375, -0.0036268234252929688, -0.0030460357666015625, -0.0024652481079101562, -0.00188446044921875, -0.0013036727905273438, -0.0007228851318359375, -0.00014209747314453125, 0.000438690185546875, 0.0010194778442382812, 0.0016002655029296875, 0.0021810531616210938, 0.0027618408203125, 0.0033426284790039062, 0.0039234161376953125, 0.004504203796386719, 0.005084991455078125, 0.005665779113769531, 0.0062465667724609375, 0.006827354431152344, 0.00740814208984375, 0.007988929748535156, 0.008569717407226562, 0.009150505065917969, 0.009731292724609375, 0.010312080383300781, 0.010892868041992188, 0.011473655700683594, 0.012054443359375, 0.012635231018066406, 0.013216018676757812, 0.013796806335449219, 0.014377593994140625, 0.014958381652832031, 0.015539169311523438, 0.016119956970214844, 0.01670074462890625, 0.017281532287597656, 0.017862319946289062, 0.01844310760498047, 0.019023895263671875, 0.01960468292236328, 0.020185470581054688, 0.020766258239746094, 0.0213470458984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 12.0, 5.0, 17.0, 22.0, 31.0, 73.0, 113.0, 207.0, 446.0, 1080.0, 1053.0, 475.0, 199.0, 121.0, 78.0, 53.0, 26.0, 17.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.024522066116333008, -0.023821353912353516, -0.023120641708374023, -0.02241992950439453, -0.02171921730041504, -0.021018505096435547, -0.020317792892456055, -0.019617080688476562, -0.01891636848449707, -0.018215656280517578, -0.017514944076538086, -0.016814231872558594, -0.0161135196685791, -0.01541280746459961, -0.014712095260620117, -0.014011383056640625, -0.013310670852661133, -0.01260995864868164, -0.011909246444702148, -0.011208534240722656, -0.010507822036743164, -0.009807109832763672, -0.00910639762878418, -0.008405685424804688, -0.007704973220825195, -0.007004261016845703, -0.006303548812866211, -0.005602836608886719, -0.0049021244049072266, -0.004201412200927734, -0.003500699996948242, -0.00279998779296875, -0.002099275588989258, -0.0013985633850097656, -0.0006978511810302734, 2.86102294921875e-06, 0.0007035732269287109, 0.0014042854309082031, 0.0021049976348876953, 0.0028057098388671875, 0.0035064220428466797, 0.004207134246826172, 0.004907846450805664, 0.005608558654785156, 0.0063092708587646484, 0.007009983062744141, 0.007710695266723633, 0.008411407470703125, 0.009112119674682617, 0.00981283187866211, 0.010513544082641602, 0.011214256286621094, 0.011914968490600586, 0.012615680694580078, 0.01331639289855957, 0.014017105102539062, 0.014717817306518555, 0.015418529510498047, 0.01611924171447754, 0.01681995391845703, 0.017520666122436523, 0.018221378326416016, 0.018922090530395508, 0.019622802734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 26.0, 71.0, 191.0, 298.0, 266.0, 94.0, 31.0, 11.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2374257594347, -0.23108816146850586, -0.2247505784034729, -0.21841298043727875, -0.2120753824710846, -0.20573779940605164, -0.19940020143985748, -0.19306260347366333, -0.18672500550746918, -0.18038740754127502, -0.17404982447624207, -0.1677122265100479, -0.16137462854385376, -0.1550370454788208, -0.14869944751262665, -0.1423618495464325, -0.13602426648139954, -0.12968666851520538, -0.12334907799959183, -0.11701148748397827, -0.11067388951778412, -0.10433629900217056, -0.097998708486557, -0.09166111052036285, -0.0853235125541687, -0.07898592203855515, -0.07264832407236099, -0.06631073355674744, -0.059973135590553284, -0.05363554507493973, -0.04729795083403587, -0.04096035659313202, -0.034622758626937866, -0.028285164386034012, -0.021947570145130157, -0.015609977766871452, -0.009272383525967598, -0.002934791147708893, 0.0034028030931949615, 0.009740397334098816, 0.01607799157500267, 0.022415585815906525, 0.02875318005681038, 0.03509077429771423, 0.04142836481332779, 0.047765959054231644, 0.0541035532951355, 0.06044114753603935, 0.0667787417769432, 0.07311633229255676, 0.07945393025875092, 0.08579152077436447, 0.09212911874055862, 0.09846670925617218, 0.10480430722236633, 0.11114189773797989, 0.11747948825359344, 0.123817078769207, 0.13015466928482056, 0.1364922672510147, 0.14282986521720886, 0.14916744828224182, 0.15550504624843597, 0.16184264421463013, 0.16818024218082428]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 6.0, 20.0, 10.0, 11.0, 26.0, 33.0, 19.0, 31.0, 42.0, 45.0, 45.0, 44.0, 52.0, 43.0, 58.0, 60.0, 58.0, 56.0, 54.0, 44.0, 39.0, 33.0, 28.0, 34.0, 23.0, 20.0, 10.0, 9.0, 7.0, 10.0, 13.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06550824642181396, -0.06372520327568054, -0.06194215267896652, -0.0601591058075428, -0.05837605893611908, -0.05659301206469536, -0.05480996519327164, -0.053026918321847916, -0.051243871450424194, -0.04946082457900047, -0.04767777770757675, -0.04589473083615303, -0.04411168396472931, -0.04232863709330559, -0.040545590221881866, -0.038762543350458145, -0.036979496479034424, -0.0351964496076107, -0.03341340273618698, -0.03163035586476326, -0.02984730899333954, -0.028064262121915817, -0.026281215250492096, -0.024498168379068375, -0.022715121507644653, -0.020932074636220932, -0.01914902776479721, -0.01736598089337349, -0.015582934021949768, -0.013799887150526047, -0.012016840279102325, -0.010233793407678604, -0.008450746536254883, -0.0066676996648311615, -0.00488465279340744, -0.003101605921983719, -0.0013185590505599976, 0.00046448782086372375, 0.002247534692287445, 0.004030581563711166, 0.005813628435134888, 0.007596675306558609, 0.00937972217798233, 0.011162769049406052, 0.012945815920829773, 0.014728862792253494, 0.016511909663677216, 0.018294956535100937, 0.020078003406524658, 0.02186105027794838, 0.0236440971493721, 0.025427144020795822, 0.027210190892219543, 0.028993237763643265, 0.030776284635066986, 0.03255933150649071, 0.03434237837791443, 0.03612542524933815, 0.03790847212076187, 0.03969151899218559, 0.041474565863609314, 0.043257612735033035, 0.04504065960645676, 0.04682370647788048, 0.0486067533493042]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 10.0, 12.0, 9.0, 14.0, 27.0, 43.0, 45.0, 66.0, 103.0, 116.0, 146.0, 266.0, 405.0, 829.0, 1924.0, 6555.0, 40570.0, 690160.0, 280306.0, 19581.0, 4239.0, 1333.0, 672.0, 352.0, 205.0, 149.0, 112.0, 44.0, 52.0, 41.0, 32.0, 26.0, 22.0, 16.0, 13.0, 9.0, 10.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0435791015625, -0.04201316833496094, -0.040447235107421875, -0.03888130187988281, -0.03731536865234375, -0.03574943542480469, -0.034183502197265625, -0.03261756896972656, -0.0310516357421875, -0.029485702514648438, -0.027919769287109375, -0.026353836059570312, -0.02478790283203125, -0.023221969604492188, -0.021656036376953125, -0.020090103149414062, -0.018524169921875, -0.016958236694335938, -0.015392303466796875, -0.013826370239257812, -0.01226043701171875, -0.010694503784179688, -0.009128570556640625, -0.0075626373291015625, -0.0059967041015625, -0.0044307708740234375, -0.002864837646484375, -0.0012989044189453125, 0.00026702880859375, 0.0018329620361328125, 0.003398895263671875, 0.0049648284912109375, 0.00653076171875, 0.008096694946289062, 0.009662628173828125, 0.011228561401367188, 0.01279449462890625, 0.014360427856445312, 0.015926361083984375, 0.017492294311523438, 0.0190582275390625, 0.020624160766601562, 0.022190093994140625, 0.023756027221679688, 0.02532196044921875, 0.026887893676757812, 0.028453826904296875, 0.030019760131835938, 0.031585693359375, 0.03315162658691406, 0.034717559814453125, 0.03628349304199219, 0.03784942626953125, 0.03941535949707031, 0.040981292724609375, 0.04254722595214844, 0.0441131591796875, 0.04567909240722656, 0.047245025634765625, 0.04881095886230469, 0.05037689208984375, 0.05194282531738281, 0.053508758544921875, 0.05507469177246094, 0.056640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 21.0, 55.0, 101.0, 183.0, 194.0, 152.0, 150.0, 77.0, 48.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247650146484375, -0.02398514747619629, -0.023205280303955078, -0.022425413131713867, -0.021645545959472656, -0.020865678787231445, -0.020085811614990234, -0.019305944442749023, -0.018526077270507812, -0.0177462100982666, -0.01696634292602539, -0.01618647575378418, -0.015406608581542969, -0.014626741409301758, -0.013846874237060547, -0.013067007064819336, -0.012287139892578125, -0.011507272720336914, -0.010727405548095703, -0.009947538375854492, -0.009167671203613281, -0.00838780403137207, -0.007607936859130859, -0.0068280696868896484, -0.0060482025146484375, -0.0052683353424072266, -0.004488468170166016, -0.0037086009979248047, -0.0029287338256835938, -0.002148866653442383, -0.0013689994812011719, -0.0005891323089599609, 0.00019073486328125, 0.0009706020355224609, 0.0017504692077636719, 0.002530336380004883, 0.0033102035522460938, 0.004090070724487305, 0.004869937896728516, 0.0056498050689697266, 0.0064296722412109375, 0.0072095394134521484, 0.00798940658569336, 0.00876927375793457, 0.009549140930175781, 0.010329008102416992, 0.011108875274658203, 0.011888742446899414, 0.012668609619140625, 0.013448476791381836, 0.014228343963623047, 0.015008211135864258, 0.01578807830810547, 0.01656794548034668, 0.01734781265258789, 0.0181276798248291, 0.018907546997070312, 0.019687414169311523, 0.020467281341552734, 0.021247148513793945, 0.022027015686035156, 0.022806882858276367, 0.023586750030517578, 0.02436661720275879, 0.025146484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 3.0, 9.0, 12.0, 14.0, 25.0, 30.0, 64.0, 102.0, 156.0, 250.0, 397.0, 765.0, 1470.0, 3045.0, 6827.0, 17946.0, 56450.0, 258351.0, 517676.0, 130451.0, 32823.0, 11868.0, 4847.0, 2249.0, 1212.0, 604.0, 332.0, 189.0, 126.0, 96.0, 61.0, 26.0, 24.0, 11.0, 8.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.026275634765625, -0.025509357452392578, -0.024743080139160156, -0.023976802825927734, -0.023210525512695312, -0.02244424819946289, -0.02167797088623047, -0.020911693572998047, -0.020145416259765625, -0.019379138946533203, -0.01861286163330078, -0.01784658432006836, -0.017080307006835938, -0.016314029693603516, -0.015547752380371094, -0.014781475067138672, -0.01401519775390625, -0.013248920440673828, -0.012482643127441406, -0.011716365814208984, -0.010950088500976562, -0.01018381118774414, -0.009417533874511719, -0.008651256561279297, -0.007884979248046875, -0.007118701934814453, -0.006352424621582031, -0.005586147308349609, -0.0048198699951171875, -0.004053592681884766, -0.0032873153686523438, -0.002521038055419922, -0.0017547607421875, -0.0009884834289550781, -0.00022220611572265625, 0.0005440711975097656, 0.0013103485107421875, 0.0020766258239746094, 0.0028429031372070312, 0.003609180450439453, 0.004375457763671875, 0.005141735076904297, 0.005908012390136719, 0.006674289703369141, 0.0074405670166015625, 0.008206844329833984, 0.008973121643066406, 0.009739398956298828, 0.01050567626953125, 0.011271953582763672, 0.012038230895996094, 0.012804508209228516, 0.013570785522460938, 0.01433706283569336, 0.015103340148925781, 0.015869617462158203, 0.016635894775390625, 0.017402172088623047, 0.01816844940185547, 0.01893472671508789, 0.019701004028320312, 0.020467281341552734, 0.021233558654785156, 0.021999835968017578, 0.02276611328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 16.0, 16.0, 17.0, 25.0, 33.0, 38.0, 53.0, 79.0, 68.0, 62.0, 75.0, 70.0, 48.0, 60.0, 48.0, 53.0, 43.0, 33.0, 26.0, 34.0, 9.0, 22.0, 12.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02227783203125, -0.021418094635009766, -0.02055835723876953, -0.019698619842529297, -0.018838882446289062, -0.017979145050048828, -0.017119407653808594, -0.01625967025756836, -0.015399932861328125, -0.01454019546508789, -0.013680458068847656, -0.012820720672607422, -0.011960983276367188, -0.011101245880126953, -0.010241508483886719, -0.009381771087646484, -0.00852203369140625, -0.007662296295166016, -0.006802558898925781, -0.005942821502685547, -0.0050830841064453125, -0.004223346710205078, -0.0033636093139648438, -0.0025038719177246094, -0.001644134521484375, -0.0007843971252441406, 7.534027099609375e-05, 0.0009350776672363281, 0.0017948150634765625, 0.002654552459716797, 0.0035142898559570312, 0.004374027252197266, 0.0052337646484375, 0.006093502044677734, 0.006953239440917969, 0.007812976837158203, 0.008672714233398438, 0.009532451629638672, 0.010392189025878906, 0.01125192642211914, 0.012111663818359375, 0.01297140121459961, 0.013831138610839844, 0.014690876007080078, 0.015550613403320312, 0.016410350799560547, 0.01727008819580078, 0.018129825592041016, 0.01898956298828125, 0.019849300384521484, 0.02070903778076172, 0.021568775177001953, 0.022428512573242188, 0.023288249969482422, 0.024147987365722656, 0.02500772476196289, 0.025867462158203125, 0.02672719955444336, 0.027586936950683594, 0.028446674346923828, 0.029306411743164062, 0.030166149139404297, 0.03102588653564453, 0.031885623931884766, 0.032745361328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 10.0, 10.0, 12.0, 24.0, 27.0, 46.0, 52.0, 87.0, 117.0, 153.0, 239.0, 320.0, 547.0, 778.0, 1328.0, 2186.0, 4249.0, 9393.0, 29317.0, 241268.0, 671234.0, 59818.0, 14201.0, 5749.0, 2778.0, 1607.0, 970.0, 655.0, 412.0, 280.0, 199.0, 131.0, 91.0, 76.0, 40.0, 39.0, 23.0, 19.0, 15.0, 12.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.017822265625, -0.017251253128051758, -0.016680240631103516, -0.016109228134155273, -0.015538215637207031, -0.014967203140258789, -0.014396190643310547, -0.013825178146362305, -0.013254165649414062, -0.01268315315246582, -0.012112140655517578, -0.011541128158569336, -0.010970115661621094, -0.010399103164672852, -0.00982809066772461, -0.009257078170776367, -0.008686065673828125, -0.008115053176879883, -0.007544040679931641, -0.0069730281829833984, -0.006402015686035156, -0.005831003189086914, -0.005259990692138672, -0.00468897819519043, -0.0041179656982421875, -0.0035469532012939453, -0.002975940704345703, -0.002404928207397461, -0.0018339157104492188, -0.0012629032135009766, -0.0006918907165527344, -0.00012087821960449219, 0.00045013427734375, 0.0010211467742919922, 0.0015921592712402344, 0.0021631717681884766, 0.0027341842651367188, 0.003305196762084961, 0.003876209259033203, 0.004447221755981445, 0.0050182342529296875, 0.00558924674987793, 0.006160259246826172, 0.006731271743774414, 0.007302284240722656, 0.007873296737670898, 0.00844430923461914, 0.009015321731567383, 0.009586334228515625, 0.010157346725463867, 0.01072835922241211, 0.011299371719360352, 0.011870384216308594, 0.012441396713256836, 0.013012409210205078, 0.01358342170715332, 0.014154434204101562, 0.014725446701049805, 0.015296459197998047, 0.01586747169494629, 0.01643848419189453, 0.017009496688842773, 0.017580509185791016, 0.018151521682739258, 0.0187225341796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 15.0, 23.0, 18.0, 32.0, 43.0, 69.0, 89.0, 108.0, 164.0, 117.0, 89.0, 63.0, 49.0, 22.0, 22.0, 13.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.673833847045898e-05, -9.393226355314255e-05, -9.112618863582611e-05, -8.832011371850967e-05, -8.551403880119324e-05, -8.27079638838768e-05, -7.990188896656036e-05, -7.709581404924393e-05, -7.428973913192749e-05, -7.148366421461105e-05, -6.867758929729462e-05, -6.587151437997818e-05, -6.306543946266174e-05, -6.0259364545345306e-05, -5.745328962802887e-05, -5.464721471071243e-05, -5.1841139793395996e-05, -4.903506487607956e-05, -4.622898995876312e-05, -4.3422915041446686e-05, -4.061684012413025e-05, -3.781076520681381e-05, -3.5004690289497375e-05, -3.219861537218094e-05, -2.9392540454864502e-05, -2.6586465537548065e-05, -2.378039062023163e-05, -2.097431570291519e-05, -1.8168240785598755e-05, -1.5362165868282318e-05, -1.2556090950965881e-05, -9.750016033649445e-06, -6.943941116333008e-06, -4.137866199016571e-06, -1.3317912817001343e-06, 1.4742836356163025e-06, 4.280358552932739e-06, 7.086433470249176e-06, 9.892508387565613e-06, 1.269858330488205e-05, 1.5504658222198486e-05, 1.8310733139514923e-05, 2.111680805683136e-05, 2.3922882974147797e-05, 2.6728957891464233e-05, 2.953503280878067e-05, 3.234110772609711e-05, 3.5147182643413544e-05, 3.795325756072998e-05, 4.075933247804642e-05, 4.3565407395362854e-05, 4.637148231267929e-05, 4.917755722999573e-05, 5.1983632147312164e-05, 5.47897070646286e-05, 5.759578198194504e-05, 6.0401856899261475e-05, 6.320793181657791e-05, 6.601400673389435e-05, 6.882008165121078e-05, 7.162615656852722e-05, 7.443223148584366e-05, 7.72383064031601e-05, 8.004438132047653e-05, 8.285045623779297e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 14.0, 10.0, 32.0, 31.0, 67.0, 99.0, 149.0, 319.0, 480.0, 967.0, 1747.0, 3287.0, 7466.0, 19941.0, 73627.0, 539350.0, 322669.0, 50768.0, 15253.0, 6158.0, 2761.0, 1441.0, 791.0, 446.0, 255.0, 136.0, 88.0, 51.0, 35.0, 22.0, 23.0, 10.0, 5.0, 7.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0135345458984375, -0.013109922409057617, -0.012685298919677734, -0.012260675430297852, -0.011836051940917969, -0.011411428451538086, -0.010986804962158203, -0.01056218147277832, -0.010137557983398438, -0.009712934494018555, -0.009288311004638672, -0.008863687515258789, -0.008439064025878906, -0.008014440536499023, -0.007589817047119141, -0.007165193557739258, -0.006740570068359375, -0.006315946578979492, -0.005891323089599609, -0.0054666996002197266, -0.005042076110839844, -0.004617452621459961, -0.004192829132080078, -0.0037682056427001953, -0.0033435821533203125, -0.0029189586639404297, -0.002494335174560547, -0.002069711685180664, -0.0016450881958007812, -0.0012204647064208984, -0.0007958412170410156, -0.0003712177276611328, 5.340576171875e-05, 0.0004780292510986328, 0.0009026527404785156, 0.0013272762298583984, 0.0017518997192382812, 0.002176523208618164, 0.002601146697998047, 0.0030257701873779297, 0.0034503936767578125, 0.0038750171661376953, 0.004299640655517578, 0.004724264144897461, 0.005148887634277344, 0.0055735111236572266, 0.005998134613037109, 0.006422758102416992, 0.006847381591796875, 0.007272005081176758, 0.007696628570556641, 0.008121252059936523, 0.008545875549316406, 0.008970499038696289, 0.009395122528076172, 0.009819746017456055, 0.010244369506835938, 0.01066899299621582, 0.011093616485595703, 0.011518239974975586, 0.011942863464355469, 0.012367486953735352, 0.012792110443115234, 0.013216733932495117, 0.013641357421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 5.0, 17.0, 8.0, 22.0, 26.0, 50.0, 110.0, 254.0, 219.0, 110.0, 45.0, 22.0, 13.0, 11.0, 14.0, 10.0, 6.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0184783935546875, -0.017933368682861328, -0.017388343811035156, -0.016843318939208984, -0.016298294067382812, -0.01575326919555664, -0.015208244323730469, -0.014663219451904297, -0.014118194580078125, -0.013573169708251953, -0.013028144836425781, -0.01248311996459961, -0.011938095092773438, -0.011393070220947266, -0.010848045349121094, -0.010303020477294922, -0.00975799560546875, -0.009212970733642578, -0.008667945861816406, -0.008122920989990234, -0.0075778961181640625, -0.007032871246337891, -0.006487846374511719, -0.005942821502685547, -0.005397796630859375, -0.004852771759033203, -0.004307746887207031, -0.0037627220153808594, -0.0032176971435546875, -0.0026726722717285156, -0.0021276473999023438, -0.0015826225280761719, -0.00103759765625, -0.0004925727844238281, 5.245208740234375e-05, 0.0005974769592285156, 0.0011425018310546875, 0.0016875267028808594, 0.0022325515747070312, 0.002777576446533203, 0.003322601318359375, 0.003867626190185547, 0.004412651062011719, 0.004957675933837891, 0.0055027008056640625, 0.006047725677490234, 0.006592750549316406, 0.007137775421142578, 0.00768280029296875, 0.008227825164794922, 0.008772850036621094, 0.009317874908447266, 0.009862899780273438, 0.01040792465209961, 0.010952949523925781, 0.011497974395751953, 0.012042999267578125, 0.012588024139404297, 0.013133049011230469, 0.01367807388305664, 0.014223098754882812, 0.014768123626708984, 0.015313148498535156, 0.015858173370361328, 0.0164031982421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 17.0, 50.0, 210.0, 386.0, 207.0, 82.0, 30.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21220669150352478, -0.20177192986011505, -0.19133715331554413, -0.1809023916721344, -0.17046761512756348, -0.16003285348415375, -0.14959809184074402, -0.1391633152961731, -0.12872855365276337, -0.11829378455877304, -0.10785901546478271, -0.09742425382137299, -0.08698948472738266, -0.07655471563339233, -0.0661199539899826, -0.05568518489599228, -0.04525041580200195, -0.03481564670801163, -0.0243808813393116, -0.013946115970611572, -0.0035113468766212463, 0.00692342221736908, 0.01735818386077881, 0.027792952954769135, 0.03822772204875946, 0.048662491142749786, 0.059097256511449814, 0.06953202188014984, 0.07996679097414017, 0.0904015600681305, 0.10083632171154022, 0.11127109080553055, 0.12170583009719849, 0.13214059174060822, 0.14257536828517914, 0.15301012992858887, 0.1634449064731598, 0.17387966811656952, 0.18431442975997925, 0.19474920630455017, 0.2051839679479599, 0.21561872959136963, 0.22605350613594055, 0.23648826777935028, 0.24692302942276, 0.25735780596733093, 0.26779258251190186, 0.2782273292541504, 0.2886621057987213, 0.29909688234329224, 0.30953162908554077, 0.3199664056301117, 0.3304011821746826, 0.34083592891693115, 0.3512707054615021, 0.361705482006073, 0.37214022874832153, 0.38257500529289246, 0.393009752035141, 0.4034445285797119, 0.41387930512428284, 0.42431408166885376, 0.4347488284111023, 0.4451836049556732, 0.45561838150024414]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 7.0, 6.0, 14.0, 10.0, 11.0, 18.0, 25.0, 29.0, 31.0, 43.0, 58.0, 60.0, 54.0, 56.0, 55.0, 69.0, 57.0, 47.0, 41.0, 44.0, 54.0, 32.0, 32.0, 32.0, 19.0, 22.0, 21.0, 14.0, 12.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06769245862960815, -0.06512940675020218, -0.0625663548707962, -0.06000330671668053, -0.05744025483727455, -0.054877202957868576, -0.0523141548037529, -0.049751102924346924, -0.04718805104494095, -0.04462499916553497, -0.042061947286129, -0.03949889913201332, -0.036935847252607346, -0.03437279537320137, -0.03180974721908569, -0.029246695339679718, -0.026683643460273743, -0.024120591580867767, -0.02155754156410694, -0.018994491547346115, -0.01643143966794014, -0.013868388719856739, -0.011305337771773338, -0.008742287755012512, -0.006179235875606537, -0.003616184927523136, -0.0010531339794397354, 0.0015099169686436653, 0.004072967916727066, 0.006636018864810467, 0.009199069812893867, 0.011762119829654694, 0.014325171709060669, 0.016888223588466644, 0.01945127360522747, 0.022014323621988297, 0.024577375501394272, 0.027140427380800247, 0.029703477397561073, 0.0322665274143219, 0.034829579293727875, 0.03739263117313385, 0.039955683052539825, 0.0425187312066555, 0.04508178308606148, 0.04764483496546745, 0.05020788311958313, 0.052770934998989105, 0.05533398687839508, 0.057897038757801056, 0.06046009063720703, 0.063023142516613, 0.06558619439601898, 0.06814923882484436, 0.07071229070425034, 0.07327534258365631, 0.07583839446306229, 0.07840144634246826, 0.08096449822187424, 0.08352755010128021, 0.08609059453010559, 0.08865364640951157, 0.09121669828891754, 0.09377975016832352, 0.09634280204772949]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 7.0, 14.0, 26.0, 33.0, 52.0, 100.0, 196.0, 450.0, 1409.0, 7710.0, 107363.0, 3982209.0, 85616.0, 6861.0, 1405.0, 421.0, 186.0, 93.0, 48.0, 29.0, 19.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044586181640625, -0.04312276840209961, -0.04165935516357422, -0.04019594192504883, -0.03873252868652344, -0.03726911544799805, -0.035805702209472656, -0.034342288970947266, -0.032878875732421875, -0.031415462493896484, -0.029952049255371094, -0.028488636016845703, -0.027025222778320312, -0.025561809539794922, -0.02409839630126953, -0.02263498306274414, -0.02117156982421875, -0.01970815658569336, -0.01824474334716797, -0.016781330108642578, -0.015317916870117188, -0.013854503631591797, -0.012391090393066406, -0.010927677154541016, -0.009464263916015625, -0.008000850677490234, -0.006537437438964844, -0.005074024200439453, -0.0036106109619140625, -0.002147197723388672, -0.0006837844848632812, 0.0007796287536621094, 0.0022430419921875, 0.0037064552307128906, 0.005169868469238281, 0.006633281707763672, 0.008096694946289062, 0.009560108184814453, 0.011023521423339844, 0.012486934661865234, 0.013950347900390625, 0.015413761138916016, 0.016877174377441406, 0.018340587615966797, 0.019804000854492188, 0.021267414093017578, 0.02273082733154297, 0.02419424057006836, 0.02565765380859375, 0.02712106704711914, 0.02858448028564453, 0.030047893524169922, 0.03151130676269531, 0.0329747200012207, 0.034438133239746094, 0.035901546478271484, 0.037364959716796875, 0.038828372955322266, 0.040291786193847656, 0.04175519943237305, 0.04321861267089844, 0.04468202590942383, 0.04614543914794922, 0.04760885238647461, 0.049072265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 12.0, 33.0, 71.0, 119.0, 166.0, 177.0, 152.0, 132.0, 71.0, 40.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.024810791015625, -0.024048566818237305, -0.02328634262084961, -0.022524118423461914, -0.02176189422607422, -0.020999670028686523, -0.020237445831298828, -0.019475221633911133, -0.018712997436523438, -0.017950773239135742, -0.017188549041748047, -0.01642632484436035, -0.015664100646972656, -0.014901876449584961, -0.014139652252197266, -0.01337742805480957, -0.012615203857421875, -0.01185297966003418, -0.011090755462646484, -0.010328531265258789, -0.009566307067871094, -0.008804082870483398, -0.008041858673095703, -0.007279634475708008, -0.0065174102783203125, -0.005755186080932617, -0.004992961883544922, -0.0042307376861572266, -0.0034685134887695312, -0.002706289291381836, -0.0019440650939941406, -0.0011818408966064453, -0.00041961669921875, 0.0003426074981689453, 0.0011048316955566406, 0.001867055892944336, 0.0026292800903320312, 0.0033915042877197266, 0.004153728485107422, 0.004915952682495117, 0.0056781768798828125, 0.006440401077270508, 0.007202625274658203, 0.007964849472045898, 0.008727073669433594, 0.009489297866821289, 0.010251522064208984, 0.01101374626159668, 0.011775970458984375, 0.01253819465637207, 0.013300418853759766, 0.014062643051147461, 0.014824867248535156, 0.015587091445922852, 0.016349315643310547, 0.017111539840698242, 0.017873764038085938, 0.018635988235473633, 0.019398212432861328, 0.020160436630249023, 0.02092266082763672, 0.021684885025024414, 0.02244710922241211, 0.023209333419799805, 0.0239715576171875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 10.0, 3.0, 11.0, 13.0, 19.0, 31.0, 57.0, 90.0, 149.0, 272.0, 501.0, 931.0, 2176.0, 5190.0, 16322.0, 79628.0, 1525268.0, 2436574.0, 97489.0, 18870.0, 5881.0, 2390.0, 1134.0, 552.0, 309.0, 165.0, 77.0, 60.0, 36.0, 14.0, 20.0, 15.0, 11.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.029022216796875, -0.028169870376586914, -0.027317523956298828, -0.026465177536010742, -0.025612831115722656, -0.02476048469543457, -0.023908138275146484, -0.0230557918548584, -0.022203445434570312, -0.021351099014282227, -0.02049875259399414, -0.019646406173706055, -0.01879405975341797, -0.017941713333129883, -0.017089366912841797, -0.01623702049255371, -0.015384674072265625, -0.014532327651977539, -0.013679981231689453, -0.012827634811401367, -0.011975288391113281, -0.011122941970825195, -0.01027059555053711, -0.009418249130249023, -0.008565902709960938, -0.0077135562896728516, -0.006861209869384766, -0.00600886344909668, -0.005156517028808594, -0.004304170608520508, -0.003451824188232422, -0.002599477767944336, -0.00174713134765625, -0.0008947849273681641, -4.2438507080078125e-05, 0.0008099079132080078, 0.0016622543334960938, 0.0025146007537841797, 0.0033669471740722656, 0.0042192935943603516, 0.0050716400146484375, 0.0059239864349365234, 0.006776332855224609, 0.007628679275512695, 0.008481025695800781, 0.009333372116088867, 0.010185718536376953, 0.011038064956665039, 0.011890411376953125, 0.012742757797241211, 0.013595104217529297, 0.014447450637817383, 0.015299797058105469, 0.016152143478393555, 0.01700448989868164, 0.017856836318969727, 0.018709182739257812, 0.0195615291595459, 0.020413875579833984, 0.02126622200012207, 0.022118568420410156, 0.022970914840698242, 0.023823261260986328, 0.024675607681274414, 0.0255279541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 9.0, 12.0, 13.0, 18.0, 28.0, 52.0, 78.0, 105.0, 248.0, 480.0, 1193.0, 935.0, 356.0, 223.0, 113.0, 68.0, 45.0, 24.0, 17.0, 21.0, 5.0, 11.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0276641845703125, -0.02689075469970703, -0.026117324829101562, -0.025343894958496094, -0.024570465087890625, -0.023797035217285156, -0.023023605346679688, -0.02225017547607422, -0.02147674560546875, -0.02070331573486328, -0.019929885864257812, -0.019156455993652344, -0.018383026123046875, -0.017609596252441406, -0.016836166381835938, -0.01606273651123047, -0.015289306640625, -0.014515876770019531, -0.013742446899414062, -0.012969017028808594, -0.012195587158203125, -0.011422157287597656, -0.010648727416992188, -0.009875297546386719, -0.00910186767578125, -0.008328437805175781, -0.0075550079345703125, -0.006781578063964844, -0.006008148193359375, -0.005234718322753906, -0.0044612884521484375, -0.0036878585815429688, -0.0029144287109375, -0.0021409988403320312, -0.0013675689697265625, -0.0005941390991210938, 0.000179290771484375, 0.0009527206420898438, 0.0017261505126953125, 0.0024995803833007812, 0.00327301025390625, 0.004046440124511719, 0.0048198699951171875, 0.005593299865722656, 0.006366729736328125, 0.007140159606933594, 0.007913589477539062, 0.008687019348144531, 0.00946044921875, 0.010233879089355469, 0.011007308959960938, 0.011780738830566406, 0.012554168701171875, 0.013327598571777344, 0.014101028442382812, 0.014874458312988281, 0.01564788818359375, 0.01642131805419922, 0.017194747924804688, 0.017968177795410156, 0.018741607666015625, 0.019515037536621094, 0.020288467407226562, 0.02106189727783203, 0.0218353271484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 10.0, 29.0, 39.0, 128.0, 247.0, 291.0, 145.0, 51.0, 38.0, 8.0, 4.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.32973966002464294, -0.32270506024360657, -0.3156704902648926, -0.3086358904838562, -0.3016012907028198, -0.29456669092178345, -0.28753212094306946, -0.2804975211620331, -0.2734629213809967, -0.2664283215999603, -0.25939375162124634, -0.25235915184020996, -0.24532455205917358, -0.2382899671792984, -0.23125536739826202, -0.22422078251838684, -0.21718618273735046, -0.21015159785747528, -0.2031169980764389, -0.19608241319656372, -0.18904781341552734, -0.18201322853565216, -0.17497862875461578, -0.1679440438747406, -0.16090945899486542, -0.15387487411499023, -0.14684027433395386, -0.13980568945407867, -0.1327710896730423, -0.12573650479316711, -0.11870190501213074, -0.11166732013225555, -0.10463272035121918, -0.0975981280207634, -0.09056353569030762, -0.08352894335985184, -0.07649435102939606, -0.06945976614952087, -0.062425170093774796, -0.055390577763319016, -0.048355985432863235, -0.041321393102407455, -0.034286800771951675, -0.027252210304141045, -0.020217617973685265, -0.013183027505874634, -0.006148435175418854, 0.0008861571550369263, 0.007920749485492706, 0.014955341815948486, 0.021989934146404266, 0.029024524614214897, 0.036059118807315826, 0.04309370741248131, 0.05012829974293709, 0.05716289207339287, 0.06419748067855835, 0.07123207300901413, 0.07826666533946991, 0.08530125766992569, 0.09233585000038147, 0.09937043488025665, 0.10640503466129303, 0.11343961954116821, 0.12047421932220459]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 10.0, 12.0, 12.0, 17.0, 28.0, 20.0, 28.0, 31.0, 43.0, 39.0, 40.0, 45.0, 58.0, 54.0, 66.0, 54.0, 60.0, 60.0, 53.0, 45.0, 45.0, 31.0, 27.0, 20.0, 27.0, 16.0, 14.0, 10.0, 8.0, 9.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08672666549682617, -0.0843854695558548, -0.08204426616430283, -0.07970306277275085, -0.07736186683177948, -0.0750206708908081, -0.07267946749925613, -0.07033826410770416, -0.06799706816673279, -0.06565587222576141, -0.06331466883420944, -0.06097346916794777, -0.058632269501686096, -0.05629106983542442, -0.05394987016916275, -0.05160867050290108, -0.049267470836639404, -0.04692627117037773, -0.04458507150411606, -0.042243871837854385, -0.03990267217159271, -0.03756147250533104, -0.035220272839069366, -0.032879073172807693, -0.03053787350654602, -0.028196673840284348, -0.025855474174022675, -0.023514274507761, -0.02117307484149933, -0.018831875175237656, -0.016490675508975983, -0.01414947584271431, -0.011808276176452637, -0.009467076510190964, -0.007125876843929291, -0.004784677177667618, -0.002443477511405945, -0.00010227784514427185, 0.002238921821117401, 0.004580121487379074, 0.006921321153640747, 0.00926252081990242, 0.011603720486164093, 0.013944920152425766, 0.01628611981868744, 0.018627319484949112, 0.020968519151210785, 0.023309718817472458, 0.02565091848373413, 0.027992118149995804, 0.030333317816257477, 0.03267451748251915, 0.03501571714878082, 0.037356916815042496, 0.03969811648130417, 0.04203931614756584, 0.044380515813827515, 0.04672171548008919, 0.04906291514635086, 0.051404114812612534, 0.05374531447887421, 0.05608651414513588, 0.05842771381139755, 0.060768913477659225, 0.0631101131439209]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 12.0, 25.0, 23.0, 40.0, 74.0, 92.0, 133.0, 218.0, 307.0, 532.0, 931.0, 2234.0, 8955.0, 82462.0, 738644.0, 192081.0, 15697.0, 3180.0, 1217.0, 547.0, 375.0, 232.0, 132.0, 110.0, 67.0, 52.0, 37.0, 30.0, 24.0, 15.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0574951171875, -0.055619239807128906, -0.05374336242675781, -0.05186748504638672, -0.049991607666015625, -0.04811573028564453, -0.04623985290527344, -0.044363975524902344, -0.04248809814453125, -0.040612220764160156, -0.03873634338378906, -0.03686046600341797, -0.034984588623046875, -0.03310871124267578, -0.031232833862304688, -0.029356956481933594, -0.0274810791015625, -0.025605201721191406, -0.023729324340820312, -0.02185344696044922, -0.019977569580078125, -0.01810169219970703, -0.016225814819335938, -0.014349937438964844, -0.01247406005859375, -0.010598182678222656, -0.008722305297851562, -0.006846427917480469, -0.004970550537109375, -0.0030946731567382812, -0.0012187957763671875, 0.0006570816040039062, 0.002532958984375, 0.004408836364746094, 0.0062847137451171875, 0.008160591125488281, 0.010036468505859375, 0.011912345886230469, 0.013788223266601562, 0.015664100646972656, 0.01753997802734375, 0.019415855407714844, 0.021291732788085938, 0.02316761016845703, 0.025043487548828125, 0.02691936492919922, 0.028795242309570312, 0.030671119689941406, 0.0325469970703125, 0.034422874450683594, 0.03629875183105469, 0.03817462921142578, 0.040050506591796875, 0.04192638397216797, 0.04380226135253906, 0.045678138732910156, 0.04755401611328125, 0.049429893493652344, 0.05130577087402344, 0.05318164825439453, 0.055057525634765625, 0.05693340301513672, 0.05880928039550781, 0.060685157775878906, 0.06256103515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 39.0, 82.0, 120.0, 166.0, 166.0, 144.0, 123.0, 73.0, 50.0, 16.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.027191162109375, -0.026380300521850586, -0.025569438934326172, -0.024758577346801758, -0.023947715759277344, -0.02313685417175293, -0.022325992584228516, -0.0215151309967041, -0.020704269409179688, -0.019893407821655273, -0.01908254623413086, -0.018271684646606445, -0.01746082305908203, -0.016649961471557617, -0.015839099884033203, -0.015028238296508789, -0.014217376708984375, -0.013406515121459961, -0.012595653533935547, -0.011784791946411133, -0.010973930358886719, -0.010163068771362305, -0.00935220718383789, -0.008541345596313477, -0.0077304840087890625, -0.0069196224212646484, -0.006108760833740234, -0.00529789924621582, -0.004487037658691406, -0.003676176071166992, -0.002865314483642578, -0.002054452896118164, -0.00124359130859375, -0.00043272972106933594, 0.0003781318664550781, 0.0011889934539794922, 0.0019998550415039062, 0.0028107166290283203, 0.0036215782165527344, 0.0044324398040771484, 0.0052433013916015625, 0.0060541629791259766, 0.006865024566650391, 0.007675886154174805, 0.008486747741699219, 0.009297609329223633, 0.010108470916748047, 0.010919332504272461, 0.011730194091796875, 0.012541055679321289, 0.013351917266845703, 0.014162778854370117, 0.014973640441894531, 0.015784502029418945, 0.01659536361694336, 0.017406225204467773, 0.018217086791992188, 0.0190279483795166, 0.019838809967041016, 0.02064967155456543, 0.021460533142089844, 0.022271394729614258, 0.023082256317138672, 0.023893117904663086, 0.0247039794921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 16.0, 10.0, 14.0, 25.0, 45.0, 52.0, 114.0, 179.0, 289.0, 484.0, 851.0, 1601.0, 3116.0, 6278.0, 13697.0, 33161.0, 88003.0, 235090.0, 357649.0, 189396.0, 69216.0, 26810.0, 11445.0, 5144.0, 2631.0, 1327.0, 764.0, 424.0, 285.0, 172.0, 89.0, 57.0, 28.0, 27.0, 12.0, 10.0, 7.0, 9.0, 4.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.02199530601501465, -0.021316051483154297, -0.020636796951293945, -0.019957542419433594, -0.019278287887573242, -0.01859903335571289, -0.01791977882385254, -0.017240524291992188, -0.016561269760131836, -0.015882015228271484, -0.015202760696411133, -0.014523506164550781, -0.01384425163269043, -0.013164997100830078, -0.012485742568969727, -0.011806488037109375, -0.011127233505249023, -0.010447978973388672, -0.00976872444152832, -0.009089469909667969, -0.008410215377807617, -0.007730960845947266, -0.007051706314086914, -0.0063724517822265625, -0.005693197250366211, -0.005013942718505859, -0.004334688186645508, -0.0036554336547851562, -0.0029761791229248047, -0.002296924591064453, -0.0016176700592041016, -0.00093841552734375, -0.00025916099548339844, 0.0004200935363769531, 0.0010993480682373047, 0.0017786026000976562, 0.002457857131958008, 0.0031371116638183594, 0.003816366195678711, 0.0044956207275390625, 0.005174875259399414, 0.005854129791259766, 0.006533384323120117, 0.007212638854980469, 0.00789189338684082, 0.008571147918701172, 0.009250402450561523, 0.009929656982421875, 0.010608911514282227, 0.011288166046142578, 0.01196742057800293, 0.012646675109863281, 0.013325929641723633, 0.014005184173583984, 0.014684438705444336, 0.015363693237304688, 0.01604294776916504, 0.01672220230102539, 0.017401456832885742, 0.018080711364746094, 0.018759965896606445, 0.019439220428466797, 0.02011847496032715, 0.0207977294921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 9.0, 3.0, 8.0, 15.0, 7.0, 12.0, 18.0, 25.0, 33.0, 30.0, 29.0, 31.0, 38.0, 59.0, 49.0, 54.0, 43.0, 56.0, 53.0, 40.0, 45.0, 55.0, 30.0, 39.0, 29.0, 30.0, 30.0, 24.0, 24.0, 19.0, 19.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0234375, -0.02261519432067871, -0.021792888641357422, -0.020970582962036133, -0.020148277282714844, -0.019325971603393555, -0.018503665924072266, -0.017681360244750977, -0.016859054565429688, -0.0160367488861084, -0.01521444320678711, -0.01439213752746582, -0.013569831848144531, -0.012747526168823242, -0.011925220489501953, -0.011102914810180664, -0.010280609130859375, -0.009458303451538086, -0.008635997772216797, -0.007813692092895508, -0.006991386413574219, -0.00616908073425293, -0.005346775054931641, -0.0045244693756103516, -0.0037021636962890625, -0.0028798580169677734, -0.0020575523376464844, -0.0012352466583251953, -0.00041294097900390625, 0.0004093647003173828, 0.0012316703796386719, 0.002053976058959961, 0.00287628173828125, 0.003698587417602539, 0.004520893096923828, 0.005343198776245117, 0.006165504455566406, 0.006987810134887695, 0.007810115814208984, 0.008632421493530273, 0.009454727172851562, 0.010277032852172852, 0.01109933853149414, 0.01192164421081543, 0.012743949890136719, 0.013566255569458008, 0.014388561248779297, 0.015210866928100586, 0.016033172607421875, 0.016855478286743164, 0.017677783966064453, 0.018500089645385742, 0.01932239532470703, 0.02014470100402832, 0.02096700668334961, 0.0217893123626709, 0.022611618041992188, 0.023433923721313477, 0.024256229400634766, 0.025078535079956055, 0.025900840759277344, 0.026723146438598633, 0.027545452117919922, 0.02836775779724121, 0.0291900634765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 14.0, 24.0, 31.0, 57.0, 68.0, 89.0, 117.0, 209.0, 339.0, 513.0, 755.0, 1249.0, 1898.0, 3327.0, 5894.0, 10966.0, 22319.0, 50442.0, 133286.0, 357922.0, 283258.0, 97592.0, 38851.0, 17867.0, 8845.0, 4963.0, 2866.0, 1736.0, 1047.0, 667.0, 456.0, 273.0, 208.0, 131.0, 73.0, 59.0, 38.0, 25.0, 19.0, 16.0, 6.0, 11.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00896453857421875, -0.008683085441589355, -0.008401632308959961, -0.008120179176330566, -0.007838726043701172, -0.007557272911071777, -0.007275819778442383, -0.006994366645812988, -0.006712913513183594, -0.006431460380554199, -0.006150007247924805, -0.00586855411529541, -0.005587100982666016, -0.005305647850036621, -0.0050241947174072266, -0.004742741584777832, -0.0044612884521484375, -0.004179835319519043, -0.0038983821868896484, -0.003616929054260254, -0.0033354759216308594, -0.003054022789001465, -0.0027725696563720703, -0.0024911165237426758, -0.0022096633911132812, -0.0019282102584838867, -0.0016467571258544922, -0.0013653039932250977, -0.0010838508605957031, -0.0008023977279663086, -0.0005209445953369141, -0.00023949146270751953, 4.1961669921875e-05, 0.00032341480255126953, 0.0006048679351806641, 0.0008863210678100586, 0.0011677742004394531, 0.0014492273330688477, 0.0017306804656982422, 0.0020121335983276367, 0.0022935867309570312, 0.0025750398635864258, 0.0028564929962158203, 0.003137946128845215, 0.0034193992614746094, 0.003700852394104004, 0.0039823055267333984, 0.004263758659362793, 0.0045452117919921875, 0.004826664924621582, 0.0051081180572509766, 0.005389571189880371, 0.005671024322509766, 0.00595247745513916, 0.006233930587768555, 0.006515383720397949, 0.006796836853027344, 0.007078289985656738, 0.007359743118286133, 0.007641196250915527, 0.007922649383544922, 0.008204102516174316, 0.008485555648803711, 0.008767008781433105, 0.0090484619140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 5.0, 5.0, 7.0, 11.0, 8.0, 15.0, 10.0, 38.0, 28.0, 41.0, 48.0, 62.0, 73.0, 90.0, 91.0, 88.0, 75.0, 52.0, 48.0, 42.0, 28.0, 27.0, 19.0, 17.0, 13.0, 10.0, 8.0, 6.0, 4.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.012222290039062e-05, -8.743628859519958e-05, -8.475035429000854e-05, -8.20644199848175e-05, -7.937848567962646e-05, -7.669255137443542e-05, -7.400661706924438e-05, -7.132068276405334e-05, -6.86347484588623e-05, -6.594881415367126e-05, -6.326287984848022e-05, -6.0576945543289185e-05, -5.7891011238098145e-05, -5.5205076932907104e-05, -5.2519142627716064e-05, -4.9833208322525024e-05, -4.7147274017333984e-05, -4.4461339712142944e-05, -4.1775405406951904e-05, -3.9089471101760864e-05, -3.6403536796569824e-05, -3.3717602491378784e-05, -3.1031668186187744e-05, -2.8345733880996704e-05, -2.5659799575805664e-05, -2.2973865270614624e-05, -2.0287930965423584e-05, -1.7601996660232544e-05, -1.4916062355041504e-05, -1.2230128049850464e-05, -9.544193744659424e-06, -6.858259439468384e-06, -4.172325134277344e-06, -1.4863908290863037e-06, 1.1995434761047363e-06, 3.885477781295776e-06, 6.571412086486816e-06, 9.257346391677856e-06, 1.1943280696868896e-05, 1.4629215002059937e-05, 1.7315149307250977e-05, 2.0001083612442017e-05, 2.2687017917633057e-05, 2.5372952222824097e-05, 2.8058886528015137e-05, 3.074482083320618e-05, 3.343075513839722e-05, 3.611668944358826e-05, 3.88026237487793e-05, 4.148855805397034e-05, 4.417449235916138e-05, 4.686042666435242e-05, 4.954636096954346e-05, 5.22322952747345e-05, 5.491822957992554e-05, 5.760416388511658e-05, 6.029009819030762e-05, 6.297603249549866e-05, 6.56619668006897e-05, 6.834790110588074e-05, 7.103383541107178e-05, 7.371976971626282e-05, 7.640570402145386e-05, 7.90916383266449e-05, 8.177757263183594e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 21.0, 28.0, 36.0, 64.0, 104.0, 196.0, 342.0, 721.0, 1369.0, 2643.0, 5326.0, 11628.0, 28025.0, 77713.0, 261495.0, 432523.0, 144550.0, 47326.0, 18531.0, 8067.0, 3801.0, 1883.0, 920.0, 506.0, 268.0, 153.0, 94.0, 52.0, 42.0, 27.0, 19.0, 12.0, 8.0, 3.0, 9.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.01181793212890625, -0.01147305965423584, -0.01112818717956543, -0.01078331470489502, -0.01043844223022461, -0.0100935697555542, -0.009748697280883789, -0.009403824806213379, -0.009058952331542969, -0.008714079856872559, -0.008369207382202148, -0.008024334907531738, -0.007679462432861328, -0.007334589958190918, -0.006989717483520508, -0.006644845008850098, -0.0062999725341796875, -0.005955100059509277, -0.005610227584838867, -0.005265355110168457, -0.004920482635498047, -0.004575610160827637, -0.0042307376861572266, -0.0038858652114868164, -0.0035409927368164062, -0.003196120262145996, -0.002851247787475586, -0.0025063753128051758, -0.0021615028381347656, -0.0018166303634643555, -0.0014717578887939453, -0.0011268854141235352, -0.000782012939453125, -0.00043714046478271484, -9.226799011230469e-05, 0.00025260448455810547, 0.0005974769592285156, 0.0009423494338989258, 0.001287221908569336, 0.001632094383239746, 0.0019769668579101562, 0.0023218393325805664, 0.0026667118072509766, 0.0030115842819213867, 0.003356456756591797, 0.003701329231262207, 0.004046201705932617, 0.004391074180603027, 0.0047359466552734375, 0.005080819129943848, 0.005425691604614258, 0.005770564079284668, 0.006115436553955078, 0.006460309028625488, 0.0068051815032958984, 0.007150053977966309, 0.007494926452636719, 0.007839798927307129, 0.008184671401977539, 0.00852954387664795, 0.00887441635131836, 0.00921928882598877, 0.00956416130065918, 0.00990903377532959, 0.01025390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 7.0, 6.0, 7.0, 11.0, 11.0, 20.0, 21.0, 20.0, 44.0, 43.0, 48.0, 100.0, 110.0, 119.0, 98.0, 69.0, 72.0, 39.0, 39.0, 30.0, 15.0, 12.0, 15.0, 15.0, 6.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0138092041015625, -0.013407349586486816, -0.013005495071411133, -0.01260364055633545, -0.012201786041259766, -0.011799931526184082, -0.011398077011108398, -0.010996222496032715, -0.010594367980957031, -0.010192513465881348, -0.009790658950805664, -0.00938880443572998, -0.008986949920654297, -0.008585095405578613, -0.00818324089050293, -0.007781386375427246, -0.0073795318603515625, -0.006977677345275879, -0.006575822830200195, -0.006173968315124512, -0.005772113800048828, -0.0053702592849731445, -0.004968404769897461, -0.004566550254821777, -0.004164695739746094, -0.00376284122467041, -0.0033609867095947266, -0.002959132194519043, -0.0025572776794433594, -0.0021554231643676758, -0.0017535686492919922, -0.0013517141342163086, -0.000949859619140625, -0.0005480051040649414, -0.0001461505889892578, 0.0002557039260864258, 0.0006575584411621094, 0.001059412956237793, 0.0014612674713134766, 0.0018631219863891602, 0.0022649765014648438, 0.0026668310165405273, 0.003068685531616211, 0.0034705400466918945, 0.003872394561767578, 0.004274249076843262, 0.004676103591918945, 0.005077958106994629, 0.0054798126220703125, 0.005881667137145996, 0.00628352165222168, 0.006685376167297363, 0.007087230682373047, 0.0074890851974487305, 0.007890939712524414, 0.008292794227600098, 0.008694648742675781, 0.009096503257751465, 0.009498357772827148, 0.009900212287902832, 0.010302066802978516, 0.0107039213180542, 0.011105775833129883, 0.011507630348205566, 0.01190948486328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 14.0, 16.0, 28.0, 45.0, 102.0, 126.0, 147.0, 164.0, 114.0, 96.0, 57.0, 37.0, 19.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.24636536836624146, -0.24099762737751007, -0.23562990128993988, -0.2302621603012085, -0.2248944342136383, -0.21952669322490692, -0.21415895223617554, -0.20879122614860535, -0.20342348515987396, -0.19805574417114258, -0.1926880180835724, -0.187320277094841, -0.18195253610610962, -0.17658481001853943, -0.17121706902980804, -0.16584932804107666, -0.16048160195350647, -0.15511386096477509, -0.1497461348772049, -0.1443783938884735, -0.13901066780090332, -0.13364292681217194, -0.12827518582344055, -0.12290745228528976, -0.11753971874713898, -0.11217198520898819, -0.1068042516708374, -0.10143651068210602, -0.09606877714395523, -0.09070104360580444, -0.08533330261707306, -0.07996556907892227, -0.07459785044193268, -0.06923011690378189, -0.0638623833656311, -0.05849464237689972, -0.05312690883874893, -0.047759175300598145, -0.04239143803715706, -0.03702370077371597, -0.031655967235565186, -0.02628823183476925, -0.020920496433973312, -0.015552761033177376, -0.01018502563238144, -0.004817290231585503, 0.000550445169210434, 0.00591818243265152, 0.011285915970802307, 0.016653651371598244, 0.02202138677239418, 0.027389122173190117, 0.03275685757398605, 0.03812459111213684, 0.04349232837557793, 0.04886006563901901, 0.0542277991771698, 0.05959553271532059, 0.06496326625347137, 0.07033100724220276, 0.07569874078035355, 0.08106647431850433, 0.08643421530723572, 0.0918019488453865, 0.09716968238353729]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 6.0, 11.0, 10.0, 8.0, 15.0, 8.0, 19.0, 17.0, 20.0, 18.0, 32.0, 28.0, 29.0, 34.0, 50.0, 43.0, 38.0, 39.0, 30.0, 41.0, 50.0, 44.0, 49.0, 43.0, 32.0, 36.0, 25.0, 36.0, 29.0, 22.0, 20.0, 30.0, 30.0, 9.0, 9.0, 11.0, 8.0, 9.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06681299209594727, -0.06453660130500793, -0.062260210514068604, -0.05998382344841957, -0.05770743265748024, -0.05543104186654091, -0.053154654800891876, -0.050878264009952545, -0.048601873219013214, -0.04632548242807388, -0.04404909163713455, -0.04177270457148552, -0.03949631378054619, -0.03721992298960686, -0.034943535923957825, -0.032667145133018494, -0.030390754342079163, -0.02811436355113983, -0.02583797462284565, -0.023561585694551468, -0.021285194903612137, -0.019008804112672806, -0.016732415184378624, -0.014456026256084442, -0.012179635465145111, -0.009903245605528355, -0.007626855745911598, -0.005350465886294842, -0.0030740760266780853, -0.0007976861670613289, 0.0014787036925554276, 0.0037550926208496094, 0.00603148341178894, 0.008307873271405697, 0.010584263131022453, 0.01286065299063921, 0.015137042850255966, 0.017413433641195297, 0.01968982256948948, 0.02196621149778366, 0.024242602288722992, 0.026518993079662323, 0.028795382007956505, 0.031071770936250687, 0.03334816172719002, 0.03562455251812935, 0.03790093958377838, 0.04017733037471771, 0.04245372116565704, 0.044730111956596375, 0.047006502747535706, 0.04928288981318474, 0.05155928060412407, 0.0538356713950634, 0.05611205846071243, 0.058388449251651764, 0.060664840042591095, 0.06294123083353043, 0.06521762162446976, 0.06749401241540909, 0.06977039575576782, 0.07204678654670715, 0.07432317733764648, 0.07659956812858582, 0.07887595891952515]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 7.0, 24.0, 24.0, 38.0, 41.0, 78.0, 140.0, 178.0, 428.0, 1157.0, 4082.0, 14666.0, 96326.0, 3365343.0, 662207.0, 38033.0, 7763.0, 2273.0, 761.0, 300.0, 140.0, 97.0, 53.0, 30.0, 25.0, 16.0, 12.0, 12.0, 2.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029541015625, -0.028548717498779297, -0.027556419372558594, -0.02656412124633789, -0.025571823120117188, -0.024579524993896484, -0.02358722686767578, -0.022594928741455078, -0.021602630615234375, -0.020610332489013672, -0.01961803436279297, -0.018625736236572266, -0.017633438110351562, -0.01664113998413086, -0.015648841857910156, -0.014656543731689453, -0.01366424560546875, -0.012671947479248047, -0.011679649353027344, -0.01068735122680664, -0.009695053100585938, -0.008702754974365234, -0.007710456848144531, -0.006718158721923828, -0.005725860595703125, -0.004733562469482422, -0.0037412643432617188, -0.0027489662170410156, -0.0017566680908203125, -0.0007643699645996094, 0.00022792816162109375, 0.0012202262878417969, 0.0022125244140625, 0.003204822540283203, 0.004197120666503906, 0.005189418792724609, 0.0061817169189453125, 0.007174015045166016, 0.008166313171386719, 0.009158611297607422, 0.010150909423828125, 0.011143207550048828, 0.012135505676269531, 0.013127803802490234, 0.014120101928710938, 0.01511240005493164, 0.016104698181152344, 0.017096996307373047, 0.01808929443359375, 0.019081592559814453, 0.020073890686035156, 0.02106618881225586, 0.022058486938476562, 0.023050785064697266, 0.02404308319091797, 0.025035381317138672, 0.026027679443359375, 0.027019977569580078, 0.02801227569580078, 0.029004573822021484, 0.029996871948242188, 0.03098917007446289, 0.031981468200683594, 0.0329737663269043, 0.033966064453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 31.0, 61.0, 93.0, 138.0, 167.0, 172.0, 127.0, 91.0, 54.0, 40.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0282745361328125, -0.027416467666625977, -0.026558399200439453, -0.02570033073425293, -0.024842262268066406, -0.023984193801879883, -0.02312612533569336, -0.022268056869506836, -0.021409988403320312, -0.02055191993713379, -0.019693851470947266, -0.018835783004760742, -0.01797771453857422, -0.017119646072387695, -0.016261577606201172, -0.015403509140014648, -0.014545440673828125, -0.013687372207641602, -0.012829303741455078, -0.011971235275268555, -0.011113166809082031, -0.010255098342895508, -0.009397029876708984, -0.008538961410522461, -0.0076808929443359375, -0.006822824478149414, -0.005964756011962891, -0.005106687545776367, -0.004248619079589844, -0.0033905506134033203, -0.002532482147216797, -0.0016744136810302734, -0.00081634521484375, 4.172325134277344e-05, 0.0008997917175292969, 0.0017578601837158203, 0.0026159286499023438, 0.003473997116088867, 0.004332065582275391, 0.005190134048461914, 0.0060482025146484375, 0.006906270980834961, 0.007764339447021484, 0.008622407913208008, 0.009480476379394531, 0.010338544845581055, 0.011196613311767578, 0.012054681777954102, 0.012912750244140625, 0.013770818710327148, 0.014628887176513672, 0.015486955642700195, 0.01634502410888672, 0.017203092575073242, 0.018061161041259766, 0.01891922950744629, 0.019777297973632812, 0.020635366439819336, 0.02149343490600586, 0.022351503372192383, 0.023209571838378906, 0.02406764030456543, 0.024925708770751953, 0.025783777236938477, 0.026641845703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 11.0, 25.0, 45.0, 45.0, 75.0, 145.0, 209.0, 378.0, 636.0, 1246.0, 2442.0, 5443.0, 15545.0, 64130.0, 647123.0, 3251388.0, 160626.0, 28559.0, 8787.0, 3543.0, 1714.0, 903.0, 470.0, 273.0, 181.0, 100.0, 73.0, 45.0, 29.0, 24.0, 9.0, 8.0, 10.0, 5.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.031280517578125, -0.030392885208129883, -0.029505252838134766, -0.02861762046813965, -0.02772998809814453, -0.026842355728149414, -0.025954723358154297, -0.02506709098815918, -0.024179458618164062, -0.023291826248168945, -0.022404193878173828, -0.02151656150817871, -0.020628929138183594, -0.019741296768188477, -0.01885366439819336, -0.017966032028198242, -0.017078399658203125, -0.016190767288208008, -0.01530313491821289, -0.014415502548217773, -0.013527870178222656, -0.012640237808227539, -0.011752605438232422, -0.010864973068237305, -0.009977340698242188, -0.00908970832824707, -0.008202075958251953, -0.007314443588256836, -0.006426811218261719, -0.0055391788482666016, -0.004651546478271484, -0.003763914108276367, -0.00287628173828125, -0.001988649368286133, -0.0011010169982910156, -0.00021338462829589844, 0.0006742477416992188, 0.001561880111694336, 0.002449512481689453, 0.0033371448516845703, 0.0042247772216796875, 0.005112409591674805, 0.006000041961669922, 0.006887674331665039, 0.007775306701660156, 0.008662939071655273, 0.00955057144165039, 0.010438203811645508, 0.011325836181640625, 0.012213468551635742, 0.01310110092163086, 0.013988733291625977, 0.014876365661621094, 0.01576399803161621, 0.016651630401611328, 0.017539262771606445, 0.018426895141601562, 0.01931452751159668, 0.020202159881591797, 0.021089792251586914, 0.02197742462158203, 0.02286505699157715, 0.023752689361572266, 0.024640321731567383, 0.0255279541015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 11.0, 17.0, 19.0, 36.0, 43.0, 66.0, 112.0, 240.0, 487.0, 1177.0, 960.0, 401.0, 175.0, 104.0, 67.0, 47.0, 29.0, 17.0, 18.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0269927978515625, -0.026195526123046875, -0.02539825439453125, -0.024600982666015625, -0.0238037109375, -0.023006439208984375, -0.02220916748046875, -0.021411895751953125, -0.0206146240234375, -0.019817352294921875, -0.01902008056640625, -0.018222808837890625, -0.017425537109375, -0.016628265380859375, -0.01583099365234375, -0.015033721923828125, -0.0142364501953125, -0.013439178466796875, -0.01264190673828125, -0.011844635009765625, -0.01104736328125, -0.010250091552734375, -0.00945281982421875, -0.008655548095703125, -0.0078582763671875, -0.007061004638671875, -0.00626373291015625, -0.005466461181640625, -0.004669189453125, -0.003871917724609375, -0.00307464599609375, -0.002277374267578125, -0.0014801025390625, -0.000682830810546875, 0.00011444091796875, 0.000911712646484375, 0.001708984375, 0.002506256103515625, 0.00330352783203125, 0.004100799560546875, 0.0048980712890625, 0.005695343017578125, 0.00649261474609375, 0.007289886474609375, 0.008087158203125, 0.008884429931640625, 0.00968170166015625, 0.010478973388671875, 0.0112762451171875, 0.012073516845703125, 0.01287078857421875, 0.013668060302734375, 0.01446533203125, 0.015262603759765625, 0.01605987548828125, 0.016857147216796875, 0.0176544189453125, 0.018451690673828125, 0.01924896240234375, 0.020046234130859375, 0.020843505859375, 0.021640777587890625, 0.02243804931640625, 0.023235321044921875, 0.0240325927734375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 17.0, 45.0, 134.0, 288.0, 299.0, 130.0, 43.0, 32.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3527269959449768, -0.34388798475265503, -0.33504897356033325, -0.3262099623680115, -0.3173709511756897, -0.3085319399833679, -0.29969292879104614, -0.29085391759872437, -0.2820149064064026, -0.2731758952140808, -0.26433688402175903, -0.25549787282943726, -0.24665886163711548, -0.2378198504447937, -0.22898082435131073, -0.22014181315898895, -0.21130278706550598, -0.2024637758731842, -0.19362476468086243, -0.18478575348854065, -0.17594674229621887, -0.1671077311038971, -0.15826870501041412, -0.14942969381809235, -0.14059068262577057, -0.1317516714334488, -0.12291266024112701, -0.11407364159822464, -0.10523463040590286, -0.09639561921358109, -0.08755660057067871, -0.07871758937835693, -0.06987857818603516, -0.06103956699371338, -0.0522005520761013, -0.04336153715848923, -0.03452252596616745, -0.025683514773845673, -0.016844499856233597, -0.008005484938621521, 0.0008335262537002563, 0.009672539308667183, 0.01851155236363411, 0.027350565418601036, 0.03618957847356796, 0.04502858966588974, 0.053867604583501816, 0.06270661950111389, 0.07154563069343567, 0.08038464188575745, 0.08922365307807922, 0.0980626717209816, 0.10690168291330338, 0.11574069410562515, 0.12457971274852753, 0.1334187239408493, 0.14225773513317108, 0.15109674632549286, 0.15993575751781464, 0.1687747687101364, 0.17761379480361938, 0.18645280599594116, 0.19529181718826294, 0.20413082838058472, 0.2129698395729065]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 15.0, 13.0, 18.0, 27.0, 28.0, 39.0, 41.0, 54.0, 57.0, 52.0, 52.0, 54.0, 68.0, 36.0, 44.0, 48.0, 49.0, 42.0, 42.0, 43.0, 28.0, 20.0, 22.0, 19.0, 12.0, 16.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.08969593048095703, -0.08738823235034943, -0.08508054167032242, -0.08277285099029541, -0.0804651528596878, -0.0781574547290802, -0.07584976404905319, -0.07354207336902618, -0.07123437523841858, -0.06892667710781097, -0.06661898642778397, -0.06431129574775696, -0.06200359761714935, -0.059695903211832047, -0.05738820880651474, -0.055080514401197433, -0.05277281999588013, -0.05046512559056282, -0.048157431185245514, -0.04584973677992821, -0.0435420423746109, -0.041234347969293594, -0.03892665356397629, -0.03661895915865898, -0.034311264753341675, -0.03200357034802437, -0.029695875942707062, -0.027388181537389755, -0.02508048713207245, -0.022772792726755142, -0.020465098321437836, -0.01815740391612053, -0.015849709510803223, -0.013542015105485916, -0.01123432070016861, -0.008926626294851303, -0.006618931889533997, -0.00431123748421669, -0.0020035430788993835, 0.000304151326417923, 0.0026118457317352295, 0.004919540137052536, 0.0072272345423698425, 0.009534928947687149, 0.011842623353004456, 0.014150317758321762, 0.01645801216363907, 0.018765706568956375, 0.02107340097427368, 0.023381095379590988, 0.025688789784908295, 0.0279964841902256, 0.030304178595542908, 0.032611873000860214, 0.03491956740617752, 0.03722726181149483, 0.039534956216812134, 0.04184265062212944, 0.04415034502744675, 0.04645803943276405, 0.04876573383808136, 0.051073428243398666, 0.05338112264871597, 0.05568881705403328, 0.057996511459350586]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 6.0, 9.0, 17.0, 19.0, 28.0, 60.0, 60.0, 84.0, 143.0, 191.0, 315.0, 459.0, 758.0, 1419.0, 3369.0, 10570.0, 51964.0, 366807.0, 509723.0, 79783.0, 14543.0, 4180.0, 1654.0, 861.0, 498.0, 304.0, 228.0, 153.0, 87.0, 75.0, 40.0, 34.0, 28.0, 26.0, 10.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.06146240234375, -0.05971193313598633, -0.057961463928222656, -0.056210994720458984, -0.05446052551269531, -0.05271005630493164, -0.05095958709716797, -0.0492091178894043, -0.047458648681640625, -0.04570817947387695, -0.04395771026611328, -0.04220724105834961, -0.04045677185058594, -0.038706302642822266, -0.036955833435058594, -0.03520536422729492, -0.03345489501953125, -0.03170442581176758, -0.029953956604003906, -0.028203487396240234, -0.026453018188476562, -0.02470254898071289, -0.02295207977294922, -0.021201610565185547, -0.019451141357421875, -0.017700672149658203, -0.01595020294189453, -0.01419973373413086, -0.012449264526367188, -0.010698795318603516, -0.008948326110839844, -0.007197856903076172, -0.0054473876953125, -0.003696918487548828, -0.0019464492797851562, -0.00019598007202148438, 0.0015544891357421875, 0.0033049583435058594, 0.005055427551269531, 0.006805896759033203, 0.008556365966796875, 0.010306835174560547, 0.012057304382324219, 0.01380777359008789, 0.015558242797851562, 0.017308712005615234, 0.019059181213378906, 0.020809650421142578, 0.02256011962890625, 0.024310588836669922, 0.026061058044433594, 0.027811527252197266, 0.029561996459960938, 0.03131246566772461, 0.03306293487548828, 0.03481340408325195, 0.036563873291015625, 0.0383143424987793, 0.04006481170654297, 0.04181528091430664, 0.04356575012207031, 0.045316219329833984, 0.047066688537597656, 0.04881715774536133, 0.050567626953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 13.0, 31.0, 56.0, 98.0, 120.0, 145.0, 133.0, 132.0, 99.0, 69.0, 53.0, 24.0, 12.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0270843505859375, -0.026269912719726562, -0.025455474853515625, -0.024641036987304688, -0.02382659912109375, -0.023012161254882812, -0.022197723388671875, -0.021383285522460938, -0.02056884765625, -0.019754409790039062, -0.018939971923828125, -0.018125534057617188, -0.01731109619140625, -0.016496658325195312, -0.015682220458984375, -0.014867782592773438, -0.0140533447265625, -0.013238906860351562, -0.012424468994140625, -0.011610031127929688, -0.01079559326171875, -0.009981155395507812, -0.009166717529296875, -0.008352279663085938, -0.007537841796875, -0.0067234039306640625, -0.005908966064453125, -0.0050945281982421875, -0.00428009033203125, -0.0034656524658203125, -0.002651214599609375, -0.0018367767333984375, -0.0010223388671875, -0.0002079010009765625, 0.000606536865234375, 0.0014209747314453125, 0.00223541259765625, 0.0030498504638671875, 0.003864288330078125, 0.0046787261962890625, 0.0054931640625, 0.0063076019287109375, 0.007122039794921875, 0.007936477661132812, 0.00875091552734375, 0.009565353393554688, 0.010379791259765625, 0.011194229125976562, 0.0120086669921875, 0.012823104858398438, 0.013637542724609375, 0.014451980590820312, 0.01526641845703125, 0.016080856323242188, 0.016895294189453125, 0.017709732055664062, 0.018524169921875, 0.019338607788085938, 0.020153045654296875, 0.020967483520507812, 0.02178192138671875, 0.022596359252929688, 0.023410797119140625, 0.024225234985351562, 0.0250396728515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 10.0, 16.0, 36.0, 25.0, 59.0, 69.0, 156.0, 242.0, 385.0, 711.0, 1270.0, 2469.0, 5126.0, 11225.0, 26599.0, 68009.0, 188620.0, 391175.0, 219380.0, 78299.0, 30159.0, 12790.0, 5767.0, 2656.0, 1453.0, 806.0, 404.0, 228.0, 142.0, 88.0, 61.0, 39.0, 26.0, 17.0, 8.0, 10.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.03533935546875, -0.03437304496765137, -0.033406734466552734, -0.0324404239654541, -0.03147411346435547, -0.030507802963256836, -0.029541492462158203, -0.02857518196105957, -0.027608871459960938, -0.026642560958862305, -0.025676250457763672, -0.02470993995666504, -0.023743629455566406, -0.022777318954467773, -0.02181100845336914, -0.020844697952270508, -0.019878387451171875, -0.018912076950073242, -0.01794576644897461, -0.016979455947875977, -0.016013145446777344, -0.015046834945678711, -0.014080524444580078, -0.013114213943481445, -0.012147903442382812, -0.01118159294128418, -0.010215282440185547, -0.009248971939086914, -0.008282661437988281, -0.0073163509368896484, -0.006350040435791016, -0.005383729934692383, -0.00441741943359375, -0.003451108932495117, -0.0024847984313964844, -0.0015184879302978516, -0.0005521774291992188, 0.00041413307189941406, 0.0013804435729980469, 0.0023467540740966797, 0.0033130645751953125, 0.004279375076293945, 0.005245685577392578, 0.006211996078491211, 0.007178306579589844, 0.008144617080688477, 0.00911092758178711, 0.010077238082885742, 0.011043548583984375, 0.012009859085083008, 0.01297616958618164, 0.013942480087280273, 0.014908790588378906, 0.01587510108947754, 0.016841411590576172, 0.017807722091674805, 0.018774032592773438, 0.01974034309387207, 0.020706653594970703, 0.021672964096069336, 0.02263927459716797, 0.0236055850982666, 0.024571895599365234, 0.025538206100463867, 0.0265045166015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 6.0, 8.0, 8.0, 15.0, 12.0, 19.0, 19.0, 24.0, 35.0, 33.0, 27.0, 53.0, 45.0, 57.0, 61.0, 65.0, 48.0, 43.0, 57.0, 54.0, 46.0, 50.0, 37.0, 28.0, 25.0, 31.0, 20.0, 17.0, 13.0, 8.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.04669189453125, -0.045441627502441406, -0.04419136047363281, -0.04294109344482422, -0.041690826416015625, -0.04044055938720703, -0.03919029235839844, -0.037940025329589844, -0.03668975830078125, -0.035439491271972656, -0.03418922424316406, -0.03293895721435547, -0.031688690185546875, -0.03043842315673828, -0.029188156127929688, -0.027937889099121094, -0.0266876220703125, -0.025437355041503906, -0.024187088012695312, -0.02293682098388672, -0.021686553955078125, -0.02043628692626953, -0.019186019897460938, -0.017935752868652344, -0.01668548583984375, -0.015435218811035156, -0.014184951782226562, -0.012934684753417969, -0.011684417724609375, -0.010434150695800781, -0.009183883666992188, -0.007933616638183594, -0.006683349609375, -0.005433082580566406, -0.0041828155517578125, -0.0029325485229492188, -0.001682281494140625, -0.00043201446533203125, 0.0008182525634765625, 0.0020685195922851562, 0.00331878662109375, 0.004569053649902344, 0.0058193206787109375, 0.007069587707519531, 0.008319854736328125, 0.009570121765136719, 0.010820388793945312, 0.012070655822753906, 0.0133209228515625, 0.014571189880371094, 0.015821456909179688, 0.01707172393798828, 0.018321990966796875, 0.01957225799560547, 0.020822525024414062, 0.022072792053222656, 0.02332305908203125, 0.024573326110839844, 0.025823593139648438, 0.02707386016845703, 0.028324127197265625, 0.02957439422607422, 0.030824661254882812, 0.032074928283691406, 0.0333251953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 17.0, 28.0, 40.0, 49.0, 75.0, 92.0, 123.0, 187.0, 252.0, 315.0, 469.0, 654.0, 1039.0, 1602.0, 2650.0, 5588.0, 14508.0, 50214.0, 295682.0, 553092.0, 84140.0, 21041.0, 7535.0, 3470.0, 1841.0, 1147.0, 782.0, 545.0, 373.0, 274.0, 195.0, 147.0, 109.0, 66.0, 60.0, 40.0, 17.0, 23.0, 10.0, 13.0, 6.0, 9.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0231170654296875, -0.022296428680419922, -0.021475791931152344, -0.020655155181884766, -0.019834518432617188, -0.01901388168334961, -0.01819324493408203, -0.017372608184814453, -0.016551971435546875, -0.015731334686279297, -0.014910697937011719, -0.01409006118774414, -0.013269424438476562, -0.012448787689208984, -0.011628150939941406, -0.010807514190673828, -0.00998687744140625, -0.009166240692138672, -0.008345603942871094, -0.007524967193603516, -0.0067043304443359375, -0.005883693695068359, -0.005063056945800781, -0.004242420196533203, -0.003421783447265625, -0.002601146697998047, -0.0017805099487304688, -0.0009598731994628906, -0.0001392364501953125, 0.0006814002990722656, 0.0015020370483398438, 0.002322673797607422, 0.003143310546875, 0.003963947296142578, 0.004784584045410156, 0.005605220794677734, 0.0064258575439453125, 0.007246494293212891, 0.008067131042480469, 0.008887767791748047, 0.009708404541015625, 0.010529041290283203, 0.011349678039550781, 0.01217031478881836, 0.012990951538085938, 0.013811588287353516, 0.014632225036621094, 0.015452861785888672, 0.01627349853515625, 0.017094135284423828, 0.017914772033691406, 0.018735408782958984, 0.019556045532226562, 0.02037668228149414, 0.02119731903076172, 0.022017955780029297, 0.022838592529296875, 0.023659229278564453, 0.02447986602783203, 0.02530050277709961, 0.026121139526367188, 0.026941776275634766, 0.027762413024902344, 0.028583049774169922, 0.0294036865234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 3.0, 8.0, 6.0, 7.0, 10.0, 8.0, 15.0, 20.0, 20.0, 31.0, 26.0, 32.0, 49.0, 66.0, 68.0, 78.0, 90.0, 100.0, 71.0, 53.0, 50.0, 44.0, 31.0, 13.0, 23.0, 19.0, 16.0, 8.0, 6.0, 5.0, 1.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.710124969482422e-05, -5.514174699783325e-05, -5.3182244300842285e-05, -5.122274160385132e-05, -4.926323890686035e-05, -4.7303736209869385e-05, -4.534423351287842e-05, -4.338473081588745e-05, -4.1425228118896484e-05, -3.946572542190552e-05, -3.750622272491455e-05, -3.5546720027923584e-05, -3.358721733093262e-05, -3.162771463394165e-05, -2.9668211936950684e-05, -2.7708709239959717e-05, -2.574920654296875e-05, -2.3789703845977783e-05, -2.1830201148986816e-05, -1.987069845199585e-05, -1.7911195755004883e-05, -1.5951693058013916e-05, -1.399219036102295e-05, -1.2032687664031982e-05, -1.0073184967041016e-05, -8.113682270050049e-06, -6.154179573059082e-06, -4.194676876068115e-06, -2.2351741790771484e-06, -2.7567148208618164e-07, 1.6838312149047852e-06, 3.643333911895752e-06, 5.602836608886719e-06, 7.5623393058776855e-06, 9.521842002868652e-06, 1.1481344699859619e-05, 1.3440847396850586e-05, 1.5400350093841553e-05, 1.735985279083252e-05, 1.9319355487823486e-05, 2.1278858184814453e-05, 2.323836088180542e-05, 2.5197863578796387e-05, 2.7157366275787354e-05, 2.911686897277832e-05, 3.107637166976929e-05, 3.3035874366760254e-05, 3.499537706375122e-05, 3.695487976074219e-05, 3.8914382457733154e-05, 4.087388515472412e-05, 4.283338785171509e-05, 4.4792890548706055e-05, 4.675239324569702e-05, 4.871189594268799e-05, 5.0671398639678955e-05, 5.263090133666992e-05, 5.459040403366089e-05, 5.6549906730651855e-05, 5.850940942764282e-05, 6.046891212463379e-05, 6.242841482162476e-05, 6.438791751861572e-05, 6.634742021560669e-05, 6.830692291259766e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 7.0, 14.0, 8.0, 30.0, 28.0, 51.0, 60.0, 134.0, 161.0, 297.0, 434.0, 896.0, 1630.0, 3514.0, 8265.0, 25757.0, 102341.0, 533220.0, 288703.0, 56140.0, 15749.0, 5603.0, 2590.0, 1230.0, 650.0, 363.0, 217.0, 141.0, 107.0, 75.0, 45.0, 25.0, 16.0, 15.0, 7.0, 10.0, 7.0, 0.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02154541015625, -0.02086782455444336, -0.02019023895263672, -0.019512653350830078, -0.018835067749023438, -0.018157482147216797, -0.017479896545410156, -0.016802310943603516, -0.016124725341796875, -0.015447139739990234, -0.014769554138183594, -0.014091968536376953, -0.013414382934570312, -0.012736797332763672, -0.012059211730957031, -0.01138162612915039, -0.01070404052734375, -0.01002645492553711, -0.009348869323730469, -0.008671283721923828, -0.007993698120117188, -0.007316112518310547, -0.006638526916503906, -0.005960941314697266, -0.005283355712890625, -0.004605770111083984, -0.003928184509277344, -0.003250598907470703, -0.0025730133056640625, -0.0018954277038574219, -0.0012178421020507812, -0.0005402565002441406, 0.0001373291015625, 0.0008149147033691406, 0.0014925003051757812, 0.002170085906982422, 0.0028476715087890625, 0.003525257110595703, 0.004202842712402344, 0.004880428314208984, 0.005558013916015625, 0.006235599517822266, 0.006913185119628906, 0.007590770721435547, 0.008268356323242188, 0.008945941925048828, 0.009623527526855469, 0.01030111312866211, 0.01097869873046875, 0.01165628433227539, 0.012333869934082031, 0.013011455535888672, 0.013689041137695312, 0.014366626739501953, 0.015044212341308594, 0.015721797943115234, 0.016399383544921875, 0.017076969146728516, 0.017754554748535156, 0.018432140350341797, 0.019109725952148438, 0.019787311553955078, 0.02046489715576172, 0.02114248275756836, 0.021820068359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 18.0, 11.0, 31.0, 32.0, 54.0, 83.0, 178.0, 185.0, 150.0, 92.0, 44.0, 29.0, 16.0, 16.0, 16.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022369384765625, -0.02149057388305664, -0.02061176300048828, -0.019732952117919922, -0.018854141235351562, -0.017975330352783203, -0.017096519470214844, -0.016217708587646484, -0.015338897705078125, -0.014460086822509766, -0.013581275939941406, -0.012702465057373047, -0.011823654174804688, -0.010944843292236328, -0.010066032409667969, -0.00918722152709961, -0.00830841064453125, -0.007429599761962891, -0.006550788879394531, -0.005671977996826172, -0.0047931671142578125, -0.003914356231689453, -0.0030355453491210938, -0.0021567344665527344, -0.001277923583984375, -0.0003991127014160156, 0.00047969818115234375, 0.0013585090637207031, 0.0022373199462890625, 0.003116130828857422, 0.003994941711425781, 0.004873752593994141, 0.0057525634765625, 0.006631374359130859, 0.007510185241699219, 0.008388996124267578, 0.009267807006835938, 0.010146617889404297, 0.011025428771972656, 0.011904239654541016, 0.012783050537109375, 0.013661861419677734, 0.014540672302246094, 0.015419483184814453, 0.016298294067382812, 0.017177104949951172, 0.01805591583251953, 0.01893472671508789, 0.01981353759765625, 0.02069234848022461, 0.02157115936279297, 0.022449970245361328, 0.023328781127929688, 0.024207592010498047, 0.025086402893066406, 0.025965213775634766, 0.026844024658203125, 0.027722835540771484, 0.028601646423339844, 0.029480457305908203, 0.030359268188476562, 0.031238079071044922, 0.03211688995361328, 0.03299570083618164, 0.03387451171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 4.0, 7.0, 17.0, 23.0, 29.0, 70.0, 87.0, 136.0, 124.0, 103.0, 113.0, 78.0, 67.0, 39.0, 26.0, 15.0, 11.0, 11.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20814645290374756, -0.20171432197093964, -0.19528217613697052, -0.1888500452041626, -0.18241789937019348, -0.17598576843738556, -0.16955362260341644, -0.16312149167060852, -0.1566893458366394, -0.15025721490383148, -0.14382506906986237, -0.13739293813705444, -0.13096079230308533, -0.1245286613702774, -0.11809651553630829, -0.11166438460350037, -0.10523224622011185, -0.09880010783672333, -0.09236796945333481, -0.08593583106994629, -0.07950369268655777, -0.07307155430316925, -0.06663942337036133, -0.06020728126168251, -0.05377514287829399, -0.04734300449490547, -0.04091086611151695, -0.03447873145341873, -0.028046591207385063, -0.021614454686641693, -0.015182316303253174, -0.008750177919864655, -0.0023180395364761353, 0.004114098381251097, 0.010546236298978329, 0.016978373751044273, 0.023410512134432793, 0.029842648655176163, 0.03627478703856468, 0.0427069254219532, 0.04913906380534172, 0.05557120218873024, 0.06200334057211876, 0.06843547523021698, 0.0748676136136055, 0.08129975199699402, 0.08773189038038254, 0.09416402876377106, 0.10059616714715958, 0.1070283055305481, 0.11346044391393661, 0.11989258229732513, 0.12632471323013306, 0.13275685906410217, 0.1391889899969101, 0.1456211358308792, 0.15205326676368713, 0.15848539769649506, 0.16491754353046417, 0.1713496744632721, 0.1777818202972412, 0.18421395123004913, 0.19064609706401825, 0.19707822799682617, 0.2035103738307953]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 14.0, 17.0, 6.0, 12.0, 20.0, 15.0, 16.0, 17.0, 22.0, 27.0, 29.0, 31.0, 37.0, 29.0, 32.0, 27.0, 26.0, 28.0, 41.0, 52.0, 36.0, 33.0, 44.0, 41.0, 36.0, 30.0, 31.0, 26.0, 37.0, 23.0, 16.0, 18.0, 14.0, 13.0, 19.0, 10.0, 13.0, 12.0, 4.0, 10.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0795784592628479, -0.07692801207304001, -0.07427756488323212, -0.07162711769342422, -0.06897667050361633, -0.06632623076438904, -0.06367578357458115, -0.061025336384773254, -0.05837488919496536, -0.05572444200515747, -0.05307399481534958, -0.050423551350831985, -0.047773104161024094, -0.0451226569712162, -0.04247221350669861, -0.03982176631689072, -0.037171319127082825, -0.03452087193727493, -0.03187042474746704, -0.029219981282949448, -0.026569534093141556, -0.023919086903333664, -0.02126864157617092, -0.01861819624900818, -0.015967749059200287, -0.01331730280071497, -0.010666856542229652, -0.008016410283744335, -0.005365964025259018, -0.0027155177667737007, -6.507150828838348e-05, 0.002585373818874359, 0.005235821008682251, 0.007886267267167568, 0.010536713525652885, 0.013187159784138203, 0.01583760604262352, 0.018488053232431412, 0.021138498559594154, 0.023788943886756897, 0.02643939107656479, 0.02908983826637268, 0.03174028545618057, 0.034390728920698166, 0.03704117611050606, 0.03969162330031395, 0.04234206676483154, 0.044992513954639435, 0.04764296114444733, 0.05029340833425522, 0.05294385552406311, 0.055594298988580704, 0.058244746178388596, 0.06089519336819649, 0.06354563683271408, 0.06619608402252197, 0.06884653121232986, 0.07149697840213776, 0.07414742559194565, 0.07679787278175354, 0.07944831252098083, 0.08209875971078873, 0.08474920690059662, 0.08739965409040451, 0.0900501012802124]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 18.0, 23.0, 46.0, 143.0, 449.0, 2142.0, 19848.0, 1727072.0, 2417803.0, 23559.0, 2468.0, 466.0, 142.0, 50.0, 30.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06475067138671875, -0.0627288818359375, -0.06070709228515625, -0.058685302734375, -0.05666351318359375, -0.0546417236328125, -0.05261993408203125, -0.05059814453125, -0.04857635498046875, -0.0465545654296875, -0.04453277587890625, -0.042510986328125, -0.04048919677734375, -0.0384674072265625, -0.03644561767578125, -0.034423828125, -0.03240203857421875, -0.0303802490234375, -0.02835845947265625, -0.026336669921875, -0.02431488037109375, -0.0222930908203125, -0.02027130126953125, -0.01824951171875, -0.01622772216796875, -0.0142059326171875, -0.01218414306640625, -0.010162353515625, -0.00814056396484375, -0.0061187744140625, -0.00409698486328125, -0.0020751953125, -5.340576171875e-05, 0.0019683837890625, 0.00399017333984375, 0.006011962890625, 0.00803375244140625, 0.0100555419921875, 0.01207733154296875, 0.01409912109375, 0.01612091064453125, 0.0181427001953125, 0.02016448974609375, 0.022186279296875, 0.02420806884765625, 0.0262298583984375, 0.02825164794921875, 0.0302734375, 0.03229522705078125, 0.0343170166015625, 0.03633880615234375, 0.038360595703125, 0.04038238525390625, 0.0424041748046875, 0.04442596435546875, 0.04644775390625, 0.04846954345703125, 0.0504913330078125, 0.05251312255859375, 0.054534912109375, 0.05655670166015625, 0.0585784912109375, 0.06060028076171875, 0.0626220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 11.0, 13.0, 31.0, 57.0, 70.0, 110.0, 120.0, 135.0, 123.0, 113.0, 82.0, 64.0, 32.0, 17.0, 13.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028228759765625, -0.027362823486328125, -0.02649688720703125, -0.025630950927734375, -0.0247650146484375, -0.023899078369140625, -0.02303314208984375, -0.022167205810546875, -0.02130126953125, -0.020435333251953125, -0.01956939697265625, -0.018703460693359375, -0.0178375244140625, -0.016971588134765625, -0.01610565185546875, -0.015239715576171875, -0.014373779296875, -0.013507843017578125, -0.01264190673828125, -0.011775970458984375, -0.0109100341796875, -0.010044097900390625, -0.00917816162109375, -0.008312225341796875, -0.0074462890625, -0.006580352783203125, -0.00571441650390625, -0.004848480224609375, -0.0039825439453125, -0.003116607666015625, -0.00225067138671875, -0.001384735107421875, -0.000518798828125, 0.000347137451171875, 0.00121307373046875, 0.002079010009765625, 0.0029449462890625, 0.003810882568359375, 0.00467681884765625, 0.005542755126953125, 0.00640869140625, 0.007274627685546875, 0.00814056396484375, 0.009006500244140625, 0.0098724365234375, 0.010738372802734375, 0.01160430908203125, 0.012470245361328125, 0.013336181640625, 0.014202117919921875, 0.01506805419921875, 0.015933990478515625, 0.0167999267578125, 0.017665863037109375, 0.01853179931640625, 0.019397735595703125, 0.020263671875, 0.021129608154296875, 0.02199554443359375, 0.022861480712890625, 0.0237274169921875, 0.024593353271484375, 0.02545928955078125, 0.026325225830078125, 0.027191162109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 7.0, 16.0, 29.0, 36.0, 43.0, 83.0, 116.0, 199.0, 337.0, 561.0, 990.0, 1851.0, 3918.0, 9570.0, 27620.0, 111859.0, 1695859.0, 2168860.0, 123908.0, 29705.0, 10101.0, 4099.0, 1925.0, 1043.0, 558.0, 357.0, 209.0, 126.0, 85.0, 61.0, 42.0, 33.0, 14.0, 8.0, 8.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.033416748046875, -0.03237342834472656, -0.031330108642578125, -0.030286788940429688, -0.02924346923828125, -0.028200149536132812, -0.027156829833984375, -0.026113510131835938, -0.0250701904296875, -0.024026870727539062, -0.022983551025390625, -0.021940231323242188, -0.02089691162109375, -0.019853591918945312, -0.018810272216796875, -0.017766952514648438, -0.0167236328125, -0.015680313110351562, -0.014636993408203125, -0.013593673706054688, -0.01255035400390625, -0.011507034301757812, -0.010463714599609375, -0.009420394897460938, -0.0083770751953125, -0.0073337554931640625, -0.006290435791015625, -0.0052471160888671875, -0.00420379638671875, -0.0031604766845703125, -0.002117156982421875, -0.0010738372802734375, -3.0517578125e-05, 0.0010128021240234375, 0.002056121826171875, 0.0030994415283203125, 0.00414276123046875, 0.0051860809326171875, 0.006229400634765625, 0.0072727203369140625, 0.0083160400390625, 0.009359359741210938, 0.010402679443359375, 0.011445999145507812, 0.01248931884765625, 0.013532638549804688, 0.014575958251953125, 0.015619277954101562, 0.01666259765625, 0.017705917358398438, 0.018749237060546875, 0.019792556762695312, 0.02083587646484375, 0.021879196166992188, 0.022922515869140625, 0.023965835571289062, 0.0250091552734375, 0.026052474975585938, 0.027095794677734375, 0.028139114379882812, 0.02918243408203125, 0.030225753784179688, 0.031269073486328125, 0.03231239318847656, 0.033355712890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 15.0, 14.0, 22.0, 30.0, 39.0, 56.0, 98.0, 146.0, 220.0, 506.0, 1075.0, 881.0, 389.0, 223.0, 106.0, 56.0, 45.0, 40.0, 18.0, 23.0, 13.0, 9.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0259246826171875, -0.02499556541442871, -0.024066448211669922, -0.023137331008911133, -0.022208213806152344, -0.021279096603393555, -0.020349979400634766, -0.019420862197875977, -0.018491744995117188, -0.0175626277923584, -0.01663351058959961, -0.01570439338684082, -0.014775276184082031, -0.013846158981323242, -0.012917041778564453, -0.011987924575805664, -0.011058807373046875, -0.010129690170288086, -0.009200572967529297, -0.008271455764770508, -0.007342338562011719, -0.00641322135925293, -0.005484104156494141, -0.0045549869537353516, -0.0036258697509765625, -0.0026967525482177734, -0.0017676353454589844, -0.0008385181427001953, 9.059906005859375e-05, 0.0010197162628173828, 0.0019488334655761719, 0.002877950668334961, 0.00380706787109375, 0.004736185073852539, 0.005665302276611328, 0.006594419479370117, 0.007523536682128906, 0.008452653884887695, 0.009381771087646484, 0.010310888290405273, 0.011240005493164062, 0.012169122695922852, 0.01309823989868164, 0.01402735710144043, 0.014956474304199219, 0.015885591506958008, 0.016814708709716797, 0.017743825912475586, 0.018672943115234375, 0.019602060317993164, 0.020531177520751953, 0.021460294723510742, 0.02238941192626953, 0.02331852912902832, 0.02424764633178711, 0.0251767635345459, 0.026105880737304688, 0.027034997940063477, 0.027964115142822266, 0.028893232345581055, 0.029822349548339844, 0.030751466751098633, 0.03168058395385742, 0.03260970115661621, 0.033538818359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 18.0, 48.0, 142.0, 330.0, 281.0, 100.0, 46.0, 18.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43314528465270996, -0.41948965191841125, -0.40583401918411255, -0.39217838644981384, -0.37852275371551514, -0.36486712098121643, -0.3512114882469177, -0.337555855512619, -0.3239002227783203, -0.3102445900440216, -0.2965889573097229, -0.2829333245754242, -0.2692776918411255, -0.2556220591068268, -0.24196642637252808, -0.22831079363822937, -0.21465517580509186, -0.20099954307079315, -0.18734391033649445, -0.17368827760219574, -0.16003264486789703, -0.14637702703475952, -0.13272139430046082, -0.11906575411558151, -0.1054101213812828, -0.0917544886469841, -0.0780988559126854, -0.06444323062896729, -0.05078759416937828, -0.03713196516036987, -0.023476332426071167, -0.009820699691772461, 0.003834933042526245, 0.01749056577682495, 0.031146196648478508, 0.044801827520132065, 0.05845746025443077, 0.07211308926343918, 0.08576872199773788, 0.09942435473203659, 0.1130799874663353, 0.1267356127500534, 0.1403912454843521, 0.15404687821865082, 0.16770251095294952, 0.18135814368724823, 0.19501377642154694, 0.20866940915584564, 0.22232504189014435, 0.23598067462444305, 0.24963630735874176, 0.2632919251918793, 0.276947557926178, 0.2906031906604767, 0.3042588233947754, 0.3179144561290741, 0.3315700888633728, 0.3452257215976715, 0.3588813543319702, 0.3725369870662689, 0.3861926198005676, 0.39984825253486633, 0.41350388526916504, 0.42715951800346375, 0.44081515073776245]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 12.0, 16.0, 17.0, 19.0, 38.0, 36.0, 33.0, 47.0, 56.0, 61.0, 41.0, 38.0, 58.0, 56.0, 53.0, 64.0, 48.0, 36.0, 41.0, 37.0, 40.0, 26.0, 28.0, 28.0, 17.0, 13.0, 7.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11802500486373901, -0.11464447528123856, -0.1112639456987381, -0.10788341611623764, -0.10450288653373718, -0.10112236440181732, -0.09774183481931686, -0.0943613052368164, -0.09098077565431595, -0.08760024607181549, -0.08421971648931503, -0.08083918690681458, -0.07745866477489471, -0.07407812774181366, -0.0706976056098938, -0.06731707602739334, -0.06393654644489288, -0.060556016862392426, -0.05717548727989197, -0.05379496142268181, -0.05041443184018135, -0.04703390225768089, -0.043653376400470734, -0.040272846817970276, -0.03689231723546982, -0.03351178765296936, -0.030131259933114052, -0.026750732213258743, -0.023370202630758286, -0.019989673048257828, -0.01660914532840252, -0.01322861760854721, -0.009848088026046753, -0.00646755937486887, -0.0030870307236909866, 0.0002934979274868965, 0.0036740265786647797, 0.007054556161165237, 0.010435083881020546, 0.013815611600875854, 0.017196141183376312, 0.02057667076587677, 0.02395719848573208, 0.027337726205587387, 0.030718255788087845, 0.0340987853705883, 0.03747931122779846, 0.04085984081029892, 0.04424037039279938, 0.047620899975299835, 0.05100142955780029, 0.05438195541501045, 0.05776248499751091, 0.06114301458001137, 0.06452354043722153, 0.06790407001972198, 0.07128459960222244, 0.0746651291847229, 0.07804565876722336, 0.08142618834972382, 0.08480671048164368, 0.08818724751472473, 0.09156776964664459, 0.09494829922914505, 0.09832882881164551]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 14.0, 11.0, 17.0, 19.0, 29.0, 40.0, 54.0, 94.0, 130.0, 176.0, 275.0, 478.0, 868.0, 2044.0, 5358.0, 18223.0, 78592.0, 359351.0, 439352.0, 107723.0, 24082.0, 6744.0, 2405.0, 1008.0, 552.0, 316.0, 171.0, 111.0, 92.0, 56.0, 55.0, 23.0, 26.0, 15.0, 19.0, 6.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.06866455078125, -0.0666508674621582, -0.0646371841430664, -0.06262350082397461, -0.06060981750488281, -0.058596134185791016, -0.05658245086669922, -0.05456876754760742, -0.052555084228515625, -0.05054140090942383, -0.04852771759033203, -0.046514034271240234, -0.04450035095214844, -0.04248666763305664, -0.040472984313964844, -0.03845930099487305, -0.03644561767578125, -0.03443193435668945, -0.032418251037597656, -0.03040456771850586, -0.028390884399414062, -0.026377201080322266, -0.02436351776123047, -0.022349834442138672, -0.020336151123046875, -0.018322467803955078, -0.01630878448486328, -0.014295101165771484, -0.012281417846679688, -0.01026773452758789, -0.008254051208496094, -0.006240367889404297, -0.0042266845703125, -0.002213001251220703, -0.00019931793212890625, 0.0018143653869628906, 0.0038280487060546875, 0.005841732025146484, 0.007855415344238281, 0.009869098663330078, 0.011882781982421875, 0.013896465301513672, 0.01591014862060547, 0.017923831939697266, 0.019937515258789062, 0.02195119857788086, 0.023964881896972656, 0.025978565216064453, 0.02799224853515625, 0.030005931854248047, 0.032019615173339844, 0.03403329849243164, 0.03604698181152344, 0.038060665130615234, 0.04007434844970703, 0.04208803176879883, 0.044101715087890625, 0.04611539840698242, 0.04812908172607422, 0.050142765045166016, 0.05215644836425781, 0.05417013168334961, 0.056183815002441406, 0.0581974983215332, 0.060211181640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 14.0, 16.0, 30.0, 42.0, 80.0, 87.0, 111.0, 132.0, 116.0, 91.0, 79.0, 75.0, 43.0, 31.0, 25.0, 17.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0297393798828125, -0.028888225555419922, -0.028037071228027344, -0.027185916900634766, -0.026334762573242188, -0.02548360824584961, -0.02463245391845703, -0.023781299591064453, -0.022930145263671875, -0.022078990936279297, -0.02122783660888672, -0.02037668228149414, -0.019525527954101562, -0.018674373626708984, -0.017823219299316406, -0.016972064971923828, -0.01612091064453125, -0.015269756317138672, -0.014418601989746094, -0.013567447662353516, -0.012716293334960938, -0.01186513900756836, -0.011013984680175781, -0.010162830352783203, -0.009311676025390625, -0.008460521697998047, -0.007609367370605469, -0.006758213043212891, -0.0059070587158203125, -0.005055904388427734, -0.004204750061035156, -0.003353595733642578, -0.00250244140625, -0.0016512870788574219, -0.0008001327514648438, 5.1021575927734375e-05, 0.0009021759033203125, 0.0017533302307128906, 0.0026044845581054688, 0.003455638885498047, 0.004306793212890625, 0.005157947540283203, 0.006009101867675781, 0.006860256195068359, 0.0077114105224609375, 0.008562564849853516, 0.009413719177246094, 0.010264873504638672, 0.01111602783203125, 0.011967182159423828, 0.012818336486816406, 0.013669490814208984, 0.014520645141601562, 0.01537179946899414, 0.01622295379638672, 0.017074108123779297, 0.017925262451171875, 0.018776416778564453, 0.01962757110595703, 0.02047872543334961, 0.021329879760742188, 0.022181034088134766, 0.023032188415527344, 0.023883342742919922, 0.0247344970703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 17.0, 16.0, 37.0, 59.0, 113.0, 191.0, 422.0, 852.0, 2223.0, 5994.0, 19420.0, 70924.0, 276770.0, 464305.0, 150406.0, 39130.0, 11174.0, 3801.0, 1454.0, 589.0, 305.0, 143.0, 71.0, 47.0, 33.0, 14.0, 12.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059234619140625, -0.05734062194824219, -0.055446624755859375, -0.05355262756347656, -0.05165863037109375, -0.04976463317871094, -0.047870635986328125, -0.04597663879394531, -0.0440826416015625, -0.04218864440917969, -0.040294647216796875, -0.03840065002441406, -0.03650665283203125, -0.03461265563964844, -0.032718658447265625, -0.030824661254882812, -0.0289306640625, -0.027036666870117188, -0.025142669677734375, -0.023248672485351562, -0.02135467529296875, -0.019460678100585938, -0.017566680908203125, -0.015672683715820312, -0.0137786865234375, -0.011884689331054688, -0.009990692138671875, -0.008096694946289062, -0.00620269775390625, -0.0043087005615234375, -0.002414703369140625, -0.0005207061767578125, 0.001373291015625, 0.0032672882080078125, 0.005161285400390625, 0.0070552825927734375, 0.00894927978515625, 0.010843276977539062, 0.012737274169921875, 0.014631271362304688, 0.0165252685546875, 0.018419265747070312, 0.020313262939453125, 0.022207260131835938, 0.02410125732421875, 0.025995254516601562, 0.027889251708984375, 0.029783248901367188, 0.03167724609375, 0.03357124328613281, 0.035465240478515625, 0.03735923767089844, 0.03925323486328125, 0.04114723205566406, 0.043041229248046875, 0.04493522644042969, 0.0468292236328125, 0.04872322082519531, 0.050617218017578125, 0.05251121520996094, 0.05440521240234375, 0.05629920959472656, 0.058193206787109375, 0.06008720397949219, 0.061981201171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 13.0, 12.0, 25.0, 27.0, 46.0, 42.0, 58.0, 47.0, 47.0, 56.0, 47.0, 48.0, 57.0, 51.0, 55.0, 41.0, 36.0, 56.0, 32.0, 29.0, 13.0, 11.0, 14.0, 15.0, 15.0, 9.0, 11.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04876708984375, -0.04725074768066406, -0.045734405517578125, -0.04421806335449219, -0.04270172119140625, -0.04118537902832031, -0.039669036865234375, -0.03815269470214844, -0.0366363525390625, -0.03512001037597656, -0.033603668212890625, -0.03208732604980469, -0.03057098388671875, -0.029054641723632812, -0.027538299560546875, -0.026021957397460938, -0.024505615234375, -0.022989273071289062, -0.021472930908203125, -0.019956588745117188, -0.01844024658203125, -0.016923904418945312, -0.015407562255859375, -0.013891220092773438, -0.0123748779296875, -0.010858535766601562, -0.009342193603515625, -0.007825851440429688, -0.00630950927734375, -0.0047931671142578125, -0.003276824951171875, -0.0017604827880859375, -0.000244140625, 0.0012722015380859375, 0.002788543701171875, 0.0043048858642578125, 0.00582122802734375, 0.0073375701904296875, 0.008853912353515625, 0.010370254516601562, 0.0118865966796875, 0.013402938842773438, 0.014919281005859375, 0.016435623168945312, 0.01795196533203125, 0.019468307495117188, 0.020984649658203125, 0.022500991821289062, 0.024017333984375, 0.025533676147460938, 0.027050018310546875, 0.028566360473632812, 0.03008270263671875, 0.03159904479980469, 0.033115386962890625, 0.03463172912597656, 0.0361480712890625, 0.03766441345214844, 0.039180755615234375, 0.04069709777832031, 0.04221343994140625, 0.04372978210449219, 0.045246124267578125, 0.04676246643066406, 0.04827880859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 2.0, 9.0, 3.0, 17.0, 18.0, 19.0, 29.0, 52.0, 75.0, 147.0, 198.0, 357.0, 621.0, 980.0, 1716.0, 3132.0, 5579.0, 10417.0, 20778.0, 44232.0, 109161.0, 307042.0, 331008.0, 118925.0, 47485.0, 21831.0, 11066.0, 5892.0, 3199.0, 1793.0, 1045.0, 636.0, 424.0, 259.0, 138.0, 87.0, 59.0, 39.0, 26.0, 13.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.02197265625, -0.021363019943237305, -0.02075338363647461, -0.020143747329711914, -0.01953411102294922, -0.018924474716186523, -0.018314838409423828, -0.017705202102661133, -0.017095565795898438, -0.016485929489135742, -0.015876293182373047, -0.015266656875610352, -0.014657020568847656, -0.014047384262084961, -0.013437747955322266, -0.01282811164855957, -0.012218475341796875, -0.01160883903503418, -0.010999202728271484, -0.010389566421508789, -0.009779930114746094, -0.009170293807983398, -0.008560657501220703, -0.007951021194458008, -0.0073413848876953125, -0.006731748580932617, -0.006122112274169922, -0.0055124759674072266, -0.004902839660644531, -0.004293203353881836, -0.0036835670471191406, -0.0030739307403564453, -0.00246429443359375, -0.0018546581268310547, -0.0012450218200683594, -0.0006353855133056641, -2.574920654296875e-05, 0.0005838871002197266, 0.0011935234069824219, 0.0018031597137451172, 0.0024127960205078125, 0.003022432327270508, 0.003632068634033203, 0.0042417049407958984, 0.004851341247558594, 0.005460977554321289, 0.006070613861083984, 0.00668025016784668, 0.007289886474609375, 0.00789952278137207, 0.008509159088134766, 0.009118795394897461, 0.009728431701660156, 0.010338068008422852, 0.010947704315185547, 0.011557340621948242, 0.012166976928710938, 0.012776613235473633, 0.013386249542236328, 0.013995885848999023, 0.014605522155761719, 0.015215158462524414, 0.01582479476928711, 0.016434431076049805, 0.0170440673828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 20.0, 15.0, 20.0, 29.0, 33.0, 25.0, 52.0, 50.0, 68.0, 90.0, 69.0, 77.0, 72.0, 57.0, 54.0, 56.0, 42.0, 21.0, 33.0, 16.0, 23.0, 15.0, 15.0, 7.0, 7.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.5344775319099426e-05, -5.352869629859924e-05, -5.171261727809906e-05, -4.989653825759888e-05, -4.8080459237098694e-05, -4.626438021659851e-05, -4.444830119609833e-05, -4.2632222175598145e-05, -4.081614315509796e-05, -3.900006413459778e-05, -3.7183985114097595e-05, -3.536790609359741e-05, -3.355182707309723e-05, -3.1735748052597046e-05, -2.9919669032096863e-05, -2.810359001159668e-05, -2.6287510991096497e-05, -2.4471431970596313e-05, -2.265535295009613e-05, -2.0839273929595947e-05, -1.9023194909095764e-05, -1.720711588859558e-05, -1.5391036868095398e-05, -1.3574957847595215e-05, -1.1758878827095032e-05, -9.942799806594849e-06, -8.126720786094666e-06, -6.310641765594482e-06, -4.494562745094299e-06, -2.678483724594116e-06, -8.624047040939331e-07, 9.5367431640625e-07, 2.769753336906433e-06, 4.585832357406616e-06, 6.401911377906799e-06, 8.217990398406982e-06, 1.0034069418907166e-05, 1.1850148439407349e-05, 1.3666227459907532e-05, 1.5482306480407715e-05, 1.7298385500907898e-05, 1.911446452140808e-05, 2.0930543541908264e-05, 2.2746622562408447e-05, 2.456270158290863e-05, 2.6378780603408813e-05, 2.8194859623908997e-05, 3.001093864440918e-05, 3.182701766490936e-05, 3.3643096685409546e-05, 3.545917570590973e-05, 3.727525472640991e-05, 3.9091333746910095e-05, 4.090741276741028e-05, 4.272349178791046e-05, 4.4539570808410645e-05, 4.635564982891083e-05, 4.817172884941101e-05, 4.9987807869911194e-05, 5.180388689041138e-05, 5.361996591091156e-05, 5.543604493141174e-05, 5.7252123951911926e-05, 5.906820297241211e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 14.0, 10.0, 25.0, 28.0, 35.0, 95.0, 181.0, 285.0, 611.0, 1250.0, 2870.0, 6960.0, 17448.0, 49284.0, 189296.0, 524992.0, 178867.0, 47147.0, 16904.0, 6743.0, 2945.0, 1267.0, 616.0, 292.0, 167.0, 81.0, 42.0, 43.0, 15.0, 11.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.025797367095947266, -0.02492237091064453, -0.024047374725341797, -0.023172378540039062, -0.022297382354736328, -0.021422386169433594, -0.02054738998413086, -0.019672393798828125, -0.01879739761352539, -0.017922401428222656, -0.017047405242919922, -0.016172409057617188, -0.015297412872314453, -0.014422416687011719, -0.013547420501708984, -0.01267242431640625, -0.011797428131103516, -0.010922431945800781, -0.010047435760498047, -0.009172439575195312, -0.008297443389892578, -0.007422447204589844, -0.006547451019287109, -0.005672454833984375, -0.004797458648681641, -0.003922462463378906, -0.003047466278076172, -0.0021724700927734375, -0.0012974739074707031, -0.00042247772216796875, 0.0004525184631347656, 0.0013275146484375, 0.0022025108337402344, 0.0030775070190429688, 0.003952503204345703, 0.0048274993896484375, 0.005702495574951172, 0.006577491760253906, 0.007452487945556641, 0.008327484130859375, 0.00920248031616211, 0.010077476501464844, 0.010952472686767578, 0.011827468872070312, 0.012702465057373047, 0.013577461242675781, 0.014452457427978516, 0.01532745361328125, 0.016202449798583984, 0.01707744598388672, 0.017952442169189453, 0.018827438354492188, 0.019702434539794922, 0.020577430725097656, 0.02145242691040039, 0.022327423095703125, 0.02320241928100586, 0.024077415466308594, 0.024952411651611328, 0.025827407836914062, 0.026702404022216797, 0.02757740020751953, 0.028452396392822266, 0.029327392578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 4.0, 2.0, 9.0, 5.0, 12.0, 11.0, 15.0, 14.0, 22.0, 23.0, 32.0, 38.0, 50.0, 69.0, 88.0, 134.0, 102.0, 85.0, 71.0, 62.0, 36.0, 20.0, 33.0, 10.0, 11.0, 12.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025238037109375, -0.024384021759033203, -0.023530006408691406, -0.02267599105834961, -0.021821975708007812, -0.020967960357666016, -0.02011394500732422, -0.019259929656982422, -0.018405914306640625, -0.017551898956298828, -0.01669788360595703, -0.015843868255615234, -0.014989852905273438, -0.01413583755493164, -0.013281822204589844, -0.012427806854248047, -0.01157379150390625, -0.010719776153564453, -0.009865760803222656, -0.00901174545288086, -0.008157730102539062, -0.007303714752197266, -0.006449699401855469, -0.005595684051513672, -0.004741668701171875, -0.003887653350830078, -0.0030336380004882812, -0.0021796226501464844, -0.0013256072998046875, -0.0004715919494628906, 0.00038242340087890625, 0.0012364387512207031, 0.0020904541015625, 0.002944469451904297, 0.0037984848022460938, 0.004652500152587891, 0.0055065155029296875, 0.006360530853271484, 0.007214546203613281, 0.008068561553955078, 0.008922576904296875, 0.009776592254638672, 0.010630607604980469, 0.011484622955322266, 0.012338638305664062, 0.01319265365600586, 0.014046669006347656, 0.014900684356689453, 0.01575469970703125, 0.016608715057373047, 0.017462730407714844, 0.01831674575805664, 0.019170761108398438, 0.020024776458740234, 0.02087879180908203, 0.021732807159423828, 0.022586822509765625, 0.023440837860107422, 0.02429485321044922, 0.025148868560791016, 0.026002883911132812, 0.02685689926147461, 0.027710914611816406, 0.028564929962158203, 0.0294189453125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 14.0, 12.0, 24.0, 40.0, 55.0, 72.0, 74.0, 90.0, 110.0, 86.0, 101.0, 82.0, 66.0, 48.0, 30.0, 22.0, 20.0, 15.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2896897792816162, -0.28223860263824463, -0.27478742599487305, -0.2673362195491791, -0.2598850429058075, -0.2524338662624359, -0.24498268961906433, -0.23753151297569275, -0.23008032143115997, -0.2226291447877884, -0.21517795324325562, -0.20772677659988403, -0.20027559995651245, -0.19282440841197968, -0.1853732317686081, -0.17792204022407532, -0.17047086358070374, -0.16301968693733215, -0.15556849539279938, -0.1481173187494278, -0.14066612720489502, -0.13321495056152344, -0.12576377391815186, -0.11831258982419968, -0.1108614057302475, -0.10341022163629532, -0.09595903754234314, -0.08850786089897156, -0.08105667680501938, -0.0736054927110672, -0.06615431606769562, -0.05870313197374344, -0.051251962780952454, -0.043800778687000275, -0.036349598318338394, -0.028898416087031364, -0.021447233855724335, -0.013996049761772156, -0.006544869393110275, 0.0009063109755516052, 0.008357495069503784, 0.015808677300810814, 0.023259859532117844, 0.030711041763424873, 0.0381622239947319, 0.04561340808868408, 0.05306458845734596, 0.06051576882600784, 0.06796695291996002, 0.0754181370139122, 0.08286932110786438, 0.09032049775123596, 0.09777168184518814, 0.10522286593914032, 0.1126740425825119, 0.12012522667646408, 0.12757641077041626, 0.13502758741378784, 0.14247877895832062, 0.1499299556016922, 0.15738114714622498, 0.16483232378959656, 0.17228350043296814, 0.17973467707633972, 0.1871858686208725]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 2.0, 14.0, 13.0, 19.0, 8.0, 21.0, 25.0, 23.0, 21.0, 23.0, 24.0, 40.0, 30.0, 27.0, 43.0, 45.0, 57.0, 53.0, 51.0, 44.0, 34.0, 51.0, 49.0, 34.0, 46.0, 28.0, 24.0, 19.0, 24.0, 16.0, 12.0, 12.0, 13.0, 14.0, 6.0, 9.0, 9.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12698519229888916, -0.1231943741440773, -0.11940354853868484, -0.11561273038387299, -0.11182190477848053, -0.10803108662366867, -0.10424026846885681, -0.10044944286346436, -0.0966586247086525, -0.09286780655384064, -0.08907698094844818, -0.08528616279363632, -0.08149534463882446, -0.077704519033432, -0.07391370087862015, -0.07012288272380829, -0.06633205711841583, -0.06254123896360397, -0.05875041335821152, -0.05495959520339966, -0.0511687733232975, -0.04737795144319534, -0.043587133288383484, -0.039796311408281326, -0.03600548952817917, -0.03221466764807701, -0.028423847630620003, -0.024633027613162994, -0.020842205733060837, -0.01705138385295868, -0.01326056383550167, -0.009469743818044662, -0.005678921937942505, -0.001888100989162922, 0.001902719959616661, 0.005693540908396244, 0.009484361857175827, 0.013275183737277985, 0.017066003754734993, 0.020856823772192, 0.02464764565229416, 0.028438467532396317, 0.032229289412498474, 0.03602010756731033, 0.03981092944741249, 0.04360175132751465, 0.04739256948232651, 0.051183391362428665, 0.05497421324253082, 0.05876503512263298, 0.06255585700273514, 0.066346675157547, 0.07013750076293945, 0.07392831891775131, 0.07771913707256317, 0.08150996267795563, 0.08530078083276749, 0.08909159898757935, 0.0928824245929718, 0.09667324274778366, 0.10046406090259552, 0.10425488650798798, 0.10804570466279984, 0.1118365228176117, 0.11562734842300415]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 10.0, 22.0, 31.0, 56.0, 124.0, 292.0, 701.0, 2261.0, 7585.0, 31930.0, 279712.0, 3441317.0, 378832.0, 38905.0, 8709.0, 2338.0, 831.0, 307.0, 145.0, 68.0, 35.0, 19.0, 14.0, 5.0, 4.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037445068359375, -0.036034584045410156, -0.03462409973144531, -0.03321361541748047, -0.031803131103515625, -0.03039264678955078, -0.028982162475585938, -0.027571678161621094, -0.02616119384765625, -0.024750709533691406, -0.023340225219726562, -0.02192974090576172, -0.020519256591796875, -0.01910877227783203, -0.017698287963867188, -0.016287803649902344, -0.0148773193359375, -0.013466835021972656, -0.012056350708007812, -0.010645866394042969, -0.009235382080078125, -0.007824897766113281, -0.0064144134521484375, -0.005003929138183594, -0.00359344482421875, -0.0021829605102539062, -0.0007724761962890625, 0.0006380081176757812, 0.002048492431640625, 0.0034589767456054688, 0.0048694610595703125, 0.006279945373535156, 0.0076904296875, 0.009100914001464844, 0.010511398315429688, 0.011921882629394531, 0.013332366943359375, 0.014742851257324219, 0.016153335571289062, 0.017563819885253906, 0.01897430419921875, 0.020384788513183594, 0.021795272827148438, 0.02320575714111328, 0.024616241455078125, 0.02602672576904297, 0.027437210083007812, 0.028847694396972656, 0.0302581787109375, 0.031668663024902344, 0.03307914733886719, 0.03448963165283203, 0.035900115966796875, 0.03731060028076172, 0.03872108459472656, 0.040131568908691406, 0.04154205322265625, 0.042952537536621094, 0.04436302185058594, 0.04577350616455078, 0.047183990478515625, 0.04859447479248047, 0.05000495910644531, 0.051415443420410156, 0.052825927734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 8.0, 24.0, 29.0, 56.0, 55.0, 76.0, 112.0, 129.0, 119.0, 90.0, 95.0, 71.0, 39.0, 33.0, 23.0, 19.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029052734375, -0.028144121170043945, -0.02723550796508789, -0.026326894760131836, -0.02541828155517578, -0.024509668350219727, -0.023601055145263672, -0.022692441940307617, -0.021783828735351562, -0.020875215530395508, -0.019966602325439453, -0.0190579891204834, -0.018149375915527344, -0.01724076271057129, -0.016332149505615234, -0.01542353630065918, -0.014514923095703125, -0.01360630989074707, -0.012697696685791016, -0.011789083480834961, -0.010880470275878906, -0.009971857070922852, -0.009063243865966797, -0.008154630661010742, -0.0072460174560546875, -0.006337404251098633, -0.005428791046142578, -0.0045201778411865234, -0.0036115646362304688, -0.002702951431274414, -0.0017943382263183594, -0.0008857250213623047, 2.288818359375e-05, 0.0009315013885498047, 0.0018401145935058594, 0.002748727798461914, 0.0036573410034179688, 0.0045659542083740234, 0.005474567413330078, 0.006383180618286133, 0.0072917938232421875, 0.008200407028198242, 0.009109020233154297, 0.010017633438110352, 0.010926246643066406, 0.011834859848022461, 0.012743473052978516, 0.01365208625793457, 0.014560699462890625, 0.01546931266784668, 0.016377925872802734, 0.01728653907775879, 0.018195152282714844, 0.0191037654876709, 0.020012378692626953, 0.020920991897583008, 0.021829605102539062, 0.022738218307495117, 0.023646831512451172, 0.024555444717407227, 0.02546405792236328, 0.026372671127319336, 0.02728128433227539, 0.028189897537231445, 0.0290985107421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 11.0, 12.0, 27.0, 39.0, 57.0, 71.0, 98.0, 183.0, 341.0, 550.0, 1068.0, 2339.0, 6351.0, 21319.0, 104694.0, 2157398.0, 1772821.0, 96394.0, 19820.0, 5961.0, 2292.0, 1032.0, 548.0, 310.0, 201.0, 121.0, 91.0, 38.0, 44.0, 19.0, 15.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05352783203125, -0.05190467834472656, -0.050281524658203125, -0.04865837097167969, -0.04703521728515625, -0.04541206359863281, -0.043788909912109375, -0.04216575622558594, -0.0405426025390625, -0.03891944885253906, -0.037296295166015625, -0.03567314147949219, -0.03404998779296875, -0.03242683410644531, -0.030803680419921875, -0.029180526733398438, -0.027557373046875, -0.025934219360351562, -0.024311065673828125, -0.022687911987304688, -0.02106475830078125, -0.019441604614257812, -0.017818450927734375, -0.016195297241210938, -0.0145721435546875, -0.012948989868164062, -0.011325836181640625, -0.009702682495117188, -0.00807952880859375, -0.0064563751220703125, -0.004833221435546875, -0.0032100677490234375, -0.0015869140625, 3.62396240234375e-05, 0.001659393310546875, 0.0032825469970703125, 0.00490570068359375, 0.0065288543701171875, 0.008152008056640625, 0.009775161743164062, 0.0113983154296875, 0.013021469116210938, 0.014644622802734375, 0.016267776489257812, 0.01789093017578125, 0.019514083862304688, 0.021137237548828125, 0.022760391235351562, 0.024383544921875, 0.026006698608398438, 0.027629852294921875, 0.029253005981445312, 0.03087615966796875, 0.03249931335449219, 0.034122467041015625, 0.03574562072753906, 0.0373687744140625, 0.03899192810058594, 0.040615081787109375, 0.04223823547363281, 0.04386138916015625, 0.04548454284667969, 0.047107696533203125, 0.04873085021972656, 0.05035400390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 4.0, 6.0, 6.0, 14.0, 15.0, 19.0, 36.0, 37.0, 58.0, 89.0, 129.0, 202.0, 399.0, 834.0, 887.0, 547.0, 235.0, 179.0, 98.0, 68.0, 53.0, 45.0, 20.0, 21.0, 13.0, 13.0, 11.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.024083852767944336, -0.022944927215576172, -0.021806001663208008, -0.020667076110839844, -0.01952815055847168, -0.018389225006103516, -0.01725029945373535, -0.016111373901367188, -0.014972448348999023, -0.01383352279663086, -0.012694597244262695, -0.011555671691894531, -0.010416746139526367, -0.009277820587158203, -0.008138895034790039, -0.006999969482421875, -0.005861043930053711, -0.004722118377685547, -0.003583192825317383, -0.0024442672729492188, -0.0013053417205810547, -0.00016641616821289062, 0.0009725093841552734, 0.0021114349365234375, 0.0032503604888916016, 0.004389286041259766, 0.00552821159362793, 0.006667137145996094, 0.007806062698364258, 0.008944988250732422, 0.010083913803100586, 0.01122283935546875, 0.012361764907836914, 0.013500690460205078, 0.014639616012573242, 0.015778541564941406, 0.01691746711730957, 0.018056392669677734, 0.0191953182220459, 0.020334243774414062, 0.021473169326782227, 0.02261209487915039, 0.023751020431518555, 0.02488994598388672, 0.026028871536254883, 0.027167797088623047, 0.02830672264099121, 0.029445648193359375, 0.03058457374572754, 0.0317234992980957, 0.03286242485046387, 0.03400135040283203, 0.035140275955200195, 0.03627920150756836, 0.03741812705993652, 0.03855705261230469, 0.03969597816467285, 0.040834903717041016, 0.04197382926940918, 0.043112754821777344, 0.04425168037414551, 0.04539060592651367, 0.046529531478881836, 0.04766845703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 11.0, 13.0, 39.0, 86.0, 142.0, 222.0, 218.0, 124.0, 57.0, 37.0, 20.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5880122184753418, -0.5751349329948425, -0.5622576475143433, -0.549380362033844, -0.5365030765533447, -0.5236257910728455, -0.5107485055923462, -0.4978712499141693, -0.48499396443367004, -0.4721166789531708, -0.4592393934726715, -0.44636210799217224, -0.43348485231399536, -0.4206075668334961, -0.4077302813529968, -0.39485299587249756, -0.3819757103919983, -0.369098424911499, -0.35622113943099976, -0.3433438539505005, -0.3304665684700012, -0.31758928298950195, -0.3047120273113251, -0.2918347418308258, -0.27895745635032654, -0.26608017086982727, -0.253202885389328, -0.24032561480998993, -0.22744832932949066, -0.2145710438489914, -0.20169377326965332, -0.18881648778915405, -0.17593920230865479, -0.16306191682815552, -0.15018463134765625, -0.13730736076831818, -0.12443007528781891, -0.11155278980731964, -0.09867551177740097, -0.0857982337474823, -0.07292094826698303, -0.06004366651177406, -0.047166384756565094, -0.034289103001356125, -0.021411821246147156, -0.008534535765647888, 0.0043427422642707825, 0.017220020294189453, 0.03009730577468872, 0.04297458752989769, 0.05585186928510666, 0.06872914731502533, 0.0816064327955246, 0.09448371827602386, 0.10736099630594254, 0.1202382743358612, 0.13311555981636047, 0.14599284529685974, 0.158870130777359, 0.17174740135669708, 0.18462468683719635, 0.19750197231769562, 0.2103792428970337, 0.22325652837753296, 0.23613381385803223]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 12.0, 18.0, 18.0, 24.0, 20.0, 32.0, 35.0, 30.0, 37.0, 44.0, 32.0, 47.0, 39.0, 46.0, 47.0, 49.0, 39.0, 55.0, 44.0, 38.0, 37.0, 30.0, 23.0, 25.0, 27.0, 26.0, 20.0, 13.0, 13.0, 5.0, 11.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.14956510066986084, -0.1455327719449997, -0.14150044322013855, -0.1374681144952774, -0.13343578577041626, -0.12940345704555511, -0.12537112832069397, -0.12133880704641342, -0.11730647832155228, -0.11327414959669113, -0.10924182087182999, -0.10520949214696884, -0.1011771708726883, -0.09714484214782715, -0.093112513422966, -0.08908018469810486, -0.08504785597324371, -0.08101552724838257, -0.07698319852352142, -0.07295086979866028, -0.06891854107379913, -0.06488621234893799, -0.06085389107465744, -0.056821562349796295, -0.05278923362493515, -0.048756904900074005, -0.04472457617521286, -0.040692251175642014, -0.03665992245078087, -0.032627593725919724, -0.028595266863703728, -0.024562940001487732, -0.020530611276626587, -0.016498282551765442, -0.012465955689549446, -0.008433627896010876, -0.004401300102472305, -0.0003689713776111603, 0.0036633554846048355, 0.007695682346820831, 0.011728011071681976, 0.01576033979654312, 0.019792666658759117, 0.023824993520975113, 0.027857322245836258, 0.0318896509706974, 0.03592197597026825, 0.039954304695129395, 0.04398663341999054, 0.048018962144851685, 0.05205129086971283, 0.056083615869283676, 0.06011594459414482, 0.06414827704429626, 0.06818059831857681, 0.07221292704343796, 0.0762452557682991, 0.08027758449316025, 0.08430991321802139, 0.08834224194288254, 0.09237456321716309, 0.09640689194202423, 0.10043922066688538, 0.10447154939174652, 0.10850387811660767]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 16.0, 15.0, 17.0, 21.0, 34.0, 43.0, 56.0, 82.0, 140.0, 189.0, 312.0, 566.0, 1001.0, 1900.0, 4430.0, 10986.0, 29467.0, 81418.0, 214833.0, 350994.0, 217962.0, 83789.0, 30119.0, 11163.0, 4460.0, 2006.0, 967.0, 600.0, 325.0, 210.0, 136.0, 82.0, 60.0, 45.0, 34.0, 22.0, 23.0, 10.0, 10.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.03670692443847656, -0.035419464111328125, -0.03413200378417969, -0.03284454345703125, -0.03155708312988281, -0.030269622802734375, -0.028982162475585938, -0.0276947021484375, -0.026407241821289062, -0.025119781494140625, -0.023832321166992188, -0.02254486083984375, -0.021257400512695312, -0.019969940185546875, -0.018682479858398438, -0.01739501953125, -0.016107559204101562, -0.014820098876953125, -0.013532638549804688, -0.01224517822265625, -0.010957717895507812, -0.009670257568359375, -0.008382797241210938, -0.0070953369140625, -0.0058078765869140625, -0.004520416259765625, -0.0032329559326171875, -0.00194549560546875, -0.0006580352783203125, 0.000629425048828125, 0.0019168853759765625, 0.003204345703125, 0.0044918060302734375, 0.005779266357421875, 0.0070667266845703125, 0.00835418701171875, 0.009641647338867188, 0.010929107666015625, 0.012216567993164062, 0.0135040283203125, 0.014791488647460938, 0.016078948974609375, 0.017366409301757812, 0.01865386962890625, 0.019941329956054688, 0.021228790283203125, 0.022516250610351562, 0.0238037109375, 0.025091171264648438, 0.026378631591796875, 0.027666091918945312, 0.02895355224609375, 0.030241012573242188, 0.031528472900390625, 0.03281593322753906, 0.0341033935546875, 0.03539085388183594, 0.036678314208984375, 0.03796577453613281, 0.03925323486328125, 0.04054069519042969, 0.041828155517578125, 0.04311561584472656, 0.044403076171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 13.0, 26.0, 22.0, 32.0, 36.0, 53.0, 57.0, 72.0, 87.0, 100.0, 87.0, 85.0, 73.0, 83.0, 51.0, 37.0, 23.0, 15.0, 17.0, 16.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.029153108596801758, -0.028292179107666016, -0.027431249618530273, -0.02657032012939453, -0.02570939064025879, -0.024848461151123047, -0.023987531661987305, -0.023126602172851562, -0.02226567268371582, -0.021404743194580078, -0.020543813705444336, -0.019682884216308594, -0.01882195472717285, -0.01796102523803711, -0.017100095748901367, -0.016239166259765625, -0.015378236770629883, -0.01451730728149414, -0.013656377792358398, -0.012795448303222656, -0.011934518814086914, -0.011073589324951172, -0.01021265983581543, -0.009351730346679688, -0.008490800857543945, -0.007629871368408203, -0.006768941879272461, -0.005908012390136719, -0.0050470829010009766, -0.004186153411865234, -0.003325223922729492, -0.00246429443359375, -0.0016033649444580078, -0.0007424354553222656, 0.00011849403381347656, 0.0009794235229492188, 0.001840353012084961, 0.002701282501220703, 0.0035622119903564453, 0.0044231414794921875, 0.00528407096862793, 0.006145000457763672, 0.007005929946899414, 0.007866859436035156, 0.008727788925170898, 0.00958871841430664, 0.010449647903442383, 0.011310577392578125, 0.012171506881713867, 0.01303243637084961, 0.013893365859985352, 0.014754295349121094, 0.015615224838256836, 0.016476154327392578, 0.01733708381652832, 0.018198013305664062, 0.019058942794799805, 0.019919872283935547, 0.02078080177307129, 0.02164173126220703, 0.022502660751342773, 0.023363590240478516, 0.024224519729614258, 0.02508544921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 7.0, 16.0, 18.0, 29.0, 47.0, 64.0, 129.0, 199.0, 315.0, 644.0, 1079.0, 2238.0, 4488.0, 9439.0, 20743.0, 47411.0, 112622.0, 251870.0, 310085.0, 163223.0, 69088.0, 29462.0, 12920.0, 6053.0, 2906.0, 1515.0, 815.0, 454.0, 247.0, 147.0, 83.0, 61.0, 38.0, 21.0, 23.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033050537109375, -0.03195667266845703, -0.030862808227539062, -0.029768943786621094, -0.028675079345703125, -0.027581214904785156, -0.026487350463867188, -0.02539348602294922, -0.02429962158203125, -0.02320575714111328, -0.022111892700195312, -0.021018028259277344, -0.019924163818359375, -0.018830299377441406, -0.017736434936523438, -0.01664257049560547, -0.0155487060546875, -0.014454841613769531, -0.013360977172851562, -0.012267112731933594, -0.011173248291015625, -0.010079383850097656, -0.008985519409179688, -0.007891654968261719, -0.00679779052734375, -0.005703926086425781, -0.0046100616455078125, -0.0035161972045898438, -0.002422332763671875, -0.0013284683227539062, -0.0002346038818359375, 0.0008592605590820312, 0.001953125, 0.0030469894409179688, 0.0041408538818359375, 0.005234718322753906, 0.006328582763671875, 0.007422447204589844, 0.008516311645507812, 0.009610176086425781, 0.01070404052734375, 0.011797904968261719, 0.012891769409179688, 0.013985633850097656, 0.015079498291015625, 0.016173362731933594, 0.017267227172851562, 0.01836109161376953, 0.0194549560546875, 0.02054882049560547, 0.021642684936523438, 0.022736549377441406, 0.023830413818359375, 0.024924278259277344, 0.026018142700195312, 0.02711200714111328, 0.02820587158203125, 0.02929973602294922, 0.030393600463867188, 0.031487464904785156, 0.032581329345703125, 0.033675193786621094, 0.03476905822753906, 0.03586292266845703, 0.036956787109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 2.0, 9.0, 17.0, 14.0, 7.0, 19.0, 17.0, 19.0, 30.0, 21.0, 33.0, 46.0, 26.0, 40.0, 45.0, 37.0, 55.0, 53.0, 40.0, 46.0, 41.0, 40.0, 30.0, 43.0, 29.0, 30.0, 25.0, 33.0, 26.0, 15.0, 21.0, 21.0, 10.0, 9.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.045989990234375, -0.044579505920410156, -0.04316902160644531, -0.04175853729248047, -0.040348052978515625, -0.03893756866455078, -0.03752708435058594, -0.036116600036621094, -0.03470611572265625, -0.033295631408691406, -0.03188514709472656, -0.03047466278076172, -0.029064178466796875, -0.02765369415283203, -0.026243209838867188, -0.024832725524902344, -0.0234222412109375, -0.022011756896972656, -0.020601272583007812, -0.01919078826904297, -0.017780303955078125, -0.01636981964111328, -0.014959335327148438, -0.013548851013183594, -0.01213836669921875, -0.010727882385253906, -0.009317398071289062, -0.007906913757324219, -0.006496429443359375, -0.005085945129394531, -0.0036754608154296875, -0.0022649765014648438, -0.0008544921875, 0.0005559921264648438, 0.0019664764404296875, 0.0033769607543945312, 0.004787445068359375, 0.006197929382324219, 0.0076084136962890625, 0.009018898010253906, 0.01042938232421875, 0.011839866638183594, 0.013250350952148438, 0.014660835266113281, 0.016071319580078125, 0.01748180389404297, 0.018892288208007812, 0.020302772521972656, 0.0217132568359375, 0.023123741149902344, 0.024534225463867188, 0.02594470977783203, 0.027355194091796875, 0.02876567840576172, 0.030176162719726562, 0.031586647033691406, 0.03299713134765625, 0.034407615661621094, 0.03581809997558594, 0.03722858428955078, 0.038639068603515625, 0.04004955291748047, 0.04146003723144531, 0.042870521545410156, 0.044281005859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 29.0, 41.0, 56.0, 94.0, 159.0, 260.0, 462.0, 786.0, 1591.0, 3137.0, 6885.0, 17812.0, 66723.0, 545574.0, 336090.0, 44133.0, 13571.0, 5499.0, 2653.0, 1292.0, 685.0, 410.0, 226.0, 126.0, 91.0, 52.0, 39.0, 21.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026702880859375, -0.02583789825439453, -0.024972915649414062, -0.024107933044433594, -0.023242950439453125, -0.022377967834472656, -0.021512985229492188, -0.02064800262451172, -0.01978302001953125, -0.01891803741455078, -0.018053054809570312, -0.017188072204589844, -0.016323089599609375, -0.015458106994628906, -0.014593124389648438, -0.013728141784667969, -0.0128631591796875, -0.011998176574707031, -0.011133193969726562, -0.010268211364746094, -0.009403228759765625, -0.008538246154785156, -0.0076732635498046875, -0.006808280944824219, -0.00594329833984375, -0.005078315734863281, -0.0042133331298828125, -0.0033483505249023438, -0.002483367919921875, -0.0016183853149414062, -0.0007534027099609375, 0.00011157989501953125, 0.0009765625, 0.0018415451049804688, 0.0027065277099609375, 0.0035715103149414062, 0.004436492919921875, 0.005301475524902344, 0.0061664581298828125, 0.007031440734863281, 0.00789642333984375, 0.008761405944824219, 0.009626388549804688, 0.010491371154785156, 0.011356353759765625, 0.012221336364746094, 0.013086318969726562, 0.013951301574707031, 0.0148162841796875, 0.01568126678466797, 0.016546249389648438, 0.017411231994628906, 0.018276214599609375, 0.019141197204589844, 0.020006179809570312, 0.02087116241455078, 0.02173614501953125, 0.02260112762451172, 0.023466110229492188, 0.024331092834472656, 0.025196075439453125, 0.026061058044433594, 0.026926040649414062, 0.02779102325439453, 0.028656005859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 12.0, 12.0, 10.0, 19.0, 24.0, 25.0, 51.0, 48.0, 59.0, 76.0, 74.0, 92.0, 75.0, 66.0, 76.0, 52.0, 38.0, 32.0, 28.0, 26.0, 22.0, 14.0, 12.0, 5.0, 2.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.731250762939453e-05, -3.596208989620209e-05, -3.4611672163009644e-05, -3.32612544298172e-05, -3.1910836696624756e-05, -3.056041896343231e-05, -2.9210001230239868e-05, -2.7859583497047424e-05, -2.650916576385498e-05, -2.5158748030662537e-05, -2.3808330297470093e-05, -2.245791256427765e-05, -2.1107494831085205e-05, -1.975707709789276e-05, -1.8406659364700317e-05, -1.7056241631507874e-05, -1.570582389831543e-05, -1.4355406165122986e-05, -1.3004988431930542e-05, -1.1654570698738098e-05, -1.0304152965545654e-05, -8.95373523235321e-06, -7.603317499160767e-06, -6.252899765968323e-06, -4.902482032775879e-06, -3.552064299583435e-06, -2.201646566390991e-06, -8.512288331985474e-07, 4.991888999938965e-07, 1.8496066331863403e-06, 3.200024366378784e-06, 4.550442099571228e-06, 5.900859832763672e-06, 7.251277565956116e-06, 8.60169529914856e-06, 9.952113032341003e-06, 1.1302530765533447e-05, 1.2652948498725891e-05, 1.4003366231918335e-05, 1.535378396511078e-05, 1.6704201698303223e-05, 1.8054619431495667e-05, 1.940503716468811e-05, 2.0755454897880554e-05, 2.2105872631072998e-05, 2.3456290364265442e-05, 2.4806708097457886e-05, 2.615712583065033e-05, 2.7507543563842773e-05, 2.8857961297035217e-05, 3.020837903022766e-05, 3.1558796763420105e-05, 3.290921449661255e-05, 3.425963222980499e-05, 3.5610049962997437e-05, 3.696046769618988e-05, 3.8310885429382324e-05, 3.966130316257477e-05, 4.101172089576721e-05, 4.2362138628959656e-05, 4.37125563621521e-05, 4.5062974095344543e-05, 4.641339182853699e-05, 4.776380956172943e-05, 4.9114227294921875e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 15.0, 14.0, 20.0, 34.0, 29.0, 59.0, 77.0, 129.0, 180.0, 295.0, 540.0, 886.0, 1654.0, 3061.0, 5963.0, 13527.0, 40880.0, 228164.0, 582591.0, 122384.0, 27140.0, 10269.0, 4742.0, 2606.0, 1338.0, 729.0, 395.0, 282.0, 174.0, 117.0, 82.0, 48.0, 33.0, 24.0, 18.0, 14.0, 3.0, 11.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.024078369140625, -0.023377180099487305, -0.02267599105834961, -0.021974802017211914, -0.02127361297607422, -0.020572423934936523, -0.019871234893798828, -0.019170045852661133, -0.018468856811523438, -0.017767667770385742, -0.017066478729248047, -0.01636528968811035, -0.015664100646972656, -0.014962911605834961, -0.014261722564697266, -0.01356053352355957, -0.012859344482421875, -0.01215815544128418, -0.011456966400146484, -0.010755777359008789, -0.010054588317871094, -0.009353399276733398, -0.008652210235595703, -0.007951021194458008, -0.0072498321533203125, -0.006548643112182617, -0.005847454071044922, -0.0051462650299072266, -0.004445075988769531, -0.003743886947631836, -0.0030426979064941406, -0.0023415088653564453, -0.00164031982421875, -0.0009391307830810547, -0.00023794174194335938, 0.00046324729919433594, 0.0011644363403320312, 0.0018656253814697266, 0.002566814422607422, 0.003268003463745117, 0.0039691925048828125, 0.004670381546020508, 0.005371570587158203, 0.0060727596282958984, 0.006773948669433594, 0.007475137710571289, 0.008176326751708984, 0.00887751579284668, 0.009578704833984375, 0.01027989387512207, 0.010981082916259766, 0.011682271957397461, 0.012383460998535156, 0.013084650039672852, 0.013785839080810547, 0.014487028121948242, 0.015188217163085938, 0.015889406204223633, 0.016590595245361328, 0.017291784286499023, 0.01799297332763672, 0.018694162368774414, 0.01939535140991211, 0.020096540451049805, 0.0207977294921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 3.0, 5.0, 9.0, 9.0, 17.0, 23.0, 24.0, 50.0, 57.0, 77.0, 127.0, 150.0, 144.0, 80.0, 58.0, 55.0, 43.0, 18.0, 13.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.0282135009765625, -0.027502775192260742, -0.026792049407958984, -0.026081323623657227, -0.02537059783935547, -0.02465987205505371, -0.023949146270751953, -0.023238420486450195, -0.022527694702148438, -0.02181696891784668, -0.021106243133544922, -0.020395517349243164, -0.019684791564941406, -0.01897406578063965, -0.01826333999633789, -0.017552614212036133, -0.016841888427734375, -0.016131162643432617, -0.01542043685913086, -0.014709711074829102, -0.013998985290527344, -0.013288259506225586, -0.012577533721923828, -0.01186680793762207, -0.011156082153320312, -0.010445356369018555, -0.009734630584716797, -0.009023904800415039, -0.008313179016113281, -0.0076024532318115234, -0.006891727447509766, -0.006181001663208008, -0.00547027587890625, -0.004759550094604492, -0.004048824310302734, -0.0033380985260009766, -0.0026273727416992188, -0.001916646957397461, -0.0012059211730957031, -0.0004951953887939453, 0.0002155303955078125, 0.0009262561798095703, 0.0016369819641113281, 0.002347707748413086, 0.0030584335327148438, 0.0037691593170166016, 0.004479885101318359, 0.005190610885620117, 0.005901336669921875, 0.006612062454223633, 0.007322788238525391, 0.008033514022827148, 0.008744239807128906, 0.009454965591430664, 0.010165691375732422, 0.01087641716003418, 0.011587142944335938, 0.012297868728637695, 0.013008594512939453, 0.013719320297241211, 0.014430046081542969, 0.015140771865844727, 0.015851497650146484, 0.016562223434448242, 0.01727294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 14.0, 14.0, 20.0, 36.0, 60.0, 126.0, 145.0, 204.0, 177.0, 102.0, 45.0, 29.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5163941979408264, -0.5038917064666748, -0.4913892447948456, -0.47888678312301636, -0.46638432145118713, -0.4538818597793579, -0.4413793683052063, -0.4288769066333771, -0.41637444496154785, -0.40387198328971863, -0.391369491815567, -0.3788670301437378, -0.36636456847190857, -0.35386210680007935, -0.34135961532592773, -0.3288571536540985, -0.3163546919822693, -0.30385223031044006, -0.29134973883628845, -0.27884727716445923, -0.26634481549263, -0.2538423538208008, -0.24133986234664917, -0.22883740067481995, -0.21633490920066833, -0.20383243262767792, -0.1913299709558487, -0.17882749438285828, -0.16632503271102905, -0.15382255613803864, -0.14132007956504822, -0.128817617893219, -0.11631515622138977, -0.10381268709897995, -0.09131021797657013, -0.07880774140357971, -0.06630527973175049, -0.05380280315876007, -0.04130033403635025, -0.02879786491394043, -0.01629539579153061, -0.003792925737798214, 0.008709544315934181, 0.02121201530098915, 0.03371448442339897, 0.04621695727109909, 0.05871942639350891, 0.07122189551591873, 0.08372436463832855, 0.09622683376073837, 0.1087293028831482, 0.12123177945613861, 0.13373424112796783, 0.14623671770095825, 0.15873917937278748, 0.1712416559457779, 0.1837441325187683, 0.19624660909175873, 0.20874907076358795, 0.22125154733657837, 0.2337540090084076, 0.246256485581398, 0.2587589621543884, 0.27126142382621765, 0.2837638854980469]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 9.0, 13.0, 14.0, 17.0, 19.0, 27.0, 31.0, 25.0, 18.0, 27.0, 31.0, 44.0, 42.0, 39.0, 46.0, 42.0, 45.0, 43.0, 47.0, 47.0, 39.0, 42.0, 36.0, 40.0, 28.0, 26.0, 31.0, 26.0, 14.0, 11.0, 17.0, 11.0, 10.0, 13.0, 3.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.14830946922302246, -0.14427319169044495, -0.14023689925670624, -0.13620062172412872, -0.13216432929039001, -0.1281280517578125, -0.12409176677465439, -0.12005548179149628, -0.11601919680833817, -0.11198291182518005, -0.10794662684202194, -0.10391034185886383, -0.09987406432628632, -0.09583777189254761, -0.09180149435997009, -0.08776520937681198, -0.08372892439365387, -0.07969263941049576, -0.07565635442733765, -0.07162006944417953, -0.06758378446102142, -0.06354750692844391, -0.0595112219452858, -0.055474936962127686, -0.051438651978969574, -0.04740236699581146, -0.04336608201265335, -0.03932980075478554, -0.035293515771627426, -0.031257230788469315, -0.027220947667956352, -0.02318466454744339, -0.01914837956428528, -0.015112095512449741, -0.011075811460614204, -0.0070395274087786674, -0.0030032433569431305, 0.001033041626214981, 0.005069324746727943, 0.009105607867240906, 0.013141892850399017, 0.01717817783355713, 0.02121446095407009, 0.025250744074583054, 0.029287029057741165, 0.03332331404089928, 0.03735959529876709, 0.0413958802819252, 0.04543216526508331, 0.049468450248241425, 0.053504735231399536, 0.05754101648926735, 0.06157730147242546, 0.06561358273029327, 0.06964986771345139, 0.0736861526966095, 0.07772243767976761, 0.08175872266292572, 0.08579500764608383, 0.08983129262924194, 0.09386757016181946, 0.09790386259555817, 0.10194014012813568, 0.10597642511129379, 0.1100127100944519]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 5.0, 11.0, 13.0, 24.0, 28.0, 35.0, 56.0, 103.0, 232.0, 428.0, 889.0, 2100.0, 5769.0, 20888.0, 118417.0, 2623106.0, 1322120.0, 76322.0, 15798.0, 4586.0, 1804.0, 761.0, 318.0, 177.0, 95.0, 63.0, 35.0, 20.0, 18.0, 7.0, 1.0, 4.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059051513671875, -0.057358741760253906, -0.05566596984863281, -0.05397319793701172, -0.052280426025390625, -0.05058765411376953, -0.04889488220214844, -0.047202110290527344, -0.04550933837890625, -0.043816566467285156, -0.04212379455566406, -0.04043102264404297, -0.038738250732421875, -0.03704547882080078, -0.03535270690917969, -0.033659934997558594, -0.0319671630859375, -0.030274391174316406, -0.028581619262695312, -0.02688884735107422, -0.025196075439453125, -0.02350330352783203, -0.021810531616210938, -0.020117759704589844, -0.01842498779296875, -0.016732215881347656, -0.015039443969726562, -0.013346672058105469, -0.011653900146484375, -0.009961128234863281, -0.008268356323242188, -0.006575584411621094, -0.0048828125, -0.0031900405883789062, -0.0014972686767578125, 0.00019550323486328125, 0.001888275146484375, 0.0035810470581054688, 0.0052738189697265625, 0.006966590881347656, 0.00865936279296875, 0.010352134704589844, 0.012044906616210938, 0.013737678527832031, 0.015430450439453125, 0.01712322235107422, 0.018815994262695312, 0.020508766174316406, 0.0222015380859375, 0.023894309997558594, 0.025587081909179688, 0.02727985382080078, 0.028972625732421875, 0.03066539764404297, 0.03235816955566406, 0.034050941467285156, 0.03574371337890625, 0.037436485290527344, 0.03912925720214844, 0.04082202911376953, 0.042514801025390625, 0.04420757293701172, 0.04590034484863281, 0.047593116760253906, 0.049285888671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 12.0, 17.0, 21.0, 29.0, 40.0, 45.0, 70.0, 69.0, 77.0, 81.0, 91.0, 94.0, 82.0, 68.0, 55.0, 36.0, 37.0, 18.0, 23.0, 8.0, 3.0, 6.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02801513671875, -0.02719402313232422, -0.026372909545898438, -0.025551795959472656, -0.024730682373046875, -0.023909568786621094, -0.023088455200195312, -0.02226734161376953, -0.02144622802734375, -0.02062511444091797, -0.019804000854492188, -0.018982887268066406, -0.018161773681640625, -0.017340660095214844, -0.016519546508789062, -0.01569843292236328, -0.0148773193359375, -0.014056205749511719, -0.013235092163085938, -0.012413978576660156, -0.011592864990234375, -0.010771751403808594, -0.009950637817382812, -0.009129524230957031, -0.00830841064453125, -0.007487297058105469, -0.0066661834716796875, -0.005845069885253906, -0.005023956298828125, -0.004202842712402344, -0.0033817291259765625, -0.0025606155395507812, -0.001739501953125, -0.0009183883666992188, -9.72747802734375e-05, 0.0007238388061523438, 0.001544952392578125, 0.0023660659790039062, 0.0031871795654296875, 0.004008293151855469, 0.00482940673828125, 0.005650520324707031, 0.0064716339111328125, 0.007292747497558594, 0.008113861083984375, 0.008934974670410156, 0.009756088256835938, 0.010577201843261719, 0.0113983154296875, 0.012219429016113281, 0.013040542602539062, 0.013861656188964844, 0.014682769775390625, 0.015503883361816406, 0.016324996948242188, 0.01714611053466797, 0.01796722412109375, 0.01878833770751953, 0.019609451293945312, 0.020430564880371094, 0.021251678466796875, 0.022072792053222656, 0.022893905639648438, 0.02371501922607422, 0.0245361328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 5.0, 14.0, 19.0, 30.0, 35.0, 42.0, 73.0, 113.0, 134.0, 255.0, 399.0, 598.0, 1029.0, 1925.0, 3359.0, 6865.0, 15380.0, 39162.0, 128171.0, 863933.0, 2760871.0, 262753.0, 65462.0, 23211.0, 9703.0, 4736.0, 2475.0, 1355.0, 750.0, 465.0, 312.0, 227.0, 135.0, 90.0, 66.0, 39.0, 32.0, 16.0, 15.0, 10.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039764404296875, -0.03860282897949219, -0.037441253662109375, -0.03627967834472656, -0.03511810302734375, -0.03395652770996094, -0.032794952392578125, -0.03163337707519531, -0.0304718017578125, -0.029310226440429688, -0.028148651123046875, -0.026987075805664062, -0.02582550048828125, -0.024663925170898438, -0.023502349853515625, -0.022340774536132812, -0.02117919921875, -0.020017623901367188, -0.018856048583984375, -0.017694473266601562, -0.01653289794921875, -0.015371322631835938, -0.014209747314453125, -0.013048171997070312, -0.0118865966796875, -0.010725021362304688, -0.009563446044921875, -0.008401870727539062, -0.00724029541015625, -0.0060787200927734375, -0.004917144775390625, -0.0037555694580078125, -0.002593994140625, -0.0014324188232421875, -0.000270843505859375, 0.0008907318115234375, 0.00205230712890625, 0.0032138824462890625, 0.004375457763671875, 0.0055370330810546875, 0.0066986083984375, 0.007860183715820312, 0.009021759033203125, 0.010183334350585938, 0.01134490966796875, 0.012506484985351562, 0.013668060302734375, 0.014829635620117188, 0.0159912109375, 0.017152786254882812, 0.018314361572265625, 0.019475936889648438, 0.02063751220703125, 0.021799087524414062, 0.022960662841796875, 0.024122238159179688, 0.0252838134765625, 0.026445388793945312, 0.027606964111328125, 0.028768539428710938, 0.02993011474609375, 0.031091690063476562, 0.032253265380859375, 0.03341484069824219, 0.034576416015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 11.0, 14.0, 21.0, 44.0, 58.0, 76.0, 108.0, 222.0, 516.0, 1096.0, 836.0, 401.0, 216.0, 139.0, 66.0, 62.0, 49.0, 30.0, 22.0, 18.0, 7.0, 12.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04449462890625, -0.04295158386230469, -0.041408538818359375, -0.03986549377441406, -0.03832244873046875, -0.03677940368652344, -0.035236358642578125, -0.03369331359863281, -0.0321502685546875, -0.030607223510742188, -0.029064178466796875, -0.027521133422851562, -0.02597808837890625, -0.024435043334960938, -0.022891998291015625, -0.021348953247070312, -0.019805908203125, -0.018262863159179688, -0.016719818115234375, -0.015176773071289062, -0.01363372802734375, -0.012090682983398438, -0.010547637939453125, -0.009004592895507812, -0.0074615478515625, -0.0059185028076171875, -0.004375457763671875, -0.0028324127197265625, -0.00128936767578125, 0.0002536773681640625, 0.001796722412109375, 0.0033397674560546875, 0.0048828125, 0.0064258575439453125, 0.007968902587890625, 0.009511947631835938, 0.01105499267578125, 0.012598037719726562, 0.014141082763671875, 0.015684127807617188, 0.0172271728515625, 0.018770217895507812, 0.020313262939453125, 0.021856307983398438, 0.02339935302734375, 0.024942398071289062, 0.026485443115234375, 0.028028488159179688, 0.029571533203125, 0.031114578247070312, 0.032657623291015625, 0.03420066833496094, 0.03574371337890625, 0.03728675842285156, 0.038829803466796875, 0.04037284851074219, 0.0419158935546875, 0.04345893859863281, 0.045001983642578125, 0.04654502868652344, 0.04808807373046875, 0.04963111877441406, 0.051174163818359375, 0.05271720886230469, 0.05426025390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 24.0, 62.0, 191.0, 293.0, 239.0, 106.0, 46.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6213767528533936, -0.5994256734848022, -0.5774745345115662, -0.5555234551429749, -0.5335723161697388, -0.5116212368011475, -0.4896700978279114, -0.46771901845932007, -0.445767879486084, -0.4238167703151703, -0.4018656611442566, -0.3799145519733429, -0.3579634428024292, -0.3360123336315155, -0.3140612244606018, -0.2921101450920105, -0.2701590359210968, -0.2482079267501831, -0.2262568175792694, -0.2043057084083557, -0.18235459923744202, -0.16040349006652832, -0.13845239579677582, -0.11650128662586212, -0.09455017745494843, -0.07259906828403473, -0.05064796283841133, -0.028696857392787933, -0.006745748221874237, 0.01520536094903946, 0.03715646266937256, 0.059107571840286255, 0.08105868101119995, 0.10300979018211365, 0.12496089935302734, 0.14691200852394104, 0.16886311769485474, 0.19081422686576843, 0.21276532113552094, 0.23471643030643463, 0.2566675543785095, 0.2786186635494232, 0.3005697727203369, 0.3225208818912506, 0.3444719910621643, 0.366423100233078, 0.3883742094039917, 0.410325288772583, 0.4322763979434967, 0.4542275071144104, 0.4761786162853241, 0.4981297254562378, 0.5200808048248291, 0.5420319437980652, 0.5639830231666565, 0.5859341621398926, 0.6078852415084839, 0.6298363208770752, 0.6517874598503113, 0.6737385392189026, 0.6956896781921387, 0.71764075756073, 0.7395918965339661, 0.7615429759025574, 0.7834941148757935]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 10.0, 10.0, 12.0, 7.0, 8.0, 17.0, 20.0, 18.0, 23.0, 26.0, 29.0, 28.0, 37.0, 37.0, 37.0, 30.0, 41.0, 52.0, 39.0, 42.0, 42.0, 42.0, 42.0, 34.0, 28.0, 39.0, 34.0, 31.0, 26.0, 31.0, 27.0, 12.0, 18.0, 17.0, 11.0, 4.0, 8.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.14839178323745728, -0.14376282691955566, -0.13913385570049286, -0.13450489938259125, -0.12987592816352844, -0.12524697184562683, -0.12061800807714462, -0.11598904430866241, -0.1113600805401802, -0.106731116771698, -0.10210215300321579, -0.09747318923473358, -0.09284423291683197, -0.08821526169776917, -0.08358630537986755, -0.07895734161138535, -0.07432837784290314, -0.06969941407442093, -0.06507045030593872, -0.06044149026274681, -0.0558125264942646, -0.051183562725782394, -0.046554602682590485, -0.041925638914108276, -0.03729667514562607, -0.03266771137714386, -0.0280387494713068, -0.023409787565469742, -0.018780823796987534, -0.014151860028505325, -0.009522898122668266, -0.004893936216831207, -0.000264972448348999, 0.004363990388810635, 0.008992953225970268, 0.013621916063129902, 0.018250878900289536, 0.022879842668771744, 0.027508804574608803, 0.03213776648044586, 0.03676673024892807, 0.04139569401741028, 0.04602465778589249, 0.050653617829084396, 0.055282581597566605, 0.05991154536604881, 0.06454050540924072, 0.06916946917772293, 0.07379843294620514, 0.07842739671468735, 0.08305636048316956, 0.08768532425165176, 0.09231428802013397, 0.09694324433803558, 0.10157220810651779, 0.106201171875, 0.11083013564348221, 0.11545909941196442, 0.12008806318044662, 0.12471702694892883, 0.12934598326683044, 0.13397495448589325, 0.13860391080379486, 0.14323288202285767, 0.14786183834075928]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 23.0, 34.0, 42.0, 54.0, 109.0, 174.0, 280.0, 537.0, 1081.0, 2207.0, 5096.0, 11764.0, 30299.0, 81432.0, 217797.0, 360910.0, 209409.0, 78045.0, 28583.0, 11410.0, 4834.0, 2117.0, 1059.0, 499.0, 278.0, 172.0, 101.0, 54.0, 38.0, 29.0, 21.0, 16.0, 10.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0457763671875, -0.04436683654785156, -0.042957305908203125, -0.04154777526855469, -0.04013824462890625, -0.03872871398925781, -0.037319183349609375, -0.03590965270996094, -0.0345001220703125, -0.03309059143066406, -0.031681060791015625, -0.030271530151367188, -0.02886199951171875, -0.027452468872070312, -0.026042938232421875, -0.024633407592773438, -0.023223876953125, -0.021814346313476562, -0.020404815673828125, -0.018995285034179688, -0.01758575439453125, -0.016176223754882812, -0.014766693115234375, -0.013357162475585938, -0.0119476318359375, -0.010538101196289062, -0.009128570556640625, -0.0077190399169921875, -0.00630950927734375, -0.0048999786376953125, -0.003490447998046875, -0.0020809173583984375, -0.00067138671875, 0.0007381439208984375, 0.002147674560546875, 0.0035572052001953125, 0.00496673583984375, 0.0063762664794921875, 0.007785797119140625, 0.009195327758789062, 0.0106048583984375, 0.012014389038085938, 0.013423919677734375, 0.014833450317382812, 0.01624298095703125, 0.017652511596679688, 0.019062042236328125, 0.020471572875976562, 0.021881103515625, 0.023290634155273438, 0.024700164794921875, 0.026109695434570312, 0.02751922607421875, 0.028928756713867188, 0.030338287353515625, 0.03174781799316406, 0.0331573486328125, 0.03456687927246094, 0.035976409912109375, 0.03738594055175781, 0.03879547119140625, 0.04020500183105469, 0.041614532470703125, 0.04302406311035156, 0.04443359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 11.0, 30.0, 22.0, 24.0, 23.0, 38.0, 50.0, 59.0, 67.0, 70.0, 81.0, 78.0, 75.0, 58.0, 69.0, 55.0, 40.0, 38.0, 22.0, 23.0, 19.0, 8.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0297393798828125, -0.028862714767456055, -0.02798604965209961, -0.027109384536743164, -0.02623271942138672, -0.025356054306030273, -0.024479389190673828, -0.023602724075317383, -0.022726058959960938, -0.021849393844604492, -0.020972728729248047, -0.0200960636138916, -0.019219398498535156, -0.01834273338317871, -0.017466068267822266, -0.01658940315246582, -0.015712738037109375, -0.01483607292175293, -0.013959407806396484, -0.013082742691040039, -0.012206077575683594, -0.011329412460327148, -0.010452747344970703, -0.009576082229614258, -0.008699417114257812, -0.007822751998901367, -0.006946086883544922, -0.0060694217681884766, -0.005192756652832031, -0.004316091537475586, -0.0034394264221191406, -0.0025627613067626953, -0.00168609619140625, -0.0008094310760498047, 6.723403930664062e-05, 0.0009438991546630859, 0.0018205642700195312, 0.0026972293853759766, 0.003573894500732422, 0.004450559616088867, 0.0053272247314453125, 0.006203889846801758, 0.007080554962158203, 0.007957220077514648, 0.008833885192871094, 0.009710550308227539, 0.010587215423583984, 0.01146388053894043, 0.012340545654296875, 0.01321721076965332, 0.014093875885009766, 0.014970541000366211, 0.015847206115722656, 0.0167238712310791, 0.017600536346435547, 0.018477201461791992, 0.019353866577148438, 0.020230531692504883, 0.021107196807861328, 0.021983861923217773, 0.02286052703857422, 0.023737192153930664, 0.02461385726928711, 0.025490522384643555, 0.0263671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 10.0, 13.0, 13.0, 27.0, 45.0, 50.0, 76.0, 148.0, 251.0, 422.0, 748.0, 1251.0, 2399.0, 4937.0, 10298.0, 23436.0, 58591.0, 161400.0, 390717.0, 243671.0, 88304.0, 33674.0, 14338.0, 6455.0, 3250.0, 1716.0, 999.0, 510.0, 316.0, 206.0, 84.0, 63.0, 49.0, 22.0, 15.0, 12.0, 10.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0494384765625, -0.04797172546386719, -0.046504974365234375, -0.04503822326660156, -0.04357147216796875, -0.04210472106933594, -0.040637969970703125, -0.03917121887207031, -0.0377044677734375, -0.03623771667480469, -0.034770965576171875, -0.03330421447753906, -0.03183746337890625, -0.030370712280273438, -0.028903961181640625, -0.027437210083007812, -0.025970458984375, -0.024503707885742188, -0.023036956787109375, -0.021570205688476562, -0.02010345458984375, -0.018636703491210938, -0.017169952392578125, -0.015703201293945312, -0.0142364501953125, -0.012769699096679688, -0.011302947998046875, -0.009836196899414062, -0.00836944580078125, -0.0069026947021484375, -0.005435943603515625, -0.0039691925048828125, -0.00250244140625, -0.0010356903076171875, 0.000431060791015625, 0.0018978118896484375, 0.00336456298828125, 0.0048313140869140625, 0.006298065185546875, 0.0077648162841796875, 0.0092315673828125, 0.010698318481445312, 0.012165069580078125, 0.013631820678710938, 0.01509857177734375, 0.016565322875976562, 0.018032073974609375, 0.019498825073242188, 0.020965576171875, 0.022432327270507812, 0.023899078369140625, 0.025365829467773438, 0.02683258056640625, 0.028299331665039062, 0.029766082763671875, 0.031232833862304688, 0.0326995849609375, 0.03416633605957031, 0.035633087158203125, 0.03709983825683594, 0.03856658935546875, 0.04003334045410156, 0.041500091552734375, 0.04296684265136719, 0.04443359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 13.0, 17.0, 23.0, 20.0, 34.0, 24.0, 24.0, 45.0, 53.0, 54.0, 73.0, 61.0, 59.0, 52.0, 50.0, 63.0, 44.0, 51.0, 28.0, 25.0, 32.0, 34.0, 25.0, 19.0, 12.0, 9.0, 9.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06756591796875, -0.06525611877441406, -0.06294631958007812, -0.06063652038574219, -0.05832672119140625, -0.05601692199707031, -0.053707122802734375, -0.05139732360839844, -0.0490875244140625, -0.04677772521972656, -0.044467926025390625, -0.04215812683105469, -0.03984832763671875, -0.03753852844238281, -0.035228729248046875, -0.03291893005371094, -0.030609130859375, -0.028299331665039062, -0.025989532470703125, -0.023679733276367188, -0.02136993408203125, -0.019060134887695312, -0.016750335693359375, -0.014440536499023438, -0.0121307373046875, -0.009820938110351562, -0.007511138916015625, -0.0052013397216796875, -0.00289154052734375, -0.0005817413330078125, 0.001728057861328125, 0.0040378570556640625, 0.00634765625, 0.008657455444335938, 0.010967254638671875, 0.013277053833007812, 0.01558685302734375, 0.017896652221679688, 0.020206451416015625, 0.022516250610351562, 0.0248260498046875, 0.027135848999023438, 0.029445648193359375, 0.03175544738769531, 0.03406524658203125, 0.03637504577636719, 0.038684844970703125, 0.04099464416503906, 0.043304443359375, 0.04561424255371094, 0.047924041748046875, 0.05023384094238281, 0.05254364013671875, 0.05485343933105469, 0.057163238525390625, 0.05947303771972656, 0.0617828369140625, 0.06409263610839844, 0.06640243530273438, 0.06871223449707031, 0.07102203369140625, 0.07333183288574219, 0.07564163208007812, 0.07795143127441406, 0.08026123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 2.0, 5.0, 12.0, 18.0, 25.0, 40.0, 50.0, 62.0, 107.0, 149.0, 199.0, 358.0, 518.0, 783.0, 1297.0, 2087.0, 3537.0, 6047.0, 11597.0, 23131.0, 57056.0, 193953.0, 472340.0, 174459.0, 53276.0, 21790.0, 10854.0, 5859.0, 3453.0, 2010.0, 1179.0, 759.0, 514.0, 312.0, 233.0, 139.0, 100.0, 72.0, 54.0, 35.0, 19.0, 20.0, 5.0, 8.0, 5.0, 5.0, 8.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.01448822021484375, -0.014041900634765625, -0.0135955810546875, -0.013149261474609375, -0.01270294189453125, -0.012256622314453125, -0.011810302734375, -0.011363983154296875, -0.01091766357421875, -0.010471343994140625, -0.0100250244140625, -0.009578704833984375, -0.00913238525390625, -0.008686065673828125, -0.00823974609375, -0.007793426513671875, -0.00734710693359375, -0.006900787353515625, -0.0064544677734375, -0.006008148193359375, -0.00556182861328125, -0.005115509033203125, -0.004669189453125, -0.004222869873046875, -0.00377655029296875, -0.003330230712890625, -0.0028839111328125, -0.002437591552734375, -0.00199127197265625, -0.001544952392578125, -0.0010986328125, -0.000652313232421875, -0.00020599365234375, 0.000240325927734375, 0.0006866455078125, 0.001132965087890625, 0.00157928466796875, 0.002025604248046875, 0.002471923828125, 0.002918243408203125, 0.00336456298828125, 0.003810882568359375, 0.0042572021484375, 0.004703521728515625, 0.00514984130859375, 0.005596160888671875, 0.00604248046875, 0.006488800048828125, 0.00693511962890625, 0.007381439208984375, 0.0078277587890625, 0.008274078369140625, 0.00872039794921875, 0.009166717529296875, 0.009613037109375, 0.010059356689453125, 0.01050567626953125, 0.010951995849609375, 0.0113983154296875, 0.011844635009765625, 0.01229095458984375, 0.012737274169921875, 0.01318359375, 0.013629913330078125, 0.01407623291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 8.0, 8.0, 5.0, 10.0, 10.0, 14.0, 16.0, 33.0, 38.0, 49.0, 52.0, 72.0, 72.0, 74.0, 78.0, 82.0, 75.0, 49.0, 57.0, 35.0, 40.0, 26.0, 12.0, 11.0, 12.0, 7.0, 10.0, 6.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.838539123535156e-05, -3.711320459842682e-05, -3.5841017961502075e-05, -3.456883132457733e-05, -3.329664468765259e-05, -3.2024458050727844e-05, -3.07522714138031e-05, -2.9480084776878357e-05, -2.8207898139953613e-05, -2.693571150302887e-05, -2.5663524866104126e-05, -2.4391338229179382e-05, -2.311915159225464e-05, -2.1846964955329895e-05, -2.057477831840515e-05, -1.9302591681480408e-05, -1.8030405044555664e-05, -1.675821840763092e-05, -1.5486031770706177e-05, -1.4213845133781433e-05, -1.294165849685669e-05, -1.1669471859931946e-05, -1.0397285223007202e-05, -9.125098586082458e-06, -7.852911949157715e-06, -6.580725312232971e-06, -5.3085386753082275e-06, -4.036352038383484e-06, -2.7641654014587402e-06, -1.4919787645339966e-06, -2.1979212760925293e-07, 1.0523945093154907e-06, 2.3245811462402344e-06, 3.596767783164978e-06, 4.868954420089722e-06, 6.141141057014465e-06, 7.413327693939209e-06, 8.685514330863953e-06, 9.957700967788696e-06, 1.122988760471344e-05, 1.2502074241638184e-05, 1.3774260878562927e-05, 1.5046447515487671e-05, 1.6318634152412415e-05, 1.7590820789337158e-05, 1.8863007426261902e-05, 2.0135194063186646e-05, 2.140738070011139e-05, 2.2679567337036133e-05, 2.3951753973960876e-05, 2.522394061088562e-05, 2.6496127247810364e-05, 2.7768313884735107e-05, 2.904050052165985e-05, 3.0312687158584595e-05, 3.158487379550934e-05, 3.285706043243408e-05, 3.4129247069358826e-05, 3.540143370628357e-05, 3.667362034320831e-05, 3.794580698013306e-05, 3.92179936170578e-05, 4.0490180253982544e-05, 4.176236689090729e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 17.0, 10.0, 9.0, 15.0, 24.0, 31.0, 56.0, 66.0, 118.0, 153.0, 241.0, 328.0, 477.0, 695.0, 1127.0, 1716.0, 2848.0, 4656.0, 8294.0, 15427.0, 31446.0, 70075.0, 175482.0, 372444.0, 205511.0, 81483.0, 35830.0, 17126.0, 9084.0, 5217.0, 3149.0, 1864.0, 1124.0, 801.0, 490.0, 344.0, 250.0, 159.0, 100.0, 82.0, 66.0, 42.0, 35.0, 16.0, 8.0, 9.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00986480712890625, -0.009552478790283203, -0.009240150451660156, -0.00892782211303711, -0.008615493774414062, -0.008303165435791016, -0.007990837097167969, -0.007678508758544922, -0.007366180419921875, -0.007053852081298828, -0.006741523742675781, -0.006429195404052734, -0.0061168670654296875, -0.005804538726806641, -0.005492210388183594, -0.005179882049560547, -0.0048675537109375, -0.004555225372314453, -0.004242897033691406, -0.003930568695068359, -0.0036182403564453125, -0.0033059120178222656, -0.0029935836791992188, -0.002681255340576172, -0.002368927001953125, -0.002056598663330078, -0.0017442703247070312, -0.0014319419860839844, -0.0011196136474609375, -0.0008072853088378906, -0.0004949569702148438, -0.00018262863159179688, 0.00012969970703125, 0.0004420280456542969, 0.0007543563842773438, 0.0010666847229003906, 0.0013790130615234375, 0.0016913414001464844, 0.0020036697387695312, 0.002315998077392578, 0.002628326416015625, 0.002940654754638672, 0.0032529830932617188, 0.0035653114318847656, 0.0038776397705078125, 0.004189968109130859, 0.004502296447753906, 0.004814624786376953, 0.005126953125, 0.005439281463623047, 0.005751609802246094, 0.006063938140869141, 0.0063762664794921875, 0.006688594818115234, 0.007000923156738281, 0.007313251495361328, 0.007625579833984375, 0.007937908172607422, 0.008250236511230469, 0.008562564849853516, 0.008874893188476562, 0.00918722152709961, 0.009499549865722656, 0.009811878204345703, 0.01012420654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 11.0, 6.0, 15.0, 13.0, 16.0, 29.0, 37.0, 42.0, 64.0, 86.0, 68.0, 87.0, 103.0, 77.0, 61.0, 56.0, 46.0, 33.0, 22.0, 30.0, 13.0, 17.0, 9.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01485443115234375, -0.014367938041687012, -0.013881444931030273, -0.013394951820373535, -0.012908458709716797, -0.012421965599060059, -0.01193547248840332, -0.011448979377746582, -0.010962486267089844, -0.010475993156433105, -0.009989500045776367, -0.009503006935119629, -0.00901651382446289, -0.008530020713806152, -0.008043527603149414, -0.007557034492492676, -0.0070705413818359375, -0.006584048271179199, -0.006097555160522461, -0.005611062049865723, -0.005124568939208984, -0.004638075828552246, -0.004151582717895508, -0.0036650896072387695, -0.0031785964965820312, -0.002692103385925293, -0.0022056102752685547, -0.0017191171646118164, -0.0012326240539550781, -0.0007461309432983398, -0.00025963783264160156, 0.00022685527801513672, 0.000713348388671875, 0.0011998414993286133, 0.0016863346099853516, 0.00217282772064209, 0.002659320831298828, 0.0031458139419555664, 0.0036323070526123047, 0.004118800163269043, 0.004605293273925781, 0.0050917863845825195, 0.005578279495239258, 0.006064772605895996, 0.006551265716552734, 0.007037758827209473, 0.007524251937866211, 0.00801074504852295, 0.008497238159179688, 0.008983731269836426, 0.009470224380493164, 0.009956717491149902, 0.01044321060180664, 0.010929703712463379, 0.011416196823120117, 0.011902689933776855, 0.012389183044433594, 0.012875676155090332, 0.01336216926574707, 0.013848662376403809, 0.014335155487060547, 0.014821648597717285, 0.015308141708374023, 0.01579463481903076, 0.0162811279296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 23.0, 48.0, 106.0, 204.0, 247.0, 175.0, 92.0, 48.0, 19.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8503850102424622, -0.8307543396949768, -0.8111236095428467, -0.7914929389953613, -0.771862268447876, -0.7522315382957458, -0.7326008677482605, -0.7129701375961304, -0.693339467048645, -0.6737087965011597, -0.6540780663490295, -0.6344473958015442, -0.6148166656494141, -0.5951859951019287, -0.5755553245544434, -0.555924654006958, -0.5362939238548279, -0.5166632533073425, -0.4970325231552124, -0.47740185260772705, -0.4577711522579193, -0.4381404519081116, -0.4185097813606262, -0.3988790810108185, -0.37924838066101074, -0.359617680311203, -0.33998697996139526, -0.3203563094139099, -0.3007256090641022, -0.28109490871429443, -0.2614642381668091, -0.24183353781700134, -0.22220280766487122, -0.20257210731506348, -0.18294142186641693, -0.16331073641777039, -0.14368003606796265, -0.1240493431687355, -0.10441865026950836, -0.08478796482086182, -0.06515726447105408, -0.045526571571826935, -0.025895878672599792, -0.00626518577337265, 0.013365507125854492, 0.032996200025081635, 0.05262689292430878, 0.07225757837295532, 0.09188827872276306, 0.1115189716219902, 0.13114966452121735, 0.1507803499698639, 0.17041105031967163, 0.19004175066947937, 0.20967243611812592, 0.22930312156677246, 0.2489338219165802, 0.26856452226638794, 0.2881951928138733, 0.30782589316368103, 0.32745659351348877, 0.3470872938632965, 0.36671799421310425, 0.3863486647605896, 0.40597936511039734]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 11.0, 15.0, 12.0, 19.0, 20.0, 22.0, 22.0, 25.0, 26.0, 35.0, 22.0, 33.0, 38.0, 50.0, 37.0, 52.0, 49.0, 49.0, 47.0, 39.0, 43.0, 42.0, 46.0, 31.0, 28.0, 32.0, 20.0, 16.0, 16.0, 14.0, 15.0, 10.0, 3.0, 14.0, 7.0, 5.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.20375710725784302, -0.1981145590543747, -0.19247199594974518, -0.18682944774627686, -0.18118689954280853, -0.1755443513393402, -0.1699017882347107, -0.16425924003124237, -0.15861669182777405, -0.15297414362430573, -0.1473315805196762, -0.14168903231620789, -0.13604648411273956, -0.13040393590927124, -0.12476137280464172, -0.1191188246011734, -0.11347626149654388, -0.10783370584249496, -0.10219115763902664, -0.09654860198497772, -0.0909060537815094, -0.08526349812746048, -0.07962094247341156, -0.07397839426994324, -0.06833583861589432, -0.0626932829618454, -0.057050734758377075, -0.051408179104328156, -0.045765627175569534, -0.04012307524681091, -0.03448051959276199, -0.028837967664003372, -0.02319541573524475, -0.01755286380648613, -0.01191031001508236, -0.006267756223678589, -0.0006252042949199677, 0.0050173476338386536, 0.010659903287887573, 0.016302455216646194, 0.021945007145404816, 0.027587559074163437, 0.03323011100292206, 0.03887266665697098, 0.0445152185857296, 0.05015777051448822, 0.05580032616853714, 0.06144287809729576, 0.06708543002605438, 0.0727279856801033, 0.07837053388357162, 0.08401308953762054, 0.08965563774108887, 0.09529819339513779, 0.1009407490491867, 0.10658329725265503, 0.11222585290670395, 0.11786840856075287, 0.12351095676422119, 0.1291535198688507, 0.13479606807231903, 0.14043861627578735, 0.14608117938041687, 0.1517237275838852, 0.15736627578735352]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 9.0, 17.0, 15.0, 26.0, 39.0, 48.0, 78.0, 109.0, 174.0, 286.0, 501.0, 1048.0, 2399.0, 7079.0, 25626.0, 130010.0, 1164291.0, 2472994.0, 320450.0, 50909.0, 11939.0, 3637.0, 1327.0, 570.0, 277.0, 146.0, 78.0, 66.0, 26.0, 28.0, 11.0, 15.0, 11.0, 10.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07891845703125, -0.07654285430908203, -0.07416725158691406, -0.0717916488647461, -0.06941604614257812, -0.06704044342041016, -0.06466484069824219, -0.06228923797607422, -0.05991363525390625, -0.05753803253173828, -0.05516242980957031, -0.052786827087402344, -0.050411224365234375, -0.048035621643066406, -0.04566001892089844, -0.04328441619873047, -0.0409088134765625, -0.03853321075439453, -0.03615760803222656, -0.033782005310058594, -0.031406402587890625, -0.029030799865722656, -0.026655197143554688, -0.02427959442138672, -0.02190399169921875, -0.01952838897705078, -0.017152786254882812, -0.014777183532714844, -0.012401580810546875, -0.010025978088378906, -0.0076503753662109375, -0.005274772644042969, -0.002899169921875, -0.0005235671997070312, 0.0018520355224609375, 0.004227638244628906, 0.006603240966796875, 0.008978843688964844, 0.011354446411132812, 0.013730049133300781, 0.01610565185546875, 0.01848125457763672, 0.020856857299804688, 0.023232460021972656, 0.025608062744140625, 0.027983665466308594, 0.030359268188476562, 0.03273487091064453, 0.0351104736328125, 0.03748607635498047, 0.03986167907714844, 0.042237281799316406, 0.044612884521484375, 0.046988487243652344, 0.04936408996582031, 0.05173969268798828, 0.05411529541015625, 0.05649089813232422, 0.05886650085449219, 0.061242103576660156, 0.06361770629882812, 0.0659933090209961, 0.06836891174316406, 0.07074451446533203, 0.0731201171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 17.0, 7.0, 19.0, 29.0, 27.0, 48.0, 59.0, 61.0, 51.0, 83.0, 86.0, 84.0, 72.0, 74.0, 59.0, 57.0, 49.0, 24.0, 23.0, 15.0, 20.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.030609130859375, -0.02972888946533203, -0.028848648071289062, -0.027968406677246094, -0.027088165283203125, -0.026207923889160156, -0.025327682495117188, -0.02444744110107422, -0.02356719970703125, -0.02268695831298828, -0.021806716918945312, -0.020926475524902344, -0.020046234130859375, -0.019165992736816406, -0.018285751342773438, -0.01740550994873047, -0.0165252685546875, -0.01564502716064453, -0.014764785766601562, -0.013884544372558594, -0.013004302978515625, -0.012124061584472656, -0.011243820190429688, -0.010363578796386719, -0.00948333740234375, -0.008603096008300781, -0.0077228546142578125, -0.006842613220214844, -0.005962371826171875, -0.005082130432128906, -0.0042018890380859375, -0.0033216476440429688, -0.00244140625, -0.0015611648559570312, -0.0006809234619140625, 0.00019931793212890625, 0.001079559326171875, 0.0019598007202148438, 0.0028400421142578125, 0.0037202835083007812, 0.00460052490234375, 0.005480766296386719, 0.0063610076904296875, 0.007241249084472656, 0.008121490478515625, 0.009001731872558594, 0.009881973266601562, 0.010762214660644531, 0.0116424560546875, 0.012522697448730469, 0.013402938842773438, 0.014283180236816406, 0.015163421630859375, 0.016043663024902344, 0.016923904418945312, 0.01780414581298828, 0.01868438720703125, 0.01956462860107422, 0.020444869995117188, 0.021325111389160156, 0.022205352783203125, 0.023085594177246094, 0.023965835571289062, 0.02484607696533203, 0.025726318359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 11.0, 12.0, 31.0, 21.0, 39.0, 47.0, 63.0, 90.0, 132.0, 199.0, 326.0, 555.0, 963.0, 1637.0, 3259.0, 7009.0, 17408.0, 54279.0, 243772.0, 1968113.0, 1610289.0, 208121.0, 48820.0, 15794.0, 6457.0, 3041.0, 1504.0, 868.0, 503.0, 318.0, 198.0, 113.0, 77.0, 62.0, 48.0, 34.0, 14.0, 13.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0], "bins": [-0.07318115234375, -0.07130241394042969, -0.06942367553710938, -0.06754493713378906, -0.06566619873046875, -0.06378746032714844, -0.061908721923828125, -0.06002998352050781, -0.0581512451171875, -0.05627250671386719, -0.054393768310546875, -0.05251502990722656, -0.05063629150390625, -0.04875755310058594, -0.046878814697265625, -0.04500007629394531, -0.043121337890625, -0.04124259948730469, -0.039363861083984375, -0.03748512268066406, -0.03560638427734375, -0.03372764587402344, -0.031848907470703125, -0.029970169067382812, -0.0280914306640625, -0.026212692260742188, -0.024333953857421875, -0.022455215454101562, -0.02057647705078125, -0.018697738647460938, -0.016819000244140625, -0.014940261840820312, -0.0130615234375, -0.011182785034179688, -0.009304046630859375, -0.0074253082275390625, -0.00554656982421875, -0.0036678314208984375, -0.001789093017578125, 8.96453857421875e-05, 0.0019683837890625, 0.0038471221923828125, 0.005725860595703125, 0.0076045989990234375, 0.00948333740234375, 0.011362075805664062, 0.013240814208984375, 0.015119552612304688, 0.016998291015625, 0.018877029418945312, 0.020755767822265625, 0.022634506225585938, 0.02451324462890625, 0.026391983032226562, 0.028270721435546875, 0.030149459838867188, 0.0320281982421875, 0.03390693664550781, 0.035785675048828125, 0.03766441345214844, 0.03954315185546875, 0.04142189025878906, 0.043300628662109375, 0.04517936706542969, 0.04705810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 5.0, 8.0, 12.0, 11.0, 23.0, 20.0, 35.0, 42.0, 85.0, 112.0, 158.0, 216.0, 369.0, 477.0, 615.0, 574.0, 415.0, 288.0, 198.0, 128.0, 94.0, 65.0, 30.0, 39.0, 14.0, 11.0, 9.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08607673645019531, -0.08328628540039062, -0.08049583435058594, -0.07770538330078125, -0.07491493225097656, -0.07212448120117188, -0.06933403015136719, -0.0665435791015625, -0.06375312805175781, -0.060962677001953125, -0.05817222595214844, -0.05538177490234375, -0.05259132385253906, -0.049800872802734375, -0.04701042175292969, -0.044219970703125, -0.04142951965332031, -0.038639068603515625, -0.03584861755371094, -0.03305816650390625, -0.030267715454101562, -0.027477264404296875, -0.024686813354492188, -0.0218963623046875, -0.019105911254882812, -0.016315460205078125, -0.013525009155273438, -0.01073455810546875, -0.007944107055664062, -0.005153656005859375, -0.0023632049560546875, 0.00042724609375, 0.0032176971435546875, 0.006008148193359375, 0.008798599243164062, 0.01158905029296875, 0.014379501342773438, 0.017169952392578125, 0.019960403442382812, 0.0227508544921875, 0.025541305541992188, 0.028331756591796875, 0.031122207641601562, 0.03391265869140625, 0.03670310974121094, 0.039493560791015625, 0.04228401184082031, 0.045074462890625, 0.04786491394042969, 0.050655364990234375, 0.05344581604003906, 0.05623626708984375, 0.05902671813964844, 0.061817169189453125, 0.06460762023925781, 0.0673980712890625, 0.07018852233886719, 0.07297897338867188, 0.07576942443847656, 0.07855987548828125, 0.08135032653808594, 0.08414077758789062, 0.08693122863769531, 0.0897216796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 9.0, 4.0, 9.0, 4.0, 17.0, 10.0, 31.0, 63.0, 77.0, 143.0, 195.0, 154.0, 117.0, 65.0, 39.0, 20.0, 13.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5112895965576172, -1.4646813869476318, -1.418073058128357, -1.3714648485183716, -1.3248566389083862, -1.2782483100891113, -1.231640100479126, -1.1850318908691406, -1.1384235620498657, -1.0918153524398804, -1.0452070236206055, -0.9985988140106201, -0.95199054479599, -0.9053822755813599, -0.8587740659713745, -0.8121657967567444, -0.765557587146759, -0.7189493179321289, -0.6723411083221436, -0.6257328391075134, -0.5791245698928833, -0.532516360282898, -0.4859080910682678, -0.4392998218536377, -0.39269158244132996, -0.3460833430290222, -0.2994750738143921, -0.25286683440208435, -0.20625858008861542, -0.15965032577514648, -0.11304208636283875, -0.06643381714820862, -0.01982557773590088, 0.026782672852277756, 0.07339092344045639, 0.11999917030334473, 0.16660742461681366, 0.2132156789302826, 0.25982391834259033, 0.30643218755722046, 0.3530404269695282, 0.39964866638183594, 0.44625693559646606, 0.4928651750087738, 0.5394734144210815, 0.5860816836357117, 0.6326899528503418, 0.6792981624603271, 0.7259064316749573, 0.7725147008895874, 0.8191229104995728, 0.8657311797142029, 0.912339448928833, 0.9589476585388184, 1.0055558681488037, 1.0521641969680786, 1.098772406578064, 1.1453806161880493, 1.1919889450073242, 1.2385971546173096, 1.285205364227295, 1.3318136930465698, 1.3784219026565552, 1.42503023147583, 1.4716384410858154]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 16.0, 12.0, 20.0, 18.0, 27.0, 20.0, 42.0, 37.0, 37.0, 47.0, 36.0, 51.0, 47.0, 53.0, 60.0, 48.0, 53.0, 42.0, 42.0, 37.0, 43.0, 43.0, 23.0, 25.0, 20.0, 7.0, 11.0, 9.0, 10.0, 7.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7311837077140808, -0.709852397441864, -0.6885210871696472, -0.6671898365020752, -0.6458585262298584, -0.6245272159576416, -0.6031959056854248, -0.581864595413208, -0.5605332851409912, -0.5392019748687744, -0.5178706645965576, -0.4965393841266632, -0.4752081036567688, -0.453876793384552, -0.4325454831123352, -0.4112141728401184, -0.3898829221725464, -0.3685516119003296, -0.3472203314304352, -0.3258890211582184, -0.304557740688324, -0.2832264304161072, -0.2618951201438904, -0.24056382477283478, -0.21923252940177917, -0.19790123403072357, -0.17656993865966797, -0.15523862838745117, -0.13390733301639557, -0.11257603764533997, -0.09124472737312317, -0.06991343200206757, -0.04858219623565674, -0.027250897139310837, -0.005919598042964935, 0.015411704778671265, 0.03674300014972687, 0.05807429552078247, 0.07940560579299927, 0.10073690116405487, 0.12206819653511047, 0.14339949190616608, 0.16473078727722168, 0.18606209754943848, 0.20739339292049408, 0.22872468829154968, 0.2500559985637665, 0.2713872790336609, 0.2927185893058777, 0.3140498995780945, 0.3353811800479889, 0.3567124903202057, 0.3780437707901001, 0.3993750810623169, 0.4207063913345337, 0.4420377016067505, 0.4633689820766449, 0.4847002923488617, 0.5060315728187561, 0.5273628830909729, 0.5486941933631897, 0.5700254440307617, 0.5913567543029785, 0.6126880645751953, 0.6340193748474121]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 2.0, 11.0, 11.0, 12.0, 20.0, 28.0, 31.0, 59.0, 76.0, 108.0, 180.0, 261.0, 422.0, 767.0, 1141.0, 2044.0, 3597.0, 6721.0, 13598.0, 29668.0, 68375.0, 171617.0, 349458.0, 232430.0, 92371.0, 38830.0, 17592.0, 8572.0, 4423.0, 2440.0, 1362.0, 864.0, 529.0, 329.0, 231.0, 132.0, 83.0, 51.0, 29.0, 13.0, 24.0, 10.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048095703125, -0.04652738571166992, -0.044959068298339844, -0.043390750885009766, -0.04182243347167969, -0.04025411605834961, -0.03868579864501953, -0.03711748123168945, -0.035549163818359375, -0.0339808464050293, -0.03241252899169922, -0.03084421157836914, -0.029275894165039062, -0.027707576751708984, -0.026139259338378906, -0.024570941925048828, -0.02300262451171875, -0.021434307098388672, -0.019865989685058594, -0.018297672271728516, -0.016729354858398438, -0.01516103744506836, -0.013592720031738281, -0.012024402618408203, -0.010456085205078125, -0.008887767791748047, -0.007319450378417969, -0.005751132965087891, -0.0041828155517578125, -0.0026144981384277344, -0.0010461807250976562, 0.0005221366882324219, 0.0020904541015625, 0.003658771514892578, 0.005227088928222656, 0.006795406341552734, 0.008363723754882812, 0.00993204116821289, 0.011500358581542969, 0.013068675994873047, 0.014636993408203125, 0.016205310821533203, 0.01777362823486328, 0.01934194564819336, 0.020910263061523438, 0.022478580474853516, 0.024046897888183594, 0.025615215301513672, 0.02718353271484375, 0.028751850128173828, 0.030320167541503906, 0.031888484954833984, 0.03345680236816406, 0.03502511978149414, 0.03659343719482422, 0.0381617546081543, 0.039730072021484375, 0.04129838943481445, 0.04286670684814453, 0.04443502426147461, 0.04600334167480469, 0.047571659088134766, 0.049139976501464844, 0.05070829391479492, 0.052276611328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 13.0, 14.0, 20.0, 19.0, 27.0, 35.0, 38.0, 40.0, 53.0, 43.0, 60.0, 77.0, 57.0, 66.0, 65.0, 57.0, 61.0, 44.0, 27.0, 31.0, 26.0, 22.0, 10.0, 18.0, 14.0, 5.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0582275390625, -0.05646848678588867, -0.054709434509277344, -0.052950382232666016, -0.05119132995605469, -0.04943227767944336, -0.04767322540283203, -0.0459141731262207, -0.044155120849609375, -0.04239606857299805, -0.04063701629638672, -0.03887796401977539, -0.03711891174316406, -0.035359859466552734, -0.033600807189941406, -0.03184175491333008, -0.03008270263671875, -0.028323650360107422, -0.026564598083496094, -0.024805545806884766, -0.023046493530273438, -0.02128744125366211, -0.01952838897705078, -0.017769336700439453, -0.016010284423828125, -0.014251232147216797, -0.012492179870605469, -0.01073312759399414, -0.008974075317382812, -0.007215023040771484, -0.005455970764160156, -0.003696918487548828, -0.0019378662109375, -0.00017881393432617188, 0.0015802383422851562, 0.0033392906188964844, 0.0050983428955078125, 0.006857395172119141, 0.008616447448730469, 0.010375499725341797, 0.012134552001953125, 0.013893604278564453, 0.01565265655517578, 0.01741170883178711, 0.019170761108398438, 0.020929813385009766, 0.022688865661621094, 0.024447917938232422, 0.02620697021484375, 0.027966022491455078, 0.029725074768066406, 0.031484127044677734, 0.03324317932128906, 0.03500223159790039, 0.03676128387451172, 0.03852033615112305, 0.040279388427734375, 0.0420384407043457, 0.04379749298095703, 0.04555654525756836, 0.04731559753417969, 0.049074649810791016, 0.050833702087402344, 0.05259275436401367, 0.054351806640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 12.0, 14.0, 25.0, 52.0, 118.0, 291.0, 897.0, 4129.0, 39012.0, 930334.0, 66406.0, 5521.0, 1099.0, 367.0, 147.0, 53.0, 28.0, 16.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3289680480957031, -0.31784820556640625, -0.3067283630371094, -0.2956085205078125, -0.2844886779785156, -0.27336883544921875, -0.2622489929199219, -0.251129150390625, -0.24000930786132812, -0.22888946533203125, -0.21776962280273438, -0.2066497802734375, -0.19552993774414062, -0.18441009521484375, -0.17329025268554688, -0.16217041015625, -0.15105056762695312, -0.13993072509765625, -0.12881088256835938, -0.1176910400390625, -0.10657119750976562, -0.09545135498046875, -0.08433151245117188, -0.073211669921875, -0.062091827392578125, -0.05097198486328125, -0.039852142333984375, -0.0287322998046875, -0.017612457275390625, -0.00649261474609375, 0.004627227783203125, 0.0157470703125, 0.026866912841796875, 0.03798675537109375, 0.049106597900390625, 0.0602264404296875, 0.07134628295898438, 0.08246612548828125, 0.09358596801757812, 0.104705810546875, 0.11582565307617188, 0.12694549560546875, 0.13806533813476562, 0.1491851806640625, 0.16030502319335938, 0.17142486572265625, 0.18254470825195312, 0.19366455078125, 0.20478439331054688, 0.21590423583984375, 0.22702407836914062, 0.2381439208984375, 0.24926376342773438, 0.26038360595703125, 0.2715034484863281, 0.282623291015625, 0.2937431335449219, 0.30486297607421875, 0.3159828186035156, 0.3271026611328125, 0.3382225036621094, 0.34934234619140625, 0.3604621887207031, 0.37158203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 12.0, 14.0, 21.0, 26.0, 39.0, 51.0, 80.0, 83.0, 113.0, 106.0, 101.0, 81.0, 87.0, 56.0, 36.0, 29.0, 20.0, 20.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45751953125, -0.44249725341796875, -0.4274749755859375, -0.41245269775390625, -0.397430419921875, -0.38240814208984375, -0.3673858642578125, -0.35236358642578125, -0.33734130859375, -0.32231903076171875, -0.3072967529296875, -0.29227447509765625, -0.277252197265625, -0.26222991943359375, -0.2472076416015625, -0.23218536376953125, -0.2171630859375, -0.20214080810546875, -0.1871185302734375, -0.17209625244140625, -0.157073974609375, -0.14205169677734375, -0.1270294189453125, -0.11200714111328125, -0.09698486328125, -0.08196258544921875, -0.0669403076171875, -0.05191802978515625, -0.036895751953125, -0.02187347412109375, -0.0068511962890625, 0.00817108154296875, 0.023193359375, 0.03821563720703125, 0.0532379150390625, 0.06826019287109375, 0.083282470703125, 0.09830474853515625, 0.1133270263671875, 0.12834930419921875, 0.14337158203125, 0.15839385986328125, 0.1734161376953125, 0.18843841552734375, 0.203460693359375, 0.21848297119140625, 0.2335052490234375, 0.24852752685546875, 0.2635498046875, 0.27857208251953125, 0.2935943603515625, 0.30861663818359375, 0.323638916015625, 0.33866119384765625, 0.3536834716796875, 0.36870574951171875, 0.38372802734375, 0.39875030517578125, 0.4137725830078125, 0.42879486083984375, 0.443817138671875, 0.45883941650390625, 0.4738616943359375, 0.48888397216796875, 0.50390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 15.0, 47.0, 285.0, 11011.0, 1036186.0, 856.0, 90.0, 20.0, 8.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2776947021484375, -1.238006591796875, -1.1983184814453125, -1.15863037109375, -1.1189422607421875, -1.079254150390625, -1.0395660400390625, -0.9998779296875, -0.9601898193359375, -0.920501708984375, -0.8808135986328125, -0.84112548828125, -0.8014373779296875, -0.761749267578125, -0.7220611572265625, -0.682373046875, -0.6426849365234375, -0.602996826171875, -0.5633087158203125, -0.52362060546875, -0.4839324951171875, -0.444244384765625, -0.4045562744140625, -0.3648681640625, -0.3251800537109375, -0.285491943359375, -0.2458038330078125, -0.20611572265625, -0.1664276123046875, -0.126739501953125, -0.0870513916015625, -0.04736328125, -0.0076751708984375, 0.032012939453125, 0.0717010498046875, 0.11138916015625, 0.1510772705078125, 0.190765380859375, 0.2304534912109375, 0.2701416015625, 0.3098297119140625, 0.349517822265625, 0.3892059326171875, 0.42889404296875, 0.4685821533203125, 0.508270263671875, 0.5479583740234375, 0.587646484375, 0.6273345947265625, 0.667022705078125, 0.7067108154296875, 0.74639892578125, 0.7860870361328125, 0.825775146484375, 0.8654632568359375, 0.9051513671875, 0.9448394775390625, 0.984527587890625, 1.0242156982421875, 1.06390380859375, 1.1035919189453125, 1.143280029296875, 1.1829681396484375, 1.22265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 3.0, 6.0, 4.0, 5.0, 11.0, 9.0, 20.0, 25.0, 26.0, 42.0, 64.0, 97.0, 149.0, 132.0, 95.0, 68.0, 54.0, 26.0, 26.0, 14.0, 16.0, 29.0, 15.0, 11.0, 5.0, 3.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.002187728881836e-05, -5.820672959089279e-05, -5.6391581892967224e-05, -5.4576434195041656e-05, -5.276128649711609e-05, -5.094613879919052e-05, -4.9130991101264954e-05, -4.7315843403339386e-05, -4.550069570541382e-05, -4.368554800748825e-05, -4.187040030956268e-05, -4.0055252611637115e-05, -3.824010491371155e-05, -3.642495721578598e-05, -3.460980951786041e-05, -3.2794661819934845e-05, -3.097951412200928e-05, -2.916436642408371e-05, -2.7349218726158142e-05, -2.5534071028232574e-05, -2.3718923330307007e-05, -2.190377563238144e-05, -2.008862793445587e-05, -1.8273480236530304e-05, -1.6458332538604736e-05, -1.4643184840679169e-05, -1.2828037142753601e-05, -1.1012889444828033e-05, -9.197741746902466e-06, -7.382594048976898e-06, -5.5674463510513306e-06, -3.752298653125763e-06, -1.9371509552001953e-06, -1.2200325727462769e-07, 1.69314444065094e-06, 3.5082921385765076e-06, 5.323439836502075e-06, 7.138587534427643e-06, 8.95373523235321e-06, 1.0768882930278778e-05, 1.2584030628204346e-05, 1.4399178326129913e-05, 1.621432602405548e-05, 1.802947372198105e-05, 1.9844621419906616e-05, 2.1659769117832184e-05, 2.347491681575775e-05, 2.529006451368332e-05, 2.7105212211608887e-05, 2.8920359909534454e-05, 3.073550760746002e-05, 3.255065530538559e-05, 3.436580300331116e-05, 3.6180950701236725e-05, 3.799609839916229e-05, 3.981124609708786e-05, 4.162639379501343e-05, 4.3441541492938995e-05, 4.525668919086456e-05, 4.707183688879013e-05, 4.88869845867157e-05, 5.0702132284641266e-05, 5.2517279982566833e-05, 5.43324276804924e-05, 5.614757537841797e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 9.0, 14.0, 22.0, 30.0, 47.0, 70.0, 101.0, 150.0, 284.0, 583.0, 1285.0, 4076.0, 25295.0, 911072.0, 94071.0, 7750.0, 2018.0, 791.0, 350.0, 175.0, 122.0, 81.0, 40.0, 29.0, 19.0, 16.0, 8.0, 14.0, 9.0, 7.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.10940265655517578, -0.10497474670410156, -0.10054683685302734, -0.09611892700195312, -0.0916910171508789, -0.08726310729980469, -0.08283519744873047, -0.07840728759765625, -0.07397937774658203, -0.06955146789550781, -0.0651235580444336, -0.060695648193359375, -0.056267738342285156, -0.05183982849121094, -0.04741191864013672, -0.0429840087890625, -0.03855609893798828, -0.03412818908691406, -0.029700279235839844, -0.025272369384765625, -0.020844459533691406, -0.016416549682617188, -0.011988639831542969, -0.00756072998046875, -0.0031328201293945312, 0.0012950897216796875, 0.005722999572753906, 0.010150909423828125, 0.014578819274902344, 0.019006729125976562, 0.02343463897705078, 0.027862548828125, 0.03229045867919922, 0.03671836853027344, 0.041146278381347656, 0.045574188232421875, 0.050002098083496094, 0.05443000793457031, 0.05885791778564453, 0.06328582763671875, 0.06771373748779297, 0.07214164733886719, 0.0765695571899414, 0.08099746704101562, 0.08542537689208984, 0.08985328674316406, 0.09428119659423828, 0.0987091064453125, 0.10313701629638672, 0.10756492614746094, 0.11199283599853516, 0.11642074584960938, 0.1208486557006836, 0.1252765655517578, 0.12970447540283203, 0.13413238525390625, 0.13856029510498047, 0.1429882049560547, 0.1474161148071289, 0.15184402465820312, 0.15627193450927734, 0.16069984436035156, 0.16512775421142578, 0.1695556640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 17.0, 26.0, 49.0, 69.0, 131.0, 277.0, 187.0, 95.0, 46.0, 27.0, 23.0, 10.0, 10.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.176666259765625, -0.16949462890625, -0.162322998046875, -0.1551513671875, -0.147979736328125, -0.14080810546875, -0.133636474609375, -0.12646484375, -0.119293212890625, -0.11212158203125, -0.104949951171875, -0.0977783203125, -0.090606689453125, -0.08343505859375, -0.076263427734375, -0.069091796875, -0.061920166015625, -0.05474853515625, -0.047576904296875, -0.0404052734375, -0.033233642578125, -0.02606201171875, -0.018890380859375, -0.01171875, -0.004547119140625, 0.00262451171875, 0.009796142578125, 0.0169677734375, 0.024139404296875, 0.03131103515625, 0.038482666015625, 0.045654296875, 0.052825927734375, 0.05999755859375, 0.067169189453125, 0.0743408203125, 0.081512451171875, 0.08868408203125, 0.095855712890625, 0.10302734375, 0.110198974609375, 0.11737060546875, 0.124542236328125, 0.1317138671875, 0.138885498046875, 0.14605712890625, 0.153228759765625, 0.160400390625, 0.167572021484375, 0.17474365234375, 0.181915283203125, 0.1890869140625, 0.196258544921875, 0.20343017578125, 0.210601806640625, 0.2177734375, 0.224945068359375, 0.23211669921875, 0.239288330078125, 0.2464599609375, 0.253631591796875, 0.26080322265625, 0.267974853515625, 0.275146484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 10.0, 17.0, 27.0, 109.0, 367.0, 287.0, 104.0, 39.0, 12.0, 15.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.168622970581055, -6.036830425262451, -5.905038356781006, -5.773245811462402, -5.641453266143799, -5.509660720825195, -5.37786865234375, -5.2460761070251465, -5.114283561706543, -4.9824910163879395, -4.850698947906494, -4.718906402587891, -4.587113857269287, -4.455321311950684, -4.323529243469238, -4.191736698150635, -4.059944152832031, -3.928151845932007, -3.7963593006134033, -3.664566993713379, -3.5327744483947754, -3.400982141494751, -3.2691898345947266, -3.137397289276123, -3.0056052207946777, -2.8738129138946533, -2.74202036857605, -2.6102280616760254, -2.478435516357422, -2.3466432094573975, -2.214850902557373, -2.0830583572387695, -1.951265811920166, -1.819473385810852, -1.687680959701538, -1.5558886528015137, -1.4240961074829102, -1.2923038005828857, -1.1605113744735718, -1.0287189483642578, -0.8969265222549438, -0.7651340961456299, -0.6333416700363159, -0.5015493035316467, -0.36975687742233276, -0.2379644513130188, -0.10617208480834961, 0.025620341300964355, 0.15741276741027832, 0.2892051935195923, 0.42099758982658386, 0.5527899861335754, 0.6845824122428894, 0.8163748383522034, 0.9481672048568726, 1.0799596309661865, 1.2117520570755005, 1.3435444831848145, 1.4753369092941284, 1.6071293354034424, 1.7389216423034668, 1.8707141876220703, 2.0025064945220947, 2.134298801422119, 2.2660913467407227]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 20.0, 20.0, 38.0, 75.0, 104.0, 133.0, 182.0, 134.0, 95.0, 77.0, 40.0, 29.0, 10.0, 14.0, 5.0, 8.0, 1.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.509722709655762, -4.4109601974487305, -4.312197685241699, -4.213435649871826, -4.114673137664795, -4.015910625457764, -3.9171481132507324, -3.8183858394622803, -3.719623565673828, -3.620861053466797, -3.5220987796783447, -3.4233362674713135, -3.3245739936828613, -3.22581148147583, -3.127048969268799, -3.0282866954803467, -2.9295241832733154, -2.830761671066284, -2.731999397277832, -2.633236885070801, -2.5344746112823486, -2.4357120990753174, -2.3369498252868652, -2.238187313079834, -2.1394248008728027, -2.0406622886657715, -1.9419000148773193, -1.843137502670288, -1.744375228881836, -1.6456127166748047, -1.546850323677063, -1.4480879306793213, -1.3493256568908691, -1.2505632638931274, -1.1518008708953857, -1.0530383586883545, -0.9542760252952576, -0.8555136322975159, -0.7567511796951294, -0.6579887866973877, -0.559226393699646, -0.4604640007019043, -0.3617015779018402, -0.2629391551017761, -0.16417676210403442, -0.06541436910629272, 0.03334808349609375, 0.13211047649383545, 0.23087286949157715, 0.32963526248931885, 0.42839768528938293, 0.527160108089447, 0.6259225010871887, 0.7246848940849304, 0.8234473466873169, 0.9222097396850586, 1.0209721326828003, 1.119734525680542, 1.2184969186782837, 1.3172593116760254, 1.4160218238830566, 1.5147840976715088, 1.61354660987854, 1.7123090028762817, 1.8110713958740234]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 12.0, 19.0, 25.0, 47.0, 87.0, 514.0, 160.0, 50.0, 31.0, 20.0, 14.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3882732391357422, -0.3795738220214844, -0.37087440490722656, -0.36217498779296875, -0.35347557067871094, -0.3447761535644531, -0.3360767364501953, -0.3273773193359375, -0.3186779022216797, -0.3099784851074219, -0.30127906799316406, -0.29257965087890625, -0.28388023376464844, -0.2751808166503906, -0.2664813995361328, -0.257781982421875, -0.2490825653076172, -0.24038314819335938, -0.23168373107910156, -0.22298431396484375, -0.21428489685058594, -0.20558547973632812, -0.1968860626220703, -0.1881866455078125, -0.1794872283935547, -0.17078781127929688, -0.16208839416503906, -0.15338897705078125, -0.14468955993652344, -0.13599014282226562, -0.1272907257080078, -0.11859130859375, -0.10989189147949219, -0.10119247436523438, -0.09249305725097656, -0.08379364013671875, -0.07509422302246094, -0.06639480590820312, -0.05769538879394531, -0.0489959716796875, -0.04029655456542969, -0.031597137451171875, -0.022897720336914062, -0.01419830322265625, -0.0054988861083984375, 0.003200531005859375, 0.011899948120117188, 0.020599365234375, 0.029298782348632812, 0.037998199462890625, 0.04669761657714844, 0.05539703369140625, 0.06409645080566406, 0.07279586791992188, 0.08149528503417969, 0.0901947021484375, 0.09889411926269531, 0.10759353637695312, 0.11629295349121094, 0.12499237060546875, 0.13369178771972656, 0.14239120483398438, 0.1510906219482422, 0.1597900390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 11.0, 10.0, 10.0, 18.0, 21.0, 25.0, 38.0, 60.0, 70.0, 168.0, 378.0, 1090.0, 6216.0, 8342106.0, 35168.0, 2223.0, 564.0, 195.0, 69.0, 35.0, 27.0, 15.0, 13.0, 8.0, 4.0, 4.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9338787794113159, -0.9091488122940063, -0.884418785572052, -0.8596888184547424, -0.8349588513374329, -0.8102288246154785, -0.785498857498169, -0.7607688903808594, -0.7360389232635498, -0.7113089561462402, -0.6865789294242859, -0.6618489623069763, -0.6371189951896667, -0.6123889684677124, -0.5876590013504028, -0.5629290342330933, -0.5381990075111389, -0.5134690403938293, -0.4887390434741974, -0.46400904655456543, -0.43927907943725586, -0.4145490825176239, -0.38981908559799194, -0.3650891184806824, -0.3403591215610504, -0.31562912464141846, -0.2908991575241089, -0.26616916060447693, -0.24143917858600616, -0.2167091965675354, -0.19197919964790344, -0.16724921762943268, -0.14251917600631714, -0.11778919398784637, -0.09305920451879501, -0.06832921504974365, -0.04359923303127289, -0.018869251012802124, 0.005860745906829834, 0.030590727925300598, 0.05532070994377136, 0.08005069196224213, 0.10478068143129349, 0.12951067090034485, 0.1542406529188156, 0.17897063493728638, 0.20370063185691833, 0.2284306138753891, 0.25316059589385986, 0.2778905928134918, 0.3026205599308014, 0.32735055685043335, 0.3520805239677429, 0.3768105208873749, 0.40154051780700684, 0.4262704849243164, 0.45100048184394836, 0.4757304787635803, 0.5004604458808899, 0.5251904726028442, 0.5499204397201538, 0.5746504068374634, 0.599380373954773, 0.6241104006767273, 0.6488403677940369]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 4.0, 5.0, 3.0, 8.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.6906124353408813, -0.6626277565956116, -0.6346430778503418, -0.606658399105072, -0.5786737203598022, -0.5506890416145325, -0.5227043628692627, -0.4947196841239929, -0.46673500537872314, -0.43875032663345337, -0.4107656478881836, -0.3827809691429138, -0.35479629039764404, -0.32681161165237427, -0.2988269329071045, -0.2708422541618347, -0.24285760521888733, -0.21487292647361755, -0.18688824772834778, -0.158903568983078, -0.13091889023780823, -0.10293422639369965, -0.07494954764842987, -0.046964868903160095, -0.01898019015789032, 0.009004486724734306, 0.03698916360735893, 0.06497383862733841, 0.09295851737260818, 0.12094318866729736, 0.14892786741256714, 0.17691254615783691, 0.2048972249031067, 0.23288190364837646, 0.26086658239364624, 0.288851261138916, 0.3168359398841858, 0.34482061862945557, 0.37280529737472534, 0.4007899761199951, 0.4287746548652649, 0.45675933361053467, 0.48474401235580444, 0.5127286911010742, 0.540713369846344, 0.5686980485916138, 0.5966827273368835, 0.6246674060821533, 0.6526520252227783, 0.6806367039680481, 0.7086213827133179, 0.7366060614585876, 0.7645907402038574, 0.7925754189491272, 0.820560097694397, 0.8485447764396667, 0.8765294551849365, 0.9045141339302063, 0.9324988126754761, 0.9604834914207458, 0.9884681701660156, 1.0164527893066406, 1.0444375276565552, 1.0724221467971802, 1.1004068851470947]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 15.0, 26.0, 43.0, 55.0, 119.0, 143.0, 221.0, 154.0, 93.0, 50.0, 38.0, 18.0, 15.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.1612548828125, -0.15816259384155273, -0.15507030487060547, -0.1519780158996582, -0.14888572692871094, -0.14579343795776367, -0.1427011489868164, -0.13960886001586914, -0.13651657104492188, -0.1334242820739746, -0.13033199310302734, -0.12723970413208008, -0.12414741516113281, -0.12105512619018555, -0.11796283721923828, -0.11487054824829102, -0.11177825927734375, -0.10868597030639648, -0.10559368133544922, -0.10250139236450195, -0.09940910339355469, -0.09631681442260742, -0.09322452545166016, -0.09013223648071289, -0.08703994750976562, -0.08394765853881836, -0.0808553695678711, -0.07776308059692383, -0.07467079162597656, -0.0715785026550293, -0.06848621368408203, -0.06539392471313477, -0.0623016357421875, -0.059209346771240234, -0.05611705780029297, -0.0530247688293457, -0.04993247985839844, -0.04684019088745117, -0.043747901916503906, -0.04065561294555664, -0.037563323974609375, -0.03447103500366211, -0.031378746032714844, -0.028286457061767578, -0.025194168090820312, -0.022101879119873047, -0.01900959014892578, -0.015917301177978516, -0.01282501220703125, -0.009732723236083984, -0.006640434265136719, -0.003548145294189453, -0.0004558563232421875, 0.002636432647705078, 0.005728721618652344, 0.00882101058959961, 0.011913299560546875, 0.01500558853149414, 0.018097877502441406, 0.021190166473388672, 0.024282455444335938, 0.027374744415283203, 0.03046703338623047, 0.033559322357177734, 0.036651611328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 16.0, 21.0, 14.0, 26.0, 34.0, 53.0, 80.0, 127.0, 175.0, 297.0, 509.0, 974.0, 2094.0, 5245.0, 15983.0, 69484.0, 304697.0, 94006.0, 20029.0, 5958.0, 2261.0, 955.0, 486.0, 250.0, 159.0, 102.0, 70.0, 44.0, 25.0, 26.0, 14.0, 16.0, 7.0, 10.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.037109375, -1.0115585327148438, -0.9860076904296875, -0.9604568481445312, -0.934906005859375, -0.9093551635742188, -0.8838043212890625, -0.8582534790039062, -0.83270263671875, -0.8071517944335938, -0.7816009521484375, -0.7560501098632812, -0.730499267578125, -0.7049484252929688, -0.6793975830078125, -0.6538467407226562, -0.6282958984375, -0.6027450561523438, -0.5771942138671875, -0.5516433715820312, -0.526092529296875, -0.5005416870117188, -0.4749908447265625, -0.44944000244140625, -0.42388916015625, -0.39833831787109375, -0.3727874755859375, -0.34723663330078125, -0.321685791015625, -0.29613494873046875, -0.2705841064453125, -0.24503326416015625, -0.219482421875, -0.19393157958984375, -0.1683807373046875, -0.14282989501953125, -0.117279052734375, -0.09172821044921875, -0.0661773681640625, -0.04062652587890625, -0.01507568359375, 0.01047515869140625, 0.0360260009765625, 0.06157684326171875, 0.087127685546875, 0.11267852783203125, 0.1382293701171875, 0.16378021240234375, 0.1893310546875, 0.21488189697265625, 0.2404327392578125, 0.26598358154296875, 0.291534423828125, 0.31708526611328125, 0.3426361083984375, 0.36818695068359375, 0.39373779296875, 0.41928863525390625, 0.4448394775390625, 0.47039031982421875, 0.495941162109375, 0.5214920043945312, 0.5470428466796875, 0.5725936889648438, 0.59814453125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 1.0, 14.0, 9.0, 18.0, 24.0, 41.0, 49.0, 77.0, 110.0, 131.0, 134.0, 133.0, 72.0, 51.0, 41.0, 25.0, 14.0, 20.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.251953125, -0.24603843688964844, -0.24012374877929688, -0.2342090606689453, -0.22829437255859375, -0.2223796844482422, -0.21646499633789062, -0.21055030822753906, -0.2046356201171875, -0.19872093200683594, -0.19280624389648438, -0.1868915557861328, -0.18097686767578125, -0.1750621795654297, -0.16914749145507812, -0.16323280334472656, -0.157318115234375, -0.15140342712402344, -0.14548873901367188, -0.1395740509033203, -0.13365936279296875, -0.1277446746826172, -0.12182998657226562, -0.11591529846191406, -0.1100006103515625, -0.10408592224121094, -0.09817123413085938, -0.09225654602050781, -0.08634185791015625, -0.08042716979980469, -0.07451248168945312, -0.06859779357910156, -0.06268310546875, -0.05676841735839844, -0.050853729248046875, -0.04493904113769531, -0.03902435302734375, -0.03310966491699219, -0.027194976806640625, -0.021280288696289062, -0.0153656005859375, -0.009450912475585938, -0.003536224365234375, 0.0023784637451171875, 0.00829315185546875, 0.014207839965820312, 0.020122528076171875, 0.026037216186523438, 0.031951904296875, 0.03786659240722656, 0.043781280517578125, 0.04969596862792969, 0.05561065673828125, 0.06152534484863281, 0.06744003295898438, 0.07335472106933594, 0.0792694091796875, 0.08518409729003906, 0.09109878540039062, 0.09701347351074219, 0.10292816162109375, 0.10884284973144531, 0.11475753784179688, 0.12067222595214844, 0.1265869140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 9.0, 6.0, 4.0, 10.0, 19.0, 14.0, 24.0, 30.0, 37.0, 42.0, 34.0, 39.0, 38.0, 38.0, 22.0, 20.0, 21.0, 16.0, 12.0, 11.0, 12.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4283409118652344, -0.4173845648765564, -0.4064282178878784, -0.39547187089920044, -0.38451555371284485, -0.37355920672416687, -0.3626028597354889, -0.3516465127468109, -0.3406901955604553, -0.32973384857177734, -0.31877750158309937, -0.3078211545944214, -0.2968648374080658, -0.2859084904193878, -0.27495214343070984, -0.26399579644203186, -0.2530394494533539, -0.2420831024646759, -0.23112677037715912, -0.22017042338848114, -0.20921409130096436, -0.19825774431228638, -0.1873013973236084, -0.17634505033493042, -0.16538871824741364, -0.15443237125873566, -0.14347603917121887, -0.1325196921825409, -0.12156335264444351, -0.11060701310634613, -0.09965066611766815, -0.08869432657957077, -0.077737957239151, -0.06678161770105362, -0.05582527443766594, -0.04486893117427826, -0.03391259163618088, -0.022956252098083496, -0.011999905109405518, -0.001043565571308136, 0.009912773966789246, 0.020869115367531776, 0.03182545676827431, 0.04278180003166199, 0.05373813956975937, 0.06469447910785675, 0.07565082609653473, 0.08660716563463211, 0.09756350517272949, 0.10851984471082687, 0.11947618424892426, 0.13043253123760223, 0.14138886332511902, 0.152345210313797, 0.16330155730247498, 0.17425790429115295, 0.18521423637866974, 0.19617058336734772, 0.2071269154548645, 0.21808326244354248, 0.22903960943222046, 0.23999594151973724, 0.2509523034095764, 0.261908620595932, 0.27286496758461]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 8.0, 20.0, 12.0, 12.0, 18.0, 14.0, 23.0, 41.0, 37.0, 37.0, 39.0, 25.0, 31.0, 21.0, 27.0, 9.0, 21.0, 13.0, 13.0, 8.0, 12.0, 7.0, 5.0, 3.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7345180511474609, -0.7138820290565491, -0.693246066570282, -0.6726100444793701, -0.651974081993103, -0.6313380599021912, -0.6107020378112793, -0.5900660753250122, -0.5694300532341003, -0.5487940311431885, -0.5281580686569214, -0.5075220465660095, -0.48688605427742004, -0.46625006198883057, -0.4456140398979187, -0.4249780476093292, -0.40434205532073975, -0.38370606303215027, -0.3630700707435608, -0.3424340486526489, -0.32179805636405945, -0.30116206407546997, -0.2805260419845581, -0.25989004969596863, -0.23925405740737915, -0.21861806511878967, -0.197982057929039, -0.17734605073928833, -0.15671005845069885, -0.13607406616210938, -0.1154380589723587, -0.09480205178260803, -0.07416605949401855, -0.05353005975484848, -0.032894060015678406, -0.012258060276508331, 0.008377939462661743, 0.029013939201831818, 0.04964993894100189, 0.07028594613075256, 0.09092193841934204, 0.11155793815851212, 0.1321939378976822, 0.15282994508743286, 0.17346593737602234, 0.19410192966461182, 0.2147379368543625, 0.23537394404411316, 0.25600993633270264, 0.2766459286212921, 0.2972819209098816, 0.31791794300079346, 0.33855393528938293, 0.3591899275779724, 0.3798259496688843, 0.40046194195747375, 0.42109793424606323, 0.4417339265346527, 0.4623699188232422, 0.48300594091415405, 0.5036419630050659, 0.524277925491333, 0.5449139475822449, 0.5655499696731567, 0.5861859321594238]}, "eval/loss": 4.281228065490723, "eval/bleu": 0.0, "eval/runtime": 2569.7097, "eval/samples_per_second": 5.744, "eval/steps_per_second": 0.718} \ No newline at end of file +{"train/loss": 3.856, "train/learning_rate": 0.0001684185630143819, "train/epoch": 1.54, "train/global_step": 5000, "_runtime": 47341, "_timestamp": 1651721430, "_step": 5009, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 54.0, 967.0], "bins": [-162.1786346435547, -159.61509704589844, -157.0515594482422, -154.48802185058594, -151.9244842529297, -149.36093139648438, -146.79739379882812, -144.23385620117188, -141.67031860351562, -139.10678100585938, -136.54324340820312, -133.97970581054688, -131.41616821289062, -128.85263061523438, -126.2890853881836, -123.72554779052734, -121.1620101928711, -118.59847259521484, -116.0349349975586, -113.47138977050781, -110.90785217285156, -108.34431457519531, -105.78077697753906, -103.21723937988281, -100.65370178222656, -98.09016418457031, -95.52662658691406, -92.96308135986328, -90.39954376220703, -87.83600616455078, -85.27246856689453, -82.70893096923828, -80.1453857421875, -77.58184814453125, -75.018310546875, -72.45476531982422, -69.89122772216797, -67.32769012451172, -64.76415252685547, -62.20061492919922, -59.63706970214844, -57.07353210449219, -54.50999069213867, -51.94645309448242, -49.382911682128906, -46.819374084472656, -44.255836486816406, -41.692298889160156, -39.12875747680664, -36.56521987915039, -34.001678466796875, -31.438140869140625, -28.874601364135742, -26.31106185913086, -23.74752426147461, -21.183984756469727, -18.620445251464844, -16.05690574645996, -13.493367195129395, -10.929828643798828, -8.366289138793945, -5.8027496337890625, -3.239211082458496, -0.6756725311279297, 1.8878662586212158]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 10.0, 15.0, 17.0, 24.0, 23.0, 31.0, 26.0, 38.0, 42.0, 49.0, 52.0, 51.0, 47.0, 56.0, 62.0, 56.0, 55.0, 49.0, 42.0, 33.0, 41.0, 33.0, 26.0, 16.0, 18.0, 14.0, 10.0, 15.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.286391735076904, -7.084299564361572, -6.882206916809082, -6.68011474609375, -6.478022575378418, -6.275930404663086, -6.073838233947754, -5.871745586395264, -5.669653415679932, -5.4675612449646, -5.265468597412109, -5.063376426696777, -4.861284255981445, -4.659192085266113, -4.457099914550781, -4.255007266998291, -4.052915096282959, -3.850822925567627, -3.648730516433716, -3.4466381072998047, -3.2445459365844727, -3.0424537658691406, -2.8403613567352295, -2.6382689476013184, -2.4361767768859863, -2.2340846061706543, -2.031992197036743, -1.8298999071121216, -1.6278076171875, -1.4257153272628784, -1.2236230373382568, -1.0215307474136353, -0.8194384574890137, -0.6173461675643921, -0.4152538776397705, -0.21316158771514893, -0.011069297790527344, 0.19102299213409424, 0.3931152820587158, 0.5952075719833374, 0.797299861907959, 0.9993921518325806, 1.2014844417572021, 1.4035767316818237, 1.6056690216064453, 1.807761311531067, 2.0098536014556885, 2.2119460105895996, 2.4140381813049316, 2.6161303520202637, 2.818222761154175, 3.020315170288086, 3.222407341003418, 3.42449951171875, 3.626591920852661, 3.8286843299865723, 4.030776500701904, 4.232868671417236, 4.434961318969727, 4.637053489685059, 4.839145660400391, 5.041237831115723, 5.243330001831055, 5.445422649383545, 5.647514820098877]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 6.0, 7.0, 1.0, 13.0, 13.0, 16.0, 24.0, 33.0, 62.0, 61.0, 87.0, 147.0, 226.0, 350.0, 617.0, 993.0, 1666.0, 2917.0, 5495.0, 9986.0, 19120.0, 35183.0, 67868.0, 150003.0, 661350.0, 2750105.0, 279358.0, 100349.0, 49927.0, 26718.0, 14123.0, 7512.0, 4171.0, 2273.0, 1352.0, 781.0, 473.0, 293.0, 192.0, 122.0, 95.0, 57.0, 39.0, 31.0, 27.0, 20.0, 8.0, 8.0, 5.0, 3.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.3935546875, -2.314453125, -2.2353515625, -2.15625, -2.0771484375, -1.998046875, -1.9189453125, -1.83984375, -1.7607421875, -1.681640625, -1.6025390625, -1.5234375, -1.4443359375, -1.365234375, -1.2861328125, -1.20703125, -1.1279296875, -1.048828125, -0.9697265625, -0.890625, -0.8115234375, -0.732421875, -0.6533203125, -0.57421875, -0.4951171875, -0.416015625, -0.3369140625, -0.2578125, -0.1787109375, -0.099609375, -0.0205078125, 0.05859375, 0.1376953125, 0.216796875, 0.2958984375, 0.375, 0.4541015625, 0.533203125, 0.6123046875, 0.69140625, 0.7705078125, 0.849609375, 0.9287109375, 1.0078125, 1.0869140625, 1.166015625, 1.2451171875, 1.32421875, 1.4033203125, 1.482421875, 1.5615234375, 1.640625, 1.7197265625, 1.798828125, 1.8779296875, 1.95703125, 2.0361328125, 2.115234375, 2.1943359375, 2.2734375, 2.3525390625, 2.431640625, 2.5107421875, 2.58984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 8.0, 10.0, 12.0, 13.0, 12.0, 24.0, 30.0, 28.0, 30.0, 42.0, 30.0, 41.0, 44.0, 47.0, 54.0, 46.0, 44.0, 47.0, 49.0, 58.0, 44.0, 40.0, 42.0, 26.0, 30.0, 18.0, 18.0, 20.0, 11.0, 12.0, 11.0, 7.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-5.74609375, -5.5877685546875, -5.429443359375, -5.2711181640625, -5.11279296875, -4.9544677734375, -4.796142578125, -4.6378173828125, -4.4794921875, -4.3211669921875, -4.162841796875, -4.0045166015625, -3.84619140625, -3.6878662109375, -3.529541015625, -3.3712158203125, -3.212890625, -3.0545654296875, -2.896240234375, -2.7379150390625, -2.57958984375, -2.4212646484375, -2.262939453125, -2.1046142578125, -1.9462890625, -1.7879638671875, -1.629638671875, -1.4713134765625, -1.31298828125, -1.1546630859375, -0.996337890625, -0.8380126953125, -0.6796875, -0.5213623046875, -0.363037109375, -0.2047119140625, -0.04638671875, 0.1119384765625, 0.270263671875, 0.4285888671875, 0.5869140625, 0.7452392578125, 0.903564453125, 1.0618896484375, 1.22021484375, 1.3785400390625, 1.536865234375, 1.6951904296875, 1.853515625, 2.0118408203125, 2.170166015625, 2.3284912109375, 2.48681640625, 2.6451416015625, 2.803466796875, 2.9617919921875, 3.1201171875, 3.2784423828125, 3.436767578125, 3.5950927734375, 3.75341796875, 3.9117431640625, 4.070068359375, 4.2283935546875, 4.38671875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 9.0, 7.0, 3.0, 16.0, 14.0, 22.0, 22.0, 48.0, 59.0, 112.0, 333.0, 4189877.0, 3321.0, 215.0, 86.0, 39.0, 37.0, 20.0, 8.0, 12.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.375, -156.73828125, -152.1015625, -147.46484375, -142.828125, -138.19140625, -133.5546875, -128.91796875, -124.28125, -119.64453125, -115.0078125, -110.37109375, -105.734375, -101.09765625, -96.4609375, -91.82421875, -87.1875, -82.55078125, -77.9140625, -73.27734375, -68.640625, -64.00390625, -59.3671875, -54.73046875, -50.09375, -45.45703125, -40.8203125, -36.18359375, -31.546875, -26.91015625, -22.2734375, -17.63671875, -13.0, -8.36328125, -3.7265625, 0.91015625, 5.546875, 10.18359375, 14.8203125, 19.45703125, 24.09375, 28.73046875, 33.3671875, 38.00390625, 42.640625, 47.27734375, 51.9140625, 56.55078125, 61.1875, 65.82421875, 70.4609375, 75.09765625, 79.734375, 84.37109375, 89.0078125, 93.64453125, 98.28125, 102.91796875, 107.5546875, 112.19140625, 116.828125, 121.46484375, 126.1015625, 130.73828125, 135.375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 7.0, 6.0, 6.0, 9.0, 15.0, 26.0, 24.0, 38.0, 57.0, 89.0, 149.0, 975.0, 2182.0, 225.0, 101.0, 51.0, 44.0, 17.0, 16.0, 8.0, 6.0, 4.0, 8.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.973297119140625, -2.88604736328125, -2.798797607421875, -2.7115478515625, -2.624298095703125, -2.53704833984375, -2.449798583984375, -2.362548828125, -2.275299072265625, -2.18804931640625, -2.100799560546875, -2.0135498046875, -1.926300048828125, -1.83905029296875, -1.751800537109375, -1.66455078125, -1.577301025390625, -1.49005126953125, -1.402801513671875, -1.3155517578125, -1.228302001953125, -1.14105224609375, -1.053802490234375, -0.966552734375, -0.879302978515625, -0.79205322265625, -0.704803466796875, -0.6175537109375, -0.530303955078125, -0.44305419921875, -0.355804443359375, -0.2685546875, -0.181304931640625, -0.09405517578125, -0.006805419921875, 0.0804443359375, 0.167694091796875, 0.25494384765625, 0.342193603515625, 0.429443359375, 0.516693115234375, 0.60394287109375, 0.691192626953125, 0.7784423828125, 0.865692138671875, 0.95294189453125, 1.040191650390625, 1.12744140625, 1.214691162109375, 1.30194091796875, 1.389190673828125, 1.4764404296875, 1.563690185546875, 1.65093994140625, 1.738189697265625, 1.825439453125, 1.912689208984375, 1.99993896484375, 2.087188720703125, 2.1744384765625, 2.261688232421875, 2.34893798828125, 2.436187744140625, 2.5234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 5.0, 4.0, 9.0, 11.0, 13.0, 20.0, 53.0, 73.0, 78.0, 113.0, 131.0, 141.0, 103.0, 78.0, 59.0, 37.0, 24.0, 16.0, 9.0, 8.0, 8.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.38481330871582, -9.143033981323242, -8.901254653930664, -8.659476280212402, -8.417696952819824, -8.175917625427246, -7.934138774871826, -7.692359924316406, -7.450580596923828, -7.20880126953125, -6.96702241897583, -6.72524356842041, -6.483464241027832, -6.241684913635254, -5.999906063079834, -5.758127212524414, -5.516347885131836, -5.274568557739258, -5.032789707183838, -4.791010856628418, -4.54923152923584, -4.307452201843262, -4.065673351287842, -3.8238942623138428, -3.5821151733398438, -3.3403360843658447, -3.0985569953918457, -2.8567779064178467, -2.6149988174438477, -2.3732197284698486, -2.1314406394958496, -1.8896615505218506, -1.6478829383850098, -1.4061038494110107, -1.1643247604370117, -0.9225456714630127, -0.6807665824890137, -0.43898749351501465, -0.19720840454101562, 0.0445706844329834, 0.2863497734069824, 0.5281288623809814, 0.7699079513549805, 1.0116870403289795, 1.2534661293029785, 1.4952452182769775, 1.7370243072509766, 1.9788033962249756, 2.2205824851989746, 2.4623615741729736, 2.7041406631469727, 2.9459197521209717, 3.1876988410949707, 3.4294779300689697, 3.6712570190429688, 3.9130361080169678, 4.154815196990967, 4.396594047546387, 4.638373374938965, 4.880152702331543, 5.121931552886963, 5.363710403442383, 5.605489730834961, 5.847269058227539, 6.089047908782959]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 6.0, 0.0, 5.0, 5.0, 10.0, 18.0, 11.0, 13.0, 15.0, 17.0, 14.0, 19.0, 34.0, 29.0, 27.0, 29.0, 39.0, 46.0, 48.0, 35.0, 48.0, 41.0, 46.0, 59.0, 32.0, 42.0, 40.0, 25.0, 29.0, 23.0, 25.0, 27.0, 23.0, 25.0, 8.0, 21.0, 15.0, 13.0, 5.0, 4.0, 7.0, 6.0, 2.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.468169212341309, -4.336191177368164, -4.2042131423950195, -4.072235584259033, -3.9402575492858887, -3.808279514312744, -3.6763017177581787, -3.5443239212036133, -3.4123458862304688, -3.280367851257324, -3.148390054702759, -3.0164122581481934, -2.884434223175049, -2.7524561882019043, -2.620478391647339, -2.4885005950927734, -2.356522560119629, -2.2245445251464844, -2.092566728591919, -1.960588812828064, -1.828610897064209, -1.696632981300354, -1.564655065536499, -1.432677149772644, -1.300699234008789, -1.168721318244934, -1.036743402481079, -0.9047654867172241, -0.7727875709533691, -0.6408096551895142, -0.5088317394256592, -0.3768538236618042, -0.24487590789794922, -0.11289799213409424, 0.019079923629760742, 0.15105783939361572, 0.2830357551574707, 0.4150136709213257, 0.5469915866851807, 0.6789695024490356, 0.8109474182128906, 0.9429253339767456, 1.0749032497406006, 1.2068811655044556, 1.3388590812683105, 1.4708369970321655, 1.6028149127960205, 1.7347928285598755, 1.8667707443237305, 1.9987486600875854, 2.1307265758514404, 2.262704372406006, 2.3946824073791504, 2.526660442352295, 2.6586382389068604, 2.790616035461426, 2.9225940704345703, 3.054572105407715, 3.1865499019622803, 3.3185276985168457, 3.4505057334899902, 3.5824837684631348, 3.7144615650177, 3.8464393615722656, 3.97841739654541]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 14.0, 28.0, 30.0, 60.0, 85.0, 133.0, 241.0, 403.0, 866.0, 2433.0, 8934.0, 44627.0, 333967.0, 557354.0, 79466.0, 14204.0, 3426.0, 1113.0, 483.0, 247.0, 156.0, 88.0, 58.0, 46.0, 22.0, 22.0, 11.0, 9.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2353515625, -1.196929931640625, -1.15850830078125, -1.120086669921875, -1.0816650390625, -1.043243408203125, -1.00482177734375, -0.966400146484375, -0.927978515625, -0.889556884765625, -0.85113525390625, -0.812713623046875, -0.7742919921875, -0.735870361328125, -0.69744873046875, -0.659027099609375, -0.62060546875, -0.582183837890625, -0.54376220703125, -0.505340576171875, -0.4669189453125, -0.428497314453125, -0.39007568359375, -0.351654052734375, -0.313232421875, -0.274810791015625, -0.23638916015625, -0.197967529296875, -0.1595458984375, -0.121124267578125, -0.08270263671875, -0.044281005859375, -0.005859375, 0.032562255859375, 0.07098388671875, 0.109405517578125, 0.1478271484375, 0.186248779296875, 0.22467041015625, 0.263092041015625, 0.301513671875, 0.339935302734375, 0.37835693359375, 0.416778564453125, 0.4552001953125, 0.493621826171875, 0.53204345703125, 0.570465087890625, 0.60888671875, 0.647308349609375, 0.68572998046875, 0.724151611328125, 0.7625732421875, 0.800994873046875, 0.83941650390625, 0.877838134765625, 0.916259765625, 0.954681396484375, 0.99310302734375, 1.031524658203125, 1.0699462890625, 1.108367919921875, 1.14678955078125, 1.185211181640625, 1.2236328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 7.0, 9.0, 17.0, 21.0, 14.0, 30.0, 35.0, 33.0, 49.0, 56.0, 46.0, 67.0, 65.0, 64.0, 69.0, 62.0, 59.0, 61.0, 38.0, 39.0, 35.0, 23.0, 23.0, 15.0, 19.0, 9.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-6.32421875, -6.174896240234375, -6.02557373046875, -5.876251220703125, -5.7269287109375, -5.577606201171875, -5.42828369140625, -5.278961181640625, -5.129638671875, -4.980316162109375, -4.83099365234375, -4.681671142578125, -4.5323486328125, -4.383026123046875, -4.23370361328125, -4.084381103515625, -3.93505859375, -3.785736083984375, -3.63641357421875, -3.487091064453125, -3.3377685546875, -3.188446044921875, -3.03912353515625, -2.889801025390625, -2.740478515625, -2.591156005859375, -2.44183349609375, -2.292510986328125, -2.1431884765625, -1.993865966796875, -1.84454345703125, -1.695220947265625, -1.5458984375, -1.396575927734375, -1.24725341796875, -1.097930908203125, -0.9486083984375, -0.799285888671875, -0.64996337890625, -0.500640869140625, -0.351318359375, -0.201995849609375, -0.05267333984375, 0.096649169921875, 0.2459716796875, 0.395294189453125, 0.54461669921875, 0.693939208984375, 0.84326171875, 0.992584228515625, 1.14190673828125, 1.291229248046875, 1.4405517578125, 1.589874267578125, 1.73919677734375, 1.888519287109375, 2.037841796875, 2.187164306640625, 2.33648681640625, 2.485809326171875, 2.6351318359375, 2.784454345703125, 2.93377685546875, 3.083099365234375, 3.232421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 7.0, 18.0, 14.0, 26.0, 23.0, 17.0, 40.0, 34.0, 46.0, 60.0, 73.0, 73.0, 99.0, 117.0, 133.0, 205.0, 280.0, 408.0, 725.0, 2492.0, 15484.0, 172384.0, 731503.0, 109169.0, 10803.0, 1941.0, 676.0, 339.0, 300.0, 218.0, 143.0, 114.0, 113.0, 93.0, 79.0, 67.0, 51.0, 36.0, 33.0, 19.0, 27.0, 14.0, 13.0, 6.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.77685546875, -0.7521209716796875, -0.727386474609375, -0.7026519775390625, -0.67791748046875, -0.6531829833984375, -0.628448486328125, -0.6037139892578125, -0.5789794921875, -0.5542449951171875, -0.529510498046875, -0.5047760009765625, -0.48004150390625, -0.4553070068359375, -0.430572509765625, -0.4058380126953125, -0.381103515625, -0.3563690185546875, -0.331634521484375, -0.3069000244140625, -0.28216552734375, -0.2574310302734375, -0.232696533203125, -0.2079620361328125, -0.1832275390625, -0.1584930419921875, -0.133758544921875, -0.1090240478515625, -0.08428955078125, -0.0595550537109375, -0.034820556640625, -0.0100860595703125, 0.0146484375, 0.0393829345703125, 0.064117431640625, 0.0888519287109375, 0.11358642578125, 0.1383209228515625, 0.163055419921875, 0.1877899169921875, 0.2125244140625, 0.2372589111328125, 0.261993408203125, 0.2867279052734375, 0.31146240234375, 0.3361968994140625, 0.360931396484375, 0.3856658935546875, 0.410400390625, 0.4351348876953125, 0.459869384765625, 0.4846038818359375, 0.50933837890625, 0.5340728759765625, 0.558807373046875, 0.5835418701171875, 0.6082763671875, 0.6330108642578125, 0.657745361328125, 0.6824798583984375, 0.70721435546875, 0.7319488525390625, 0.756683349609375, 0.7814178466796875, 0.80615234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 12.0, 8.0, 16.0, 17.0, 13.0, 20.0, 28.0, 30.0, 23.0, 36.0, 32.0, 46.0, 54.0, 44.0, 50.0, 50.0, 41.0, 61.0, 40.0, 43.0, 49.0, 46.0, 43.0, 24.0, 17.0, 19.0, 15.0, 23.0, 20.0, 15.0, 12.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.320068359375, -6.09716796875, -5.874267578125, -5.6513671875, -5.428466796875, -5.20556640625, -4.982666015625, -4.759765625, -4.536865234375, -4.31396484375, -4.091064453125, -3.8681640625, -3.645263671875, -3.42236328125, -3.199462890625, -2.9765625, -2.753662109375, -2.53076171875, -2.307861328125, -2.0849609375, -1.862060546875, -1.63916015625, -1.416259765625, -1.193359375, -0.970458984375, -0.74755859375, -0.524658203125, -0.3017578125, -0.078857421875, 0.14404296875, 0.366943359375, 0.58984375, 0.812744140625, 1.03564453125, 1.258544921875, 1.4814453125, 1.704345703125, 1.92724609375, 2.150146484375, 2.373046875, 2.595947265625, 2.81884765625, 3.041748046875, 3.2646484375, 3.487548828125, 3.71044921875, 3.933349609375, 4.15625, 4.379150390625, 4.60205078125, 4.824951171875, 5.0478515625, 5.270751953125, 5.49365234375, 5.716552734375, 5.939453125, 6.162353515625, 6.38525390625, 6.608154296875, 6.8310546875, 7.053955078125, 7.27685546875, 7.499755859375, 7.72265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 9.0, 13.0, 24.0, 30.0, 39.0, 74.0, 140.0, 349.0, 1437.0, 136529.0, 907201.0, 1910.0, 408.0, 144.0, 75.0, 51.0, 45.0, 12.0, 19.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39111328125, -0.3776664733886719, -0.36421966552734375, -0.3507728576660156, -0.3373260498046875, -0.3238792419433594, -0.31043243408203125, -0.2969856262207031, -0.283538818359375, -0.2700920104980469, -0.25664520263671875, -0.24319839477539062, -0.2297515869140625, -0.21630477905273438, -0.20285797119140625, -0.18941116333007812, -0.17596435546875, -0.16251754760742188, -0.14907073974609375, -0.13562393188476562, -0.1221771240234375, -0.10873031616210938, -0.09528350830078125, -0.08183670043945312, -0.068389892578125, -0.054943084716796875, -0.04149627685546875, -0.028049468994140625, -0.0146026611328125, -0.001155853271484375, 0.01229095458984375, 0.025737762451171875, 0.0391845703125, 0.052631378173828125, 0.06607818603515625, 0.07952499389648438, 0.0929718017578125, 0.10641860961914062, 0.11986541748046875, 0.13331222534179688, 0.146759033203125, 0.16020584106445312, 0.17365264892578125, 0.18709945678710938, 0.2005462646484375, 0.21399307250976562, 0.22743988037109375, 0.24088668823242188, 0.25433349609375, 0.2677803039550781, 0.28122711181640625, 0.2946739196777344, 0.3081207275390625, 0.3215675354003906, 0.33501434326171875, 0.3484611511230469, 0.361907958984375, 0.3753547668457031, 0.38880157470703125, 0.4022483825683594, 0.4156951904296875, 0.4291419982910156, 0.44258880615234375, 0.4560356140136719, 0.469482421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 14.0, 10.0, 26.0, 35.0, 37.0, 55.0, 50.0, 82.0, 98.0, 98.0, 108.0, 85.0, 84.0, 38.0, 44.0, 40.0, 32.0, 13.0, 7.0, 11.0, 3.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.857778549194336e-05, -4.6426430344581604e-05, -4.427507519721985e-05, -4.212372004985809e-05, -3.997236490249634e-05, -3.782100975513458e-05, -3.566965460777283e-05, -3.351829946041107e-05, -3.1366944313049316e-05, -2.921558916568756e-05, -2.7064234018325806e-05, -2.491287887096405e-05, -2.2761523723602295e-05, -2.061016857624054e-05, -1.8458813428878784e-05, -1.630745828151703e-05, -1.4156103134155273e-05, -1.2004747986793518e-05, -9.853392839431763e-06, -7.702037692070007e-06, -5.550682544708252e-06, -3.3993273973464966e-06, -1.2479722499847412e-06, 9.033828973770142e-07, 3.0547380447387695e-06, 5.206093192100525e-06, 7.35744833946228e-06, 9.508803486824036e-06, 1.1660158634185791e-05, 1.3811513781547546e-05, 1.5962868928909302e-05, 1.8114224076271057e-05, 2.0265579223632812e-05, 2.2416934370994568e-05, 2.4568289518356323e-05, 2.671964466571808e-05, 2.8870999813079834e-05, 3.102235496044159e-05, 3.3173710107803345e-05, 3.53250652551651e-05, 3.7476420402526855e-05, 3.962777554988861e-05, 4.1779130697250366e-05, 4.393048584461212e-05, 4.608184099197388e-05, 4.823319613933563e-05, 5.038455128669739e-05, 5.253590643405914e-05, 5.46872615814209e-05, 5.6838616728782654e-05, 5.898997187614441e-05, 6.114132702350616e-05, 6.329268217086792e-05, 6.544403731822968e-05, 6.759539246559143e-05, 6.974674761295319e-05, 7.189810276031494e-05, 7.40494579076767e-05, 7.620081305503845e-05, 7.835216820240021e-05, 8.050352334976196e-05, 8.265487849712372e-05, 8.480623364448547e-05, 8.695758879184723e-05, 8.910894393920898e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 10.0, 27.0, 30.0, 57.0, 109.0, 427.0, 10678.0, 1033168.0, 3550.0, 257.0, 83.0, 38.0, 34.0, 15.0, 5.0, 6.0, 7.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2236328125, -1.19000244140625, -1.1563720703125, -1.12274169921875, -1.089111328125, -1.05548095703125, -1.0218505859375, -0.98822021484375, -0.95458984375, -0.92095947265625, -0.8873291015625, -0.85369873046875, -0.820068359375, -0.78643798828125, -0.7528076171875, -0.71917724609375, -0.685546875, -0.65191650390625, -0.6182861328125, -0.58465576171875, -0.551025390625, -0.51739501953125, -0.4837646484375, -0.45013427734375, -0.41650390625, -0.38287353515625, -0.3492431640625, -0.31561279296875, -0.281982421875, -0.24835205078125, -0.2147216796875, -0.18109130859375, -0.1474609375, -0.11383056640625, -0.0802001953125, -0.04656982421875, -0.012939453125, 0.02069091796875, 0.0543212890625, 0.08795166015625, 0.12158203125, 0.15521240234375, 0.1888427734375, 0.22247314453125, 0.256103515625, 0.28973388671875, 0.3233642578125, 0.35699462890625, 0.390625, 0.42425537109375, 0.4578857421875, 0.49151611328125, 0.525146484375, 0.55877685546875, 0.5924072265625, 0.62603759765625, 0.65966796875, 0.69329833984375, 0.7269287109375, 0.76055908203125, 0.794189453125, 0.82781982421875, 0.8614501953125, 0.89508056640625, 0.9287109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 10.0, 15.0, 29.0, 39.0, 66.0, 111.0, 125.0, 231.0, 120.0, 74.0, 56.0, 31.0, 17.0, 12.0, 6.0, 8.0, 3.0, 5.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07989501953125, -0.0776987075805664, -0.07550239562988281, -0.07330608367919922, -0.07110977172851562, -0.06891345977783203, -0.06671714782714844, -0.06452083587646484, -0.06232452392578125, -0.060128211975097656, -0.05793190002441406, -0.05573558807373047, -0.053539276123046875, -0.05134296417236328, -0.04914665222167969, -0.046950340270996094, -0.0447540283203125, -0.042557716369628906, -0.04036140441894531, -0.03816509246826172, -0.035968780517578125, -0.03377246856689453, -0.03157615661621094, -0.029379844665527344, -0.02718353271484375, -0.024987220764160156, -0.022790908813476562, -0.02059459686279297, -0.018398284912109375, -0.01620197296142578, -0.014005661010742188, -0.011809349060058594, -0.009613037109375, -0.007416725158691406, -0.0052204132080078125, -0.0030241012573242188, -0.000827789306640625, 0.0013685226440429688, 0.0035648345947265625, 0.005761146545410156, 0.00795745849609375, 0.010153770446777344, 0.012350082397460938, 0.014546394348144531, 0.016742706298828125, 0.01893901824951172, 0.021135330200195312, 0.023331642150878906, 0.0255279541015625, 0.027724266052246094, 0.029920578002929688, 0.03211688995361328, 0.034313201904296875, 0.03650951385498047, 0.03870582580566406, 0.040902137756347656, 0.04309844970703125, 0.045294761657714844, 0.04749107360839844, 0.04968738555908203, 0.051883697509765625, 0.05408000946044922, 0.05627632141113281, 0.058472633361816406, 0.0606689453125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 10.0, 22.0, 60.0, 125.0, 197.0, 220.0, 158.0, 102.0, 47.0, 15.0, 8.0, 8.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.618609428405762, -11.289319038391113, -10.960028648376465, -10.630738258361816, -10.301447868347168, -9.97215747833252, -9.642867088317871, -9.313577651977539, -8.98428726196289, -8.654996871948242, -8.325706481933594, -7.996416091918945, -7.667125701904297, -7.337835311889648, -7.008545398712158, -6.67925500869751, -6.349964141845703, -6.020673751831055, -5.691383361816406, -5.362092971801758, -5.032802581787109, -4.703512191772461, -4.374222278594971, -4.044931888580322, -3.715641498565674, -3.3863511085510254, -3.057060718536377, -2.7277705669403076, -2.398480176925659, -2.0691897869110107, -1.7398995161056519, -1.410609245300293, -1.0813179016113281, -0.7520275712013245, -0.4227372407913208, -0.09344691038131714, 0.23584342002868652, 0.565133810043335, 0.8944240808486938, 1.2237143516540527, 1.5530047416687012, 1.8822951316833496, 2.211585521697998, 2.5408756732940674, 2.870166063308716, 3.1994564533233643, 3.5287466049194336, 3.858036994934082, 4.1873273849487305, 4.516617774963379, 4.845908164978027, 5.175198554992676, 5.504488945007324, 5.833779335021973, 6.163069248199463, 6.492359638214111, 6.82165002822876, 7.150940418243408, 7.480230808258057, 7.809521198272705, 8.138811111450195, 8.468101501464844, 8.797391891479492, 9.12668228149414, 9.455972671508789]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 19.0, 17.0, 19.0, 25.0, 33.0, 37.0, 50.0, 54.0, 69.0, 77.0, 62.0, 80.0, 80.0, 66.0, 48.0, 37.0, 41.0, 44.0, 32.0, 28.0, 20.0, 6.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.2737016677856445, -6.120598793029785, -5.967495918273926, -5.814392566680908, -5.661289691925049, -5.5081868171691895, -5.35508394241333, -5.2019805908203125, -5.048877716064453, -4.895774841308594, -4.742671966552734, -4.589568614959717, -4.436465740203857, -4.283362865447998, -4.130259990692139, -3.9771568775177, -3.824054002761841, -3.6709511280059814, -3.517848014831543, -3.3647451400756836, -3.211642026901245, -3.0585391521453857, -2.9054360389709473, -2.752333164215088, -2.5992302894592285, -2.446127414703369, -2.2930243015289307, -2.1399214267730713, -1.9868183135986328, -1.8337154388427734, -1.6806124448776245, -1.5275094509124756, -1.374406099319458, -1.221303105354309, -1.0682001113891602, -0.915097177028656, -0.7619941830635071, -0.6088911890983582, -0.455788254737854, -0.3026852607727051, -0.14958226680755615, 0.0035207122564315796, 0.1566236913204193, 0.30972665548324585, 0.4628296494483948, 0.6159326434135437, 0.7690355777740479, 0.9221385717391968, 1.0752415657043457, 1.2283445596694946, 1.3814475536346436, 1.534550428390503, 1.6876535415649414, 1.8407564163208008, 1.9938594102859497, 2.1469624042510986, 2.300065517425537, 2.4531683921813965, 2.606271505355835, 2.7593743801116943, 2.912477493286133, 3.065580368041992, 3.2186832427978516, 3.37178635597229, 3.5248892307281494]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 18.0, 15.0, 22.0, 52.0, 97.0, 159.0, 314.0, 562.0, 1073.0, 2124.0, 4714.0, 11488.0, 32148.0, 122632.0, 522296.0, 262699.0, 57124.0, 17839.0, 7006.0, 3025.0, 1451.0, 718.0, 419.0, 215.0, 117.0, 68.0, 49.0, 28.0, 13.0, 13.0, 11.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.669921875, -2.588348388671875, -2.50677490234375, -2.425201416015625, -2.3436279296875, -2.262054443359375, -2.18048095703125, -2.098907470703125, -2.017333984375, -1.935760498046875, -1.85418701171875, -1.772613525390625, -1.6910400390625, -1.609466552734375, -1.52789306640625, -1.446319580078125, -1.36474609375, -1.283172607421875, -1.20159912109375, -1.120025634765625, -1.0384521484375, -0.956878662109375, -0.87530517578125, -0.793731689453125, -0.712158203125, -0.630584716796875, -0.54901123046875, -0.467437744140625, -0.3858642578125, -0.304290771484375, -0.22271728515625, -0.141143798828125, -0.0595703125, 0.022003173828125, 0.10357666015625, 0.185150146484375, 0.2667236328125, 0.348297119140625, 0.42987060546875, 0.511444091796875, 0.593017578125, 0.674591064453125, 0.75616455078125, 0.837738037109375, 0.9193115234375, 1.000885009765625, 1.08245849609375, 1.164031982421875, 1.24560546875, 1.327178955078125, 1.40875244140625, 1.490325927734375, 1.5718994140625, 1.653472900390625, 1.73504638671875, 1.816619873046875, 1.898193359375, 1.979766845703125, 2.06134033203125, 2.142913818359375, 2.2244873046875, 2.306060791015625, 2.38763427734375, 2.469207763671875, 2.55078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 9.0, 6.0, 8.0, 12.0, 17.0, 19.0, 29.0, 47.0, 53.0, 54.0, 73.0, 87.0, 84.0, 71.0, 85.0, 62.0, 55.0, 49.0, 40.0, 36.0, 26.0, 32.0, 15.0, 13.0, 8.0, 8.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -19.034912109375, -18.50732421875, -17.979736328125, -17.4521484375, -16.924560546875, -16.39697265625, -15.869384765625, -15.341796875, -14.814208984375, -14.28662109375, -13.759033203125, -13.2314453125, -12.703857421875, -12.17626953125, -11.648681640625, -11.12109375, -10.593505859375, -10.06591796875, -9.538330078125, -9.0107421875, -8.483154296875, -7.95556640625, -7.427978515625, -6.900390625, -6.372802734375, -5.84521484375, -5.317626953125, -4.7900390625, -4.262451171875, -3.73486328125, -3.207275390625, -2.6796875, -2.152099609375, -1.62451171875, -1.096923828125, -0.5693359375, -0.041748046875, 0.48583984375, 1.013427734375, 1.541015625, 2.068603515625, 2.59619140625, 3.123779296875, 3.6513671875, 4.178955078125, 4.70654296875, 5.234130859375, 5.76171875, 6.289306640625, 6.81689453125, 7.344482421875, 7.8720703125, 8.399658203125, 8.92724609375, 9.454833984375, 9.982421875, 10.510009765625, 11.03759765625, 11.565185546875, 12.0927734375, 12.620361328125, 13.14794921875, 13.675537109375, 14.203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 9.0, 9.0, 13.0, 35.0, 25.0, 42.0, 63.0, 96.0, 219.0, 697.0, 25221.0, 1018636.0, 2620.0, 376.0, 160.0, 99.0, 62.0, 37.0, 40.0, 18.0, 24.0, 15.0, 11.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.0625, -16.359375, -15.65625, -14.953125, -14.25, -13.546875, -12.84375, -12.140625, -11.4375, -10.734375, -10.03125, -9.328125, -8.625, -7.921875, -7.21875, -6.515625, -5.8125, -5.109375, -4.40625, -3.703125, -3.0, -2.296875, -1.59375, -0.890625, -0.1875, 0.515625, 1.21875, 1.921875, 2.625, 3.328125, 4.03125, 4.734375, 5.4375, 6.140625, 6.84375, 7.546875, 8.25, 8.953125, 9.65625, 10.359375, 11.0625, 11.765625, 12.46875, 13.171875, 13.875, 14.578125, 15.28125, 15.984375, 16.6875, 17.390625, 18.09375, 18.796875, 19.5, 20.203125, 20.90625, 21.609375, 22.3125, 23.015625, 23.71875, 24.421875, 25.125, 25.828125, 26.53125, 27.234375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 2.0, 4.0, 6.0, 6.0, 16.0, 8.0, 10.0, 13.0, 16.0, 18.0, 24.0, 28.0, 33.0, 35.0, 24.0, 40.0, 51.0, 42.0, 46.0, 47.0, 35.0, 30.0, 38.0, 30.0, 34.0, 44.0, 28.0, 28.0, 33.0, 20.0, 35.0, 33.0, 15.0, 18.0, 19.0, 10.0, 7.0, 19.0, 7.0, 10.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.484375, -8.189208984375, -7.89404296875, -7.598876953125, -7.3037109375, -7.008544921875, -6.71337890625, -6.418212890625, -6.123046875, -5.827880859375, -5.53271484375, -5.237548828125, -4.9423828125, -4.647216796875, -4.35205078125, -4.056884765625, -3.76171875, -3.466552734375, -3.17138671875, -2.876220703125, -2.5810546875, -2.285888671875, -1.99072265625, -1.695556640625, -1.400390625, -1.105224609375, -0.81005859375, -0.514892578125, -0.2197265625, 0.075439453125, 0.37060546875, 0.665771484375, 0.9609375, 1.256103515625, 1.55126953125, 1.846435546875, 2.1416015625, 2.436767578125, 2.73193359375, 3.027099609375, 3.322265625, 3.617431640625, 3.91259765625, 4.207763671875, 4.5029296875, 4.798095703125, 5.09326171875, 5.388427734375, 5.68359375, 5.978759765625, 6.27392578125, 6.569091796875, 6.8642578125, 7.159423828125, 7.45458984375, 7.749755859375, 8.044921875, 8.340087890625, 8.63525390625, 8.930419921875, 9.2255859375, 9.520751953125, 9.81591796875, 10.111083984375, 10.40625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 9.0, 7.0, 6.0, 17.0, 20.0, 30.0, 66.0, 135.0, 376.0, 1338.0, 8068.0, 203800.0, 819380.0, 12747.0, 1745.0, 465.0, 148.0, 80.0, 35.0, 36.0, 9.0, 12.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9208526611328125, -1.866119384765625, -1.8113861083984375, -1.75665283203125, -1.7019195556640625, -1.647186279296875, -1.5924530029296875, -1.5377197265625, -1.4829864501953125, -1.428253173828125, -1.3735198974609375, -1.31878662109375, -1.2640533447265625, -1.209320068359375, -1.1545867919921875, -1.099853515625, -1.0451202392578125, -0.990386962890625, -0.9356536865234375, -0.88092041015625, -0.8261871337890625, -0.771453857421875, -0.7167205810546875, -0.6619873046875, -0.6072540283203125, -0.552520751953125, -0.4977874755859375, -0.44305419921875, -0.3883209228515625, -0.333587646484375, -0.2788543701171875, -0.22412109375, -0.1693878173828125, -0.114654541015625, -0.0599212646484375, -0.00518798828125, 0.0495452880859375, 0.104278564453125, 0.1590118408203125, 0.2137451171875, 0.2684783935546875, 0.323211669921875, 0.3779449462890625, 0.43267822265625, 0.4874114990234375, 0.542144775390625, 0.5968780517578125, 0.651611328125, 0.7063446044921875, 0.761077880859375, 0.8158111572265625, 0.87054443359375, 0.9252777099609375, 0.980010986328125, 1.0347442626953125, 1.0894775390625, 1.1442108154296875, 1.198944091796875, 1.2536773681640625, 1.30841064453125, 1.3631439208984375, 1.417877197265625, 1.4726104736328125, 1.52734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 9.0, 7.0, 6.0, 6.0, 11.0, 23.0, 29.0, 41.0, 74.0, 131.0, 281.0, 155.0, 71.0, 53.0, 25.0, 13.0, 13.0, 12.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018715858459472656, -0.0001813843846321106, -0.00017561018466949463, -0.00016983598470687866, -0.0001640617847442627, -0.00015828758478164673, -0.00015251338481903076, -0.0001467391848564148, -0.00014096498489379883, -0.00013519078493118286, -0.0001294165849685669, -0.00012364238500595093, -0.00011786818504333496, -0.000112093985080719, -0.00010631978511810303, -0.00010054558515548706, -9.47713851928711e-05, -8.899718523025513e-05, -8.322298526763916e-05, -7.74487853050232e-05, -7.167458534240723e-05, -6.590038537979126e-05, -6.012618541717529e-05, -5.4351985454559326e-05, -4.857778549194336e-05, -4.280358552932739e-05, -3.7029385566711426e-05, -3.125518560409546e-05, -2.5480985641479492e-05, -1.9706785678863525e-05, -1.3932585716247559e-05, -8.158385753631592e-06, -2.384185791015625e-06, 3.390014171600342e-06, 9.164214134216309e-06, 1.4938414096832275e-05, 2.0712614059448242e-05, 2.648681402206421e-05, 3.2261013984680176e-05, 3.803521394729614e-05, 4.380941390991211e-05, 4.9583613872528076e-05, 5.535781383514404e-05, 6.113201379776001e-05, 6.690621376037598e-05, 7.268041372299194e-05, 7.845461368560791e-05, 8.422881364822388e-05, 9.000301361083984e-05, 9.577721357345581e-05, 0.00010155141353607178, 0.00010732561349868774, 0.00011309981346130371, 0.00011887401342391968, 0.00012464821338653564, 0.0001304224133491516, 0.00013619661331176758, 0.00014197081327438354, 0.0001477450132369995, 0.00015351921319961548, 0.00015929341316223145, 0.0001650676131248474, 0.00017084181308746338, 0.00017661601305007935, 0.0001823902130126953]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 10.0, 6.0, 4.0, 14.0, 19.0, 48.0, 99.0, 233.0, 934.0, 7767.0, 814192.0, 218738.0, 5312.0, 770.0, 194.0, 91.0, 38.0, 26.0, 9.0, 10.0, 8.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.069793701171875, -2.00286865234375, -1.935943603515625, -1.8690185546875, -1.802093505859375, -1.73516845703125, -1.668243408203125, -1.601318359375, -1.534393310546875, -1.46746826171875, -1.400543212890625, -1.3336181640625, -1.266693115234375, -1.19976806640625, -1.132843017578125, -1.06591796875, -0.998992919921875, -0.93206787109375, -0.865142822265625, -0.7982177734375, -0.731292724609375, -0.66436767578125, -0.597442626953125, -0.530517578125, -0.463592529296875, -0.39666748046875, -0.329742431640625, -0.2628173828125, -0.195892333984375, -0.12896728515625, -0.062042236328125, 0.0048828125, 0.071807861328125, 0.13873291015625, 0.205657958984375, 0.2725830078125, 0.339508056640625, 0.40643310546875, 0.473358154296875, 0.540283203125, 0.607208251953125, 0.67413330078125, 0.741058349609375, 0.8079833984375, 0.874908447265625, 0.94183349609375, 1.008758544921875, 1.07568359375, 1.142608642578125, 1.20953369140625, 1.276458740234375, 1.3433837890625, 1.410308837890625, 1.47723388671875, 1.544158935546875, 1.611083984375, 1.678009033203125, 1.74493408203125, 1.811859130859375, 1.8787841796875, 1.945709228515625, 2.01263427734375, 2.079559326171875, 2.146484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 8.0, 11.0, 21.0, 28.0, 37.0, 55.0, 98.0, 373.0, 126.0, 65.0, 53.0, 24.0, 13.0, 18.0, 8.0, 12.0, 11.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.39269256591796875, -0.3798675537109375, -0.36704254150390625, -0.354217529296875, -0.34139251708984375, -0.3285675048828125, -0.31574249267578125, -0.30291748046875, -0.29009246826171875, -0.2772674560546875, -0.26444244384765625, -0.251617431640625, -0.23879241943359375, -0.2259674072265625, -0.21314239501953125, -0.2003173828125, -0.18749237060546875, -0.1746673583984375, -0.16184234619140625, -0.149017333984375, -0.13619232177734375, -0.1233673095703125, -0.11054229736328125, -0.09771728515625, -0.08489227294921875, -0.0720672607421875, -0.05924224853515625, -0.046417236328125, -0.03359222412109375, -0.0207672119140625, -0.00794219970703125, 0.0048828125, 0.01770782470703125, 0.0305328369140625, 0.04335784912109375, 0.056182861328125, 0.06900787353515625, 0.0818328857421875, 0.09465789794921875, 0.10748291015625, 0.12030792236328125, 0.1331329345703125, 0.14595794677734375, 0.158782958984375, 0.17160797119140625, 0.1844329833984375, 0.19725799560546875, 0.2100830078125, 0.22290802001953125, 0.2357330322265625, 0.24855804443359375, 0.261383056640625, 0.27420806884765625, 0.2870330810546875, 0.29985809326171875, 0.31268310546875, 0.32550811767578125, 0.3383331298828125, 0.35115814208984375, 0.363983154296875, 0.37680816650390625, 0.3896331787109375, 0.40245819091796875, 0.415283203125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 44.0, 778.0, 181.0, 10.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96755313873291, -10.187633514404297, -7.40771484375, -4.627795219421387, -1.8478765487670898, 0.932042121887207, 3.7119626998901367, 6.491881370544434, 9.27180004119873, 12.051719665527344, 14.83163833618164, 17.611557006835938, 20.391475677490234, 23.17139434814453, 25.951316833496094, 28.73123550415039, 31.511154174804688, 34.291072845458984, 37.07099151611328, 39.850914001464844, 42.630828857421875, 45.41075134277344, 48.190670013427734, 50.97058868408203, 53.75050735473633, 56.530426025390625, 59.31034469604492, 62.09026336669922, 64.87018585205078, 67.65010070800781, 70.43002319335938, 73.20994567871094, 75.98985290527344, 78.769775390625, 81.54969024658203, 84.3296127319336, 87.10952758789062, 89.88945007324219, 92.66937255859375, 95.44928741455078, 98.22920227050781, 101.00912475585938, 103.7890396118164, 106.56896209716797, 109.348876953125, 112.12879943847656, 114.90872192382812, 117.68863677978516, 120.46855926513672, 123.24848175048828, 126.02839660644531, 128.80831909179688, 131.58824157714844, 134.36814880371094, 137.1480712890625, 139.92799377441406, 142.70791625976562, 145.4878387451172, 148.26776123046875, 151.04766845703125, 153.8275909423828, 156.60751342773438, 159.38743591308594, 162.1673583984375, 164.947265625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 10.0, 6.0, 5.0, 17.0, 10.0, 15.0, 19.0, 21.0, 22.0, 27.0, 43.0, 40.0, 36.0, 28.0, 40.0, 35.0, 45.0, 60.0, 47.0, 49.0, 54.0, 40.0, 39.0, 51.0, 42.0, 29.0, 31.0, 27.0, 22.0, 15.0, 18.0, 15.0, 12.0, 9.0, 3.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.840543746948242, -17.29367446899414, -16.746807098388672, -16.19993782043457, -15.653068542480469, -15.106199264526367, -14.559330940246582, -14.012462615966797, -13.465593338012695, -12.918724060058594, -12.371855735778809, -11.824987411499023, -11.278118133544922, -10.73124885559082, -10.184380531311035, -9.63751220703125, -9.090642929077148, -8.543773651123047, -7.996905326843262, -7.450036525726318, -6.903167724609375, -6.356298923492432, -5.809430122375488, -5.262561321258545, -4.715692520141602, -4.168823719024658, -3.621954917907715, -3.0750861167907715, -2.528217315673828, -1.9813485145568848, -1.4344797134399414, -0.887610912322998, -0.3407402038574219, 0.20612859725952148, 0.7529973983764648, 1.2998661994934082, 1.8467350006103516, 2.393603801727295, 2.9404726028442383, 3.4873414039611816, 4.034210205078125, 4.581079006195068, 5.127947807312012, 5.674816608428955, 6.221685409545898, 6.768554210662842, 7.315423011779785, 7.8622918128967285, 8.409160614013672, 8.956029891967773, 9.502898216247559, 10.049766540527344, 10.596635818481445, 11.143505096435547, 11.690373420715332, 12.237241744995117, 12.784111022949219, 13.33098030090332, 13.877848625183105, 14.42471694946289, 14.971586227416992, 15.518455505371094, 16.065322875976562, 16.612192153930664, 17.159061431884766]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 8.0, 7.0, 6.0, 5.0, 14.0, 13.0, 18.0, 22.0, 31.0, 39.0, 47.0, 83.0, 128.0, 259.0, 509.0, 1387.0, 4100.0, 15033.0, 80942.0, 1408435.0, 2547408.0, 107887.0, 19495.0, 5254.0, 1755.0, 648.0, 317.0, 136.0, 76.0, 47.0, 33.0, 32.0, 32.0, 14.0, 8.0, 8.0, 8.0, 8.0, 11.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.13671875, -5.95660400390625, -5.7764892578125, -5.59637451171875, -5.416259765625, -5.23614501953125, -5.0560302734375, -4.87591552734375, -4.69580078125, -4.51568603515625, -4.3355712890625, -4.15545654296875, -3.975341796875, -3.79522705078125, -3.6151123046875, -3.43499755859375, -3.2548828125, -3.07476806640625, -2.8946533203125, -2.71453857421875, -2.534423828125, -2.35430908203125, -2.1741943359375, -1.99407958984375, -1.81396484375, -1.63385009765625, -1.4537353515625, -1.27362060546875, -1.093505859375, -0.91339111328125, -0.7332763671875, -0.55316162109375, -0.373046875, -0.19293212890625, -0.0128173828125, 0.16729736328125, 0.347412109375, 0.52752685546875, 0.7076416015625, 0.88775634765625, 1.06787109375, 1.24798583984375, 1.4281005859375, 1.60821533203125, 1.788330078125, 1.96844482421875, 2.1485595703125, 2.32867431640625, 2.5087890625, 2.68890380859375, 2.8690185546875, 3.04913330078125, 3.229248046875, 3.40936279296875, 3.5894775390625, 3.76959228515625, 3.94970703125, 4.12982177734375, 4.3099365234375, 4.49005126953125, 4.670166015625, 4.85028076171875, 5.0303955078125, 5.21051025390625, 5.390625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 11.0, 13.0, 25.0, 29.0, 39.0, 45.0, 64.0, 84.0, 72.0, 90.0, 100.0, 88.0, 94.0, 65.0, 55.0, 39.0, 27.0, 17.0, 17.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5, -8.310943603515625, -8.12188720703125, -7.932830810546875, -7.7437744140625, -7.554718017578125, -7.36566162109375, -7.176605224609375, -6.987548828125, -6.798492431640625, -6.60943603515625, -6.420379638671875, -6.2313232421875, -6.042266845703125, -5.85321044921875, -5.664154052734375, -5.47509765625, -5.286041259765625, -5.09698486328125, -4.907928466796875, -4.7188720703125, -4.529815673828125, -4.34075927734375, -4.151702880859375, -3.962646484375, -3.773590087890625, -3.58453369140625, -3.395477294921875, -3.2064208984375, -3.017364501953125, -2.82830810546875, -2.639251708984375, -2.4501953125, -2.261138916015625, -2.07208251953125, -1.883026123046875, -1.6939697265625, -1.504913330078125, -1.31585693359375, -1.126800537109375, -0.937744140625, -0.748687744140625, -0.55963134765625, -0.370574951171875, -0.1815185546875, 0.007537841796875, 0.19659423828125, 0.385650634765625, 0.57470703125, 0.763763427734375, 0.95281982421875, 1.141876220703125, 1.3309326171875, 1.519989013671875, 1.70904541015625, 1.898101806640625, 2.087158203125, 2.276214599609375, 2.46527099609375, 2.654327392578125, 2.8433837890625, 3.032440185546875, 3.22149658203125, 3.410552978515625, 3.599609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 9.0, 12.0, 19.0, 40.0, 105.0, 208.0, 1041.0, 4173731.0, 18334.0, 437.0, 146.0, 79.0, 43.0, 35.0, 12.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.82275390625, -47.3330078125, -45.84326171875, -44.353515625, -42.86376953125, -41.3740234375, -39.88427734375, -38.39453125, -36.90478515625, -35.4150390625, -33.92529296875, -32.435546875, -30.94580078125, -29.4560546875, -27.96630859375, -26.4765625, -24.98681640625, -23.4970703125, -22.00732421875, -20.517578125, -19.02783203125, -17.5380859375, -16.04833984375, -14.55859375, -13.06884765625, -11.5791015625, -10.08935546875, -8.599609375, -7.10986328125, -5.6201171875, -4.13037109375, -2.640625, -1.15087890625, 0.3388671875, 1.82861328125, 3.318359375, 4.80810546875, 6.2978515625, 7.78759765625, 9.27734375, 10.76708984375, 12.2568359375, 13.74658203125, 15.236328125, 16.72607421875, 18.2158203125, 19.70556640625, 21.1953125, 22.68505859375, 24.1748046875, 25.66455078125, 27.154296875, 28.64404296875, 30.1337890625, 31.62353515625, 33.11328125, 34.60302734375, 36.0927734375, 37.58251953125, 39.072265625, 40.56201171875, 42.0517578125, 43.54150390625, 45.03125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 6.0, 11.0, 17.0, 39.0, 56.0, 94.0, 136.0, 320.0, 827.0, 1428.0, 536.0, 253.0, 119.0, 67.0, 49.0, 40.0, 27.0, 10.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9691314697265625, -1.914825439453125, -1.8605194091796875, -1.80621337890625, -1.7519073486328125, -1.697601318359375, -1.6432952880859375, -1.5889892578125, -1.5346832275390625, -1.480377197265625, -1.4260711669921875, -1.37176513671875, -1.3174591064453125, -1.263153076171875, -1.2088470458984375, -1.154541015625, -1.1002349853515625, -1.045928955078125, -0.9916229248046875, -0.93731689453125, -0.8830108642578125, -0.828704833984375, -0.7743988037109375, -0.7200927734375, -0.6657867431640625, -0.611480712890625, -0.5571746826171875, -0.50286865234375, -0.4485626220703125, -0.394256591796875, -0.3399505615234375, -0.28564453125, -0.2313385009765625, -0.177032470703125, -0.1227264404296875, -0.06842041015625, -0.0141143798828125, 0.040191650390625, 0.0944976806640625, 0.1488037109375, 0.2031097412109375, 0.257415771484375, 0.3117218017578125, 0.36602783203125, 0.4203338623046875, 0.474639892578125, 0.5289459228515625, 0.583251953125, 0.6375579833984375, 0.691864013671875, 0.7461700439453125, 0.80047607421875, 0.8547821044921875, 0.909088134765625, 0.9633941650390625, 1.0177001953125, 1.0720062255859375, 1.126312255859375, 1.1806182861328125, 1.23492431640625, 1.2892303466796875, 1.343536376953125, 1.3978424072265625, 1.4521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 9.0, 27.0, 36.0, 104.0, 222.0, 253.0, 175.0, 81.0, 46.0, 14.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.656396865844727, -11.24353313446045, -10.830670356750488, -10.417806625366211, -10.004942893981934, -9.592079162597656, -9.179216384887695, -8.766352653503418, -8.35348892211914, -7.9406256675720215, -7.527761936187744, -7.114898681640625, -6.702034950256348, -6.2891716957092285, -5.876308441162109, -5.463444709777832, -5.050581932067871, -4.637718677520752, -4.224854946136475, -3.8119916915893555, -3.3991281986236572, -2.986264705657959, -2.57340145111084, -2.1605379581451416, -1.7476744651794434, -1.3348109722137451, -0.9219475984573364, -0.5090842247009277, -0.09622073173522949, 0.31664276123046875, 0.7295060157775879, 1.1423695087432861, 1.5552330017089844, 1.9680964946746826, 2.380959987640381, 2.7938232421875, 3.2066867351531982, 3.6195502281188965, 4.032413482666016, 4.445277214050293, 4.858140468597412, 5.271003723144531, 5.683867454528809, 6.096730709075928, 6.509593963623047, 6.922457695007324, 7.335320949554443, 7.7481842041015625, 8.16104793548584, 8.573911666870117, 8.986774444580078, 9.399638175964355, 9.812501907348633, 10.225364685058594, 10.638228416442871, 11.051092147827148, 11.46395492553711, 11.876818656921387, 12.289681434631348, 12.702545166015625, 13.115408897399902, 13.52827262878418, 13.94113540649414, 14.353999137878418, 14.766862869262695]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 12.0, 12.0, 8.0, 15.0, 26.0, 35.0, 55.0, 58.0, 71.0, 69.0, 79.0, 65.0, 90.0, 84.0, 70.0, 58.0, 44.0, 39.0, 27.0, 22.0, 17.0, 15.0, 5.0, 10.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.451784610748291, -7.277875900268555, -7.103967189788818, -6.930058479309082, -6.7561492919921875, -6.582240581512451, -6.408331871032715, -6.2344231605529785, -6.060514450073242, -5.886605739593506, -5.7126970291137695, -5.538787841796875, -5.364879131317139, -5.190970420837402, -5.017061710357666, -4.84315299987793, -4.669243812561035, -4.495335102081299, -4.3214263916015625, -4.147517204284668, -3.9736084938049316, -3.7996997833251953, -3.625791072845459, -3.4518823623657227, -3.2779734134674072, -3.104064702987671, -2.9301557540893555, -2.756247043609619, -2.582338333129883, -2.4084293842315674, -2.234520673751831, -2.0606117248535156, -1.8867030143737793, -1.7127941846847534, -1.5388853549957275, -1.3649766445159912, -1.1910678148269653, -1.0171589851379395, -0.8432502746582031, -0.6693414449691772, -0.49543261528015137, -0.3215238153934479, -0.14761501550674438, 0.02629375457763672, 0.2002025842666626, 0.3741114139556885, 0.5480201244354248, 0.7219289541244507, 0.8958377838134766, 1.0697466135025024, 1.2436554431915283, 1.4175641536712646, 1.5914729833602905, 1.7653818130493164, 1.9392905235290527, 2.113199234008789, 2.2871081829071045, 2.461016893386841, 2.6349258422851562, 2.8088345527648926, 2.982743263244629, 3.1566522121429443, 3.3305609226226807, 3.504469871520996, 3.6783785820007324]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 14.0, 34.0, 48.0, 88.0, 153.0, 324.0, 640.0, 1421.0, 5328.0, 80386.0, 918648.0, 35488.0, 3666.0, 1162.0, 545.0, 282.0, 143.0, 69.0, 41.0, 27.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.716796875, -1.66961669921875, -1.6224365234375, -1.57525634765625, -1.528076171875, -1.48089599609375, -1.4337158203125, -1.38653564453125, -1.33935546875, -1.29217529296875, -1.2449951171875, -1.19781494140625, -1.150634765625, -1.10345458984375, -1.0562744140625, -1.00909423828125, -0.9619140625, -0.91473388671875, -0.8675537109375, -0.82037353515625, -0.773193359375, -0.72601318359375, -0.6788330078125, -0.63165283203125, -0.58447265625, -0.53729248046875, -0.4901123046875, -0.44293212890625, -0.395751953125, -0.34857177734375, -0.3013916015625, -0.25421142578125, -0.20703125, -0.15985107421875, -0.1126708984375, -0.06549072265625, -0.018310546875, 0.02886962890625, 0.0760498046875, 0.12322998046875, 0.17041015625, 0.21759033203125, 0.2647705078125, 0.31195068359375, 0.359130859375, 0.40631103515625, 0.4534912109375, 0.50067138671875, 0.5478515625, 0.59503173828125, 0.6422119140625, 0.68939208984375, 0.736572265625, 0.78375244140625, 0.8309326171875, 0.87811279296875, 0.92529296875, 0.97247314453125, 1.0196533203125, 1.06683349609375, 1.114013671875, 1.16119384765625, 1.2083740234375, 1.25555419921875, 1.302734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 12.0, 15.0, 9.0, 13.0, 22.0, 42.0, 46.0, 73.0, 83.0, 90.0, 101.0, 100.0, 75.0, 87.0, 61.0, 48.0, 36.0, 18.0, 24.0, 16.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.30859375, -6.164947509765625, -6.02130126953125, -5.877655029296875, -5.7340087890625, -5.590362548828125, -5.44671630859375, -5.303070068359375, -5.159423828125, -5.015777587890625, -4.87213134765625, -4.728485107421875, -4.5848388671875, -4.441192626953125, -4.29754638671875, -4.153900146484375, -4.01025390625, -3.866607666015625, -3.72296142578125, -3.579315185546875, -3.4356689453125, -3.292022705078125, -3.14837646484375, -3.004730224609375, -2.861083984375, -2.717437744140625, -2.57379150390625, -2.430145263671875, -2.2864990234375, -2.142852783203125, -1.99920654296875, -1.855560302734375, -1.7119140625, -1.568267822265625, -1.42462158203125, -1.280975341796875, -1.1373291015625, -0.993682861328125, -0.85003662109375, -0.706390380859375, -0.562744140625, -0.419097900390625, -0.27545166015625, -0.131805419921875, 0.0118408203125, 0.155487060546875, 0.29913330078125, 0.442779541015625, 0.58642578125, 0.730072021484375, 0.87371826171875, 1.017364501953125, 1.1610107421875, 1.304656982421875, 1.44830322265625, 1.591949462890625, 1.735595703125, 1.879241943359375, 2.02288818359375, 2.166534423828125, 2.3101806640625, 2.453826904296875, 2.59747314453125, 2.741119384765625, 2.884765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 21.0, 17.0, 40.0, 43.0, 55.0, 86.0, 121.0, 175.0, 236.0, 385.0, 847.0, 2960.0, 38411.0, 749366.0, 242263.0, 10467.0, 1399.0, 529.0, 349.0, 213.0, 145.0, 113.0, 78.0, 66.0, 46.0, 27.0, 24.0, 12.0, 13.0, 8.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.76416015625, -0.7449493408203125, -0.725738525390625, -0.7065277099609375, -0.68731689453125, -0.6681060791015625, -0.648895263671875, -0.6296844482421875, -0.6104736328125, -0.5912628173828125, -0.572052001953125, -0.5528411865234375, -0.53363037109375, -0.5144195556640625, -0.495208740234375, -0.4759979248046875, -0.456787109375, -0.4375762939453125, -0.418365478515625, -0.3991546630859375, -0.37994384765625, -0.3607330322265625, -0.341522216796875, -0.3223114013671875, -0.3031005859375, -0.2838897705078125, -0.264678955078125, -0.2454681396484375, -0.22625732421875, -0.2070465087890625, -0.187835693359375, -0.1686248779296875, -0.1494140625, -0.1302032470703125, -0.110992431640625, -0.0917816162109375, -0.07257080078125, -0.0533599853515625, -0.034149169921875, -0.0149383544921875, 0.0042724609375, 0.0234832763671875, 0.042694091796875, 0.0619049072265625, 0.08111572265625, 0.1003265380859375, 0.119537353515625, 0.1387481689453125, 0.157958984375, 0.1771697998046875, 0.196380615234375, 0.2155914306640625, 0.23480224609375, 0.2540130615234375, 0.273223876953125, 0.2924346923828125, 0.3116455078125, 0.3308563232421875, 0.350067138671875, 0.3692779541015625, 0.38848876953125, 0.4076995849609375, 0.426910400390625, 0.4461212158203125, 0.46533203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 7.0, 7.0, 15.0, 5.0, 14.0, 19.0, 19.0, 21.0, 25.0, 24.0, 27.0, 38.0, 31.0, 32.0, 41.0, 50.0, 45.0, 39.0, 45.0, 42.0, 48.0, 46.0, 43.0, 42.0, 31.0, 35.0, 27.0, 22.0, 16.0, 19.0, 26.0, 12.0, 15.0, 19.0, 8.0, 6.0, 11.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.7421875, -4.60552978515625, -4.4688720703125, -4.33221435546875, -4.195556640625, -4.05889892578125, -3.9222412109375, -3.78558349609375, -3.64892578125, -3.51226806640625, -3.3756103515625, -3.23895263671875, -3.102294921875, -2.96563720703125, -2.8289794921875, -2.69232177734375, -2.5556640625, -2.41900634765625, -2.2823486328125, -2.14569091796875, -2.009033203125, -1.87237548828125, -1.7357177734375, -1.59906005859375, -1.46240234375, -1.32574462890625, -1.1890869140625, -1.05242919921875, -0.915771484375, -0.77911376953125, -0.6424560546875, -0.50579833984375, -0.369140625, -0.23248291015625, -0.0958251953125, 0.04083251953125, 0.177490234375, 0.31414794921875, 0.4508056640625, 0.58746337890625, 0.72412109375, 0.86077880859375, 0.9974365234375, 1.13409423828125, 1.270751953125, 1.40740966796875, 1.5440673828125, 1.68072509765625, 1.8173828125, 1.95404052734375, 2.0906982421875, 2.22735595703125, 2.364013671875, 2.50067138671875, 2.6373291015625, 2.77398681640625, 2.91064453125, 3.04730224609375, 3.1839599609375, 3.32061767578125, 3.457275390625, 3.59393310546875, 3.7305908203125, 3.86724853515625, 4.00390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 6.0, 16.0, 25.0, 23.0, 51.0, 74.0, 101.0, 159.0, 293.0, 471.0, 954.0, 3209.0, 27010.0, 927955.0, 80389.0, 5134.0, 1255.0, 551.0, 285.0, 181.0, 136.0, 84.0, 46.0, 41.0, 21.0, 13.0, 20.0, 6.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.0743112564086914, -0.07116889953613281, -0.06802654266357422, -0.06488418579101562, -0.06174182891845703, -0.05859947204589844, -0.055457115173339844, -0.05231475830078125, -0.049172401428222656, -0.04603004455566406, -0.04288768768310547, -0.039745330810546875, -0.03660297393798828, -0.03346061706542969, -0.030318260192871094, -0.0271759033203125, -0.024033546447753906, -0.020891189575195312, -0.01774883270263672, -0.014606475830078125, -0.011464118957519531, -0.008321762084960938, -0.005179405212402344, -0.00203704833984375, 0.0011053085327148438, 0.0042476654052734375, 0.007390022277832031, 0.010532379150390625, 0.013674736022949219, 0.016817092895507812, 0.019959449768066406, 0.023101806640625, 0.026244163513183594, 0.029386520385742188, 0.03252887725830078, 0.035671234130859375, 0.03881359100341797, 0.04195594787597656, 0.045098304748535156, 0.04824066162109375, 0.051383018493652344, 0.05452537536621094, 0.05766773223876953, 0.060810089111328125, 0.06395244598388672, 0.06709480285644531, 0.0702371597290039, 0.0733795166015625, 0.0765218734741211, 0.07966423034667969, 0.08280658721923828, 0.08594894409179688, 0.08909130096435547, 0.09223365783691406, 0.09537601470947266, 0.09851837158203125, 0.10166072845458984, 0.10480308532714844, 0.10794544219970703, 0.11108779907226562, 0.11423015594482422, 0.11737251281738281, 0.1205148696899414, 0.1236572265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 11.0, 19.0, 17.0, 36.0, 57.0, 46.0, 117.0, 115.0, 122.0, 107.0, 98.0, 80.0, 51.0, 34.0, 23.0, 15.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.758646875619888e-05, -5.5866315960884094e-05, -5.4146163165569305e-05, -5.2426010370254517e-05, -5.070585757493973e-05, -4.898570477962494e-05, -4.726555198431015e-05, -4.554539918899536e-05, -4.382524639368057e-05, -4.2105093598365784e-05, -4.0384940803050995e-05, -3.8664788007736206e-05, -3.694463521242142e-05, -3.522448241710663e-05, -3.350432962179184e-05, -3.178417682647705e-05, -3.0064024031162262e-05, -2.8343871235847473e-05, -2.6623718440532684e-05, -2.4903565645217896e-05, -2.3183412849903107e-05, -2.1463260054588318e-05, -1.974310725927353e-05, -1.802295446395874e-05, -1.630280166864395e-05, -1.4582648873329163e-05, -1.2862496078014374e-05, -1.1142343282699585e-05, -9.422190487384796e-06, -7.702037692070007e-06, -5.9818848967552185e-06, -4.26173210144043e-06, -2.541579306125641e-06, -8.21426510810852e-07, 8.987262845039368e-07, 2.6188790798187256e-06, 4.339031875133514e-06, 6.059184670448303e-06, 7.779337465763092e-06, 9.499490261077881e-06, 1.121964305639267e-05, 1.2939795851707458e-05, 1.4659948647022247e-05, 1.6380101442337036e-05, 1.8100254237651825e-05, 1.9820407032966614e-05, 2.1540559828281403e-05, 2.326071262359619e-05, 2.498086541891098e-05, 2.670101821422577e-05, 2.8421171009540558e-05, 3.0141323804855347e-05, 3.1861476600170135e-05, 3.3581629395484924e-05, 3.530178219079971e-05, 3.70219349861145e-05, 3.874208778142929e-05, 4.046224057674408e-05, 4.218239337205887e-05, 4.390254616737366e-05, 4.5622698962688446e-05, 4.7342851758003235e-05, 4.9063004553318024e-05, 5.078315734863281e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 5.0, 5.0, 8.0, 10.0, 17.0, 19.0, 29.0, 104.0, 293.0, 2497.0, 161262.0, 879322.0, 4323.0, 425.0, 97.0, 51.0, 16.0, 16.0, 9.0, 15.0, 5.0, 4.0, 9.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.37890625, -0.3670997619628906, -0.35529327392578125, -0.3434867858886719, -0.3316802978515625, -0.3198738098144531, -0.30806732177734375, -0.2962608337402344, -0.284454345703125, -0.2726478576660156, -0.26084136962890625, -0.24903488159179688, -0.2372283935546875, -0.22542190551757812, -0.21361541748046875, -0.20180892944335938, -0.19000244140625, -0.17819595336914062, -0.16638946533203125, -0.15458297729492188, -0.1427764892578125, -0.13097000122070312, -0.11916351318359375, -0.10735702514648438, -0.095550537109375, -0.08374404907226562, -0.07193756103515625, -0.060131072998046875, -0.0483245849609375, -0.036518096923828125, -0.02471160888671875, -0.012905120849609375, -0.0010986328125, 0.010707855224609375, 0.02251434326171875, 0.034320831298828125, 0.0461273193359375, 0.057933807373046875, 0.06974029541015625, 0.08154678344726562, 0.093353271484375, 0.10515975952148438, 0.11696624755859375, 0.12877273559570312, 0.1405792236328125, 0.15238571166992188, 0.16419219970703125, 0.17599868774414062, 0.18780517578125, 0.19961166381835938, 0.21141815185546875, 0.22322463989257812, 0.2350311279296875, 0.24683761596679688, 0.25864410400390625, 0.2704505920410156, 0.282257080078125, 0.2940635681152344, 0.30587005615234375, 0.3176765441894531, 0.3294830322265625, 0.3412895202636719, 0.35309600830078125, 0.3649024963378906, 0.376708984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 16.0, 11.0, 27.0, 55.0, 63.0, 120.0, 215.0, 210.0, 105.0, 54.0, 26.0, 25.0, 10.0, 16.0, 6.0, 4.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.027252197265625, -0.026397705078125, -0.025543212890625, -0.024688720703125, -0.023834228515625, -0.022979736328125, -0.022125244140625, -0.021270751953125, -0.020416259765625, -0.019561767578125, -0.018707275390625, -0.017852783203125, -0.016998291015625, -0.016143798828125, -0.015289306640625, -0.014434814453125, -0.013580322265625, -0.012725830078125, -0.011871337890625, -0.011016845703125, -0.010162353515625, -0.009307861328125, -0.008453369140625, -0.007598876953125, -0.006744384765625, -0.005889892578125, -0.005035400390625, -0.004180908203125, -0.003326416015625, -0.002471923828125, -0.001617431640625, -0.000762939453125, 9.1552734375e-05, 0.000946044921875, 0.001800537109375, 0.002655029296875, 0.003509521484375, 0.004364013671875, 0.005218505859375, 0.006072998046875, 0.006927490234375, 0.007781982421875, 0.008636474609375, 0.009490966796875, 0.010345458984375, 0.011199951171875, 0.012054443359375, 0.012908935546875, 0.013763427734375, 0.014617919921875, 0.015472412109375, 0.016326904296875, 0.017181396484375, 0.018035888671875, 0.018890380859375, 0.019744873046875, 0.020599365234375, 0.021453857421875, 0.022308349609375, 0.023162841796875, 0.024017333984375, 0.024871826171875, 0.025726318359375, 0.026580810546875, 0.027435302734375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 9.0, 11.0, 16.0, 43.0, 170.0, 341.0, 253.0, 90.0, 37.0, 19.0, 10.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.284192085266113, -10.916738510131836, -10.549283981323242, -10.181829452514648, -9.814375877380371, -9.446922302246094, -9.0794677734375, -8.712013244628906, -8.344559669494629, -7.977105617523193, -7.609651565551758, -7.242197513580322, -6.874743461608887, -6.507289409637451, -6.139835357666016, -5.77238130569458, -5.4049272537231445, -5.037473201751709, -4.670019149780273, -4.302565097808838, -3.9351110458374023, -3.567656993865967, -3.2002029418945312, -2.8327488899230957, -2.46529483795166, -2.0978407859802246, -1.730386734008789, -1.3629326820373535, -0.995478630065918, -0.6280245780944824, -0.2605705261230469, 0.10688352584838867, 0.4743385314941406, 0.8417925834655762, 1.2092466354370117, 1.5767006874084473, 1.9441547393798828, 2.3116087913513184, 2.679062843322754, 3.0465168952941895, 3.413970947265625, 3.7814249992370605, 4.148879051208496, 4.516333103179932, 4.883787155151367, 5.251241207122803, 5.618695259094238, 5.986149311065674, 6.353603363037109, 6.721057415008545, 7.0885114669799805, 7.455965518951416, 7.823419570922852, 8.190874099731445, 8.558327674865723, 8.92578125, 9.293235778808594, 9.660690307617188, 10.028143882751465, 10.395597457885742, 10.763051986694336, 11.13050651550293, 11.497960090637207, 11.865413665771484, 12.232868194580078]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 7.0, 9.0, 8.0, 10.0, 13.0, 30.0, 46.0, 53.0, 88.0, 89.0, 88.0, 97.0, 108.0, 88.0, 70.0, 57.0, 41.0, 27.0, 23.0, 17.0, 14.0, 8.0, 2.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.077759742736816, -5.9345526695251465, -5.791345596313477, -5.648138046264648, -5.5049309730529785, -5.361723899841309, -5.2185163497924805, -5.0753092765808105, -4.932102203369141, -4.788895130157471, -4.645688056945801, -4.502480506896973, -4.359273433685303, -4.216066360473633, -4.072858810424805, -3.9296517372131348, -3.786444664001465, -3.643237590789795, -3.500030279159546, -3.356822967529297, -3.213615894317627, -3.070408821105957, -2.927201509475708, -2.783994197845459, -2.640787124633789, -2.497580051422119, -2.35437273979187, -2.211165428161621, -2.067958354949951, -1.9247511625289917, -1.7815439701080322, -1.6383367776870728, -1.4951298236846924, -1.351922631263733, -1.2087154388427734, -1.065508246421814, -0.9223010540008545, -0.779093861579895, -0.6358866691589355, -0.4926794767379761, -0.3494722843170166, -0.20626509189605713, -0.06305789947509766, 0.08014929294586182, 0.2233564853668213, 0.36656367778778076, 0.5097708702087402, 0.6529780626296997, 0.7961852550506592, 0.9393924474716187, 1.0825996398925781, 1.2258068323135376, 1.369014024734497, 1.5122212171554565, 1.655428409576416, 1.7986356019973755, 1.941842794418335, 2.085050106048584, 2.228257179260254, 2.371464252471924, 2.514671564102173, 2.657878875732422, 2.801085948944092, 2.9442930221557617, 3.0875003337860107]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 10.0, 11.0, 9.0, 26.0, 34.0, 43.0, 87.0, 191.0, 395.0, 844.0, 1998.0, 5573.0, 17582.0, 72958.0, 611438.0, 277180.0, 42254.0, 11428.0, 3780.0, 1436.0, 626.0, 290.0, 143.0, 80.0, 54.0, 43.0, 11.0, 17.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.04296875, -3.950714111328125, -3.85845947265625, -3.766204833984375, -3.6739501953125, -3.581695556640625, -3.48944091796875, -3.397186279296875, -3.304931640625, -3.212677001953125, -3.12042236328125, -3.028167724609375, -2.9359130859375, -2.843658447265625, -2.75140380859375, -2.659149169921875, -2.56689453125, -2.474639892578125, -2.38238525390625, -2.290130615234375, -2.1978759765625, -2.105621337890625, -2.01336669921875, -1.921112060546875, -1.828857421875, -1.736602783203125, -1.64434814453125, -1.552093505859375, -1.4598388671875, -1.367584228515625, -1.27532958984375, -1.183074951171875, -1.0908203125, -0.998565673828125, -0.90631103515625, -0.814056396484375, -0.7218017578125, -0.629547119140625, -0.53729248046875, -0.445037841796875, -0.352783203125, -0.260528564453125, -0.16827392578125, -0.076019287109375, 0.0162353515625, 0.108489990234375, 0.20074462890625, 0.292999267578125, 0.38525390625, 0.477508544921875, 0.56976318359375, 0.662017822265625, 0.7542724609375, 0.846527099609375, 0.93878173828125, 1.031036376953125, 1.123291015625, 1.215545654296875, 1.30780029296875, 1.400054931640625, 1.4923095703125, 1.584564208984375, 1.67681884765625, 1.769073486328125, 1.861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 2.0, 9.0, 7.0, 12.0, 17.0, 23.0, 23.0, 40.0, 37.0, 59.0, 56.0, 74.0, 78.0, 90.0, 98.0, 86.0, 56.0, 48.0, 44.0, 33.0, 20.0, 26.0, 13.0, 15.0, 14.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.1201171875, -9.857421875, -9.5947265625, -9.33203125, -9.0693359375, -8.806640625, -8.5439453125, -8.28125, -8.0185546875, -7.755859375, -7.4931640625, -7.23046875, -6.9677734375, -6.705078125, -6.4423828125, -6.1796875, -5.9169921875, -5.654296875, -5.3916015625, -5.12890625, -4.8662109375, -4.603515625, -4.3408203125, -4.078125, -3.8154296875, -3.552734375, -3.2900390625, -3.02734375, -2.7646484375, -2.501953125, -2.2392578125, -1.9765625, -1.7138671875, -1.451171875, -1.1884765625, -0.92578125, -0.6630859375, -0.400390625, -0.1376953125, 0.125, 0.3876953125, 0.650390625, 0.9130859375, 1.17578125, 1.4384765625, 1.701171875, 1.9638671875, 2.2265625, 2.4892578125, 2.751953125, 3.0146484375, 3.27734375, 3.5400390625, 3.802734375, 4.0654296875, 4.328125, 4.5908203125, 4.853515625, 5.1162109375, 5.37890625, 5.6416015625, 5.904296875, 6.1669921875, 6.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 16.0, 12.0, 14.0, 23.0, 27.0, 28.0, 39.0, 37.0, 41.0, 57.0, 60.0, 123.0, 802.0, 1041586.0, 5104.0, 178.0, 71.0, 51.0, 48.0, 46.0, 39.0, 26.0, 26.0, 23.0, 17.0, 10.0, 6.0, 12.0, 2.0, 3.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-26.890625, -26.176513671875, -25.46240234375, -24.748291015625, -24.0341796875, -23.320068359375, -22.60595703125, -21.891845703125, -21.177734375, -20.463623046875, -19.74951171875, -19.035400390625, -18.3212890625, -17.607177734375, -16.89306640625, -16.178955078125, -15.46484375, -14.750732421875, -14.03662109375, -13.322509765625, -12.6083984375, -11.894287109375, -11.18017578125, -10.466064453125, -9.751953125, -9.037841796875, -8.32373046875, -7.609619140625, -6.8955078125, -6.181396484375, -5.46728515625, -4.753173828125, -4.0390625, -3.324951171875, -2.61083984375, -1.896728515625, -1.1826171875, -0.468505859375, 0.24560546875, 0.959716796875, 1.673828125, 2.387939453125, 3.10205078125, 3.816162109375, 4.5302734375, 5.244384765625, 5.95849609375, 6.672607421875, 7.38671875, 8.100830078125, 8.81494140625, 9.529052734375, 10.2431640625, 10.957275390625, 11.67138671875, 12.385498046875, 13.099609375, 13.813720703125, 14.52783203125, 15.241943359375, 15.9560546875, 16.670166015625, 17.38427734375, 18.098388671875, 18.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 1.0, 1.0, 4.0, 9.0, 12.0, 9.0, 20.0, 21.0, 26.0, 28.0, 45.0, 41.0, 34.0, 47.0, 46.0, 46.0, 54.0, 62.0, 81.0, 49.0, 40.0, 47.0, 50.0, 42.0, 40.0, 25.0, 25.0, 19.0, 24.0, 12.0, 6.0, 12.0, 2.0, 2.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-9.40625, -9.15631103515625, -8.9063720703125, -8.65643310546875, -8.406494140625, -8.15655517578125, -7.9066162109375, -7.65667724609375, -7.40673828125, -7.15679931640625, -6.9068603515625, -6.65692138671875, -6.406982421875, -6.15704345703125, -5.9071044921875, -5.65716552734375, -5.4072265625, -5.15728759765625, -4.9073486328125, -4.65740966796875, -4.407470703125, -4.15753173828125, -3.9075927734375, -3.65765380859375, -3.40771484375, -3.15777587890625, -2.9078369140625, -2.65789794921875, -2.407958984375, -2.15802001953125, -1.9080810546875, -1.65814208984375, -1.408203125, -1.15826416015625, -0.9083251953125, -0.65838623046875, -0.408447265625, -0.15850830078125, 0.0914306640625, 0.34136962890625, 0.59130859375, 0.84124755859375, 1.0911865234375, 1.34112548828125, 1.591064453125, 1.84100341796875, 2.0909423828125, 2.34088134765625, 2.5908203125, 2.84075927734375, 3.0906982421875, 3.34063720703125, 3.590576171875, 3.84051513671875, 4.0904541015625, 4.34039306640625, 4.59033203125, 4.84027099609375, 5.0902099609375, 5.34014892578125, 5.590087890625, 5.84002685546875, 6.0899658203125, 6.33990478515625, 6.58984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 11.0, 27.0, 33.0, 59.0, 87.0, 205.0, 515.0, 1666.0, 9945.0, 179509.0, 832659.0, 19996.0, 2645.0, 678.0, 243.0, 120.0, 50.0, 35.0, 22.0, 7.0, 7.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53515625, -1.478607177734375, -1.42205810546875, -1.365509033203125, -1.3089599609375, -1.252410888671875, -1.19586181640625, -1.139312744140625, -1.082763671875, -1.026214599609375, -0.96966552734375, -0.913116455078125, -0.8565673828125, -0.800018310546875, -0.74346923828125, -0.686920166015625, -0.63037109375, -0.573822021484375, -0.51727294921875, -0.460723876953125, -0.4041748046875, -0.347625732421875, -0.29107666015625, -0.234527587890625, -0.177978515625, -0.121429443359375, -0.06488037109375, -0.008331298828125, 0.0482177734375, 0.104766845703125, 0.16131591796875, 0.217864990234375, 0.2744140625, 0.330963134765625, 0.38751220703125, 0.444061279296875, 0.5006103515625, 0.557159423828125, 0.61370849609375, 0.670257568359375, 0.726806640625, 0.783355712890625, 0.83990478515625, 0.896453857421875, 0.9530029296875, 1.009552001953125, 1.06610107421875, 1.122650146484375, 1.17919921875, 1.235748291015625, 1.29229736328125, 1.348846435546875, 1.4053955078125, 1.461944580078125, 1.51849365234375, 1.575042724609375, 1.631591796875, 1.688140869140625, 1.74468994140625, 1.801239013671875, 1.8577880859375, 1.914337158203125, 1.97088623046875, 2.027435302734375, 2.083984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 9.0, 7.0, 8.0, 14.0, 14.0, 21.0, 29.0, 46.0, 54.0, 78.0, 124.0, 197.0, 110.0, 72.0, 61.0, 33.0, 23.0, 19.0, 10.0, 10.0, 6.0, 6.0, 2.0, 11.0, 3.0, 0.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001074671745300293, -0.00010381732136011124, -0.00010016746819019318, -9.651761502027512e-05, -9.286776185035706e-05, -8.9217908680439e-05, -8.556805551052094e-05, -8.191820234060287e-05, -7.826834917068481e-05, -7.461849600076675e-05, -7.09686428308487e-05, -6.731878966093063e-05, -6.366893649101257e-05, -6.001908332109451e-05, -5.636923015117645e-05, -5.271937698125839e-05, -4.906952381134033e-05, -4.541967064142227e-05, -4.176981747150421e-05, -3.811996430158615e-05, -3.447011113166809e-05, -3.082025796175003e-05, -2.717040479183197e-05, -2.352055162191391e-05, -1.987069845199585e-05, -1.622084528207779e-05, -1.2570992112159729e-05, -8.921138942241669e-06, -5.271285772323608e-06, -1.621432602405548e-06, 2.028420567512512e-06, 5.6782737374305725e-06, 9.328126907348633e-06, 1.2977980077266693e-05, 1.6627833247184753e-05, 2.0277686417102814e-05, 2.3927539587020874e-05, 2.7577392756938934e-05, 3.1227245926856995e-05, 3.4877099096775055e-05, 3.8526952266693115e-05, 4.2176805436611176e-05, 4.5826658606529236e-05, 4.9476511776447296e-05, 5.3126364946365356e-05, 5.677621811628342e-05, 6.042607128620148e-05, 6.407592445611954e-05, 6.77257776260376e-05, 7.137563079595566e-05, 7.502548396587372e-05, 7.867533713579178e-05, 8.232519030570984e-05, 8.59750434756279e-05, 8.962489664554596e-05, 9.327474981546402e-05, 9.692460298538208e-05, 0.00010057445615530014, 0.0001042243093252182, 0.00010787416249513626, 0.00011152401566505432, 0.00011517386883497238, 0.00011882372200489044, 0.0001224735751748085, 0.00012612342834472656]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 2.0, 10.0, 11.0, 5.0, 13.0, 20.0, 27.0, 36.0, 77.0, 128.0, 246.0, 382.0, 923.0, 2402.0, 8768.0, 45402.0, 746191.0, 209472.0, 25586.0, 5583.0, 1755.0, 680.0, 334.0, 171.0, 107.0, 57.0, 51.0, 22.0, 18.0, 19.0, 8.0, 13.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.33203125, -1.2958755493164062, -1.2597198486328125, -1.2235641479492188, -1.187408447265625, -1.1512527465820312, -1.1150970458984375, -1.0789413452148438, -1.04278564453125, -1.0066299438476562, -0.9704742431640625, -0.9343185424804688, -0.898162841796875, -0.8620071411132812, -0.8258514404296875, -0.7896957397460938, -0.7535400390625, -0.7173843383789062, -0.6812286376953125, -0.6450729370117188, -0.608917236328125, -0.5727615356445312, -0.5366058349609375, -0.5004501342773438, -0.46429443359375, -0.42813873291015625, -0.3919830322265625, -0.35582733154296875, -0.319671630859375, -0.28351593017578125, -0.2473602294921875, -0.21120452880859375, -0.175048828125, -0.13889312744140625, -0.1027374267578125, -0.06658172607421875, -0.030426025390625, 0.00572967529296875, 0.0418853759765625, 0.07804107666015625, 0.11419677734375, 0.15035247802734375, 0.1865081787109375, 0.22266387939453125, 0.258819580078125, 0.29497528076171875, 0.3311309814453125, 0.36728668212890625, 0.4034423828125, 0.43959808349609375, 0.4757537841796875, 0.5119094848632812, 0.548065185546875, 0.5842208862304688, 0.6203765869140625, 0.6565322875976562, 0.69268798828125, 0.7288436889648438, 0.7649993896484375, 0.8011550903320312, 0.837310791015625, 0.8734664916992188, 0.9096221923828125, 0.9457778930664062, 0.98193359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 10.0, 8.0, 17.0, 10.0, 11.0, 21.0, 32.0, 27.0, 27.0, 43.0, 86.0, 258.0, 131.0, 56.0, 40.0, 39.0, 31.0, 25.0, 19.0, 25.0, 12.0, 7.0, 8.0, 6.0, 5.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2874259948730469, -0.27773284912109375, -0.2680397033691406, -0.2583465576171875, -0.24865341186523438, -0.23896026611328125, -0.22926712036132812, -0.219573974609375, -0.20988082885742188, -0.20018768310546875, -0.19049453735351562, -0.1808013916015625, -0.17110824584960938, -0.16141510009765625, -0.15172195434570312, -0.14202880859375, -0.13233566284179688, -0.12264251708984375, -0.11294937133789062, -0.1032562255859375, -0.09356307983398438, -0.08386993408203125, -0.07417678833007812, -0.064483642578125, -0.054790496826171875, -0.04509735107421875, -0.035404205322265625, -0.0257110595703125, -0.016017913818359375, -0.00632476806640625, 0.003368377685546875, 0.0130615234375, 0.022754669189453125, 0.03244781494140625, 0.042140960693359375, 0.0518341064453125, 0.061527252197265625, 0.07122039794921875, 0.08091354370117188, 0.090606689453125, 0.10029983520507812, 0.10999298095703125, 0.11968612670898438, 0.1293792724609375, 0.13907241821289062, 0.14876556396484375, 0.15845870971679688, 0.16815185546875, 0.17784500122070312, 0.18753814697265625, 0.19723129272460938, 0.2069244384765625, 0.21661758422851562, 0.22631072998046875, 0.23600387573242188, 0.245697021484375, 0.2553901672363281, 0.26508331298828125, 0.2747764587402344, 0.2844696044921875, 0.2941627502441406, 0.30385589599609375, 0.3135490417480469, 0.3232421875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 10.0, 30.0, 272.0, 561.0, 109.0, 22.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.65773010253906, -73.20014190673828, -71.74256134033203, -70.28497314453125, -68.82738494873047, -67.36979675292969, -65.91221618652344, -64.45462799072266, -62.997039794921875, -61.53945541381836, -60.08186721801758, -58.62428283691406, -57.16669464111328, -55.709110260009766, -54.25152587890625, -52.79393768310547, -51.33635330200195, -49.87876892089844, -48.421180725097656, -46.96359634399414, -45.50600814819336, -44.048423767089844, -42.59083557128906, -41.13325119018555, -39.67566680908203, -38.218082427978516, -36.760494232177734, -35.30290985107422, -33.84532165527344, -32.38773727416992, -30.930150985717773, -29.472564697265625, -28.014978408813477, -26.557392120361328, -25.09980583190918, -23.64221954345703, -22.184635162353516, -20.727046966552734, -19.26946258544922, -17.81187629699707, -16.354290008544922, -14.896703720092773, -13.439117431640625, -11.981532096862793, -10.523945808410645, -9.066359519958496, -7.608774185180664, -6.151187896728516, -4.693601608276367, -3.236015558242798, -1.7784295082092285, -0.3208436965942383, 1.1367425918579102, 2.5943288803100586, 4.051914215087891, 5.509500503540039, 6.9670867919921875, 8.424673080444336, 9.882259368896484, 11.339844703674316, 12.797430992126465, 14.255017280578613, 15.712602615356445, 17.170188903808594, 18.627775192260742]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 5.0, 3.0, 11.0, 10.0, 15.0, 17.0, 16.0, 18.0, 32.0, 23.0, 23.0, 30.0, 27.0, 36.0, 37.0, 37.0, 41.0, 29.0, 28.0, 42.0, 41.0, 40.0, 44.0, 36.0, 36.0, 27.0, 33.0, 35.0, 33.0, 23.0, 21.0, 20.0, 17.0, 15.0, 14.0, 12.0, 8.0, 10.0, 6.0, 9.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.958179473876953, -9.668221473693848, -9.378263473510742, -9.088306427001953, -8.798348426818848, -8.508390426635742, -8.218432426452637, -7.9284749031066895, -7.638517379760742, -7.348559379577637, -7.0586018562316895, -6.768643856048584, -6.478686332702637, -6.188728332519531, -5.898770332336426, -5.6088128089904785, -5.318854808807373, -5.028896808624268, -4.73893928527832, -4.448981285095215, -4.159023761749268, -3.869065761566162, -3.5791079998016357, -3.2891502380371094, -2.999192476272583, -2.7092347145080566, -2.4192769527435303, -2.129319190979004, -1.839361310005188, -1.5494035482406616, -1.2594456672668457, -0.9694879055023193, -0.679530143737793, -0.3895723521709442, -0.09961456060409546, 0.19034326076507568, 0.48030102252960205, 0.7702587842941284, 1.0602166652679443, 1.3501744270324707, 1.640132188796997, 1.9300899505615234, 2.22004771232605, 2.510005474090576, 2.7999634742736816, 3.089920997619629, 3.3798789978027344, 3.6698367595672607, 3.959794521331787, 4.249752521514893, 4.53971004486084, 4.829668045043945, 5.119625568389893, 5.409583568572998, 5.699541091918945, 5.989499092102051, 6.279457092285156, 6.569415092468262, 6.859372615814209, 7.1493306159973145, 7.439288139343262, 7.729246139526367, 8.019204139709473, 8.309162139892578, 8.599119186401367]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 6.0, 6.0, 9.0, 20.0, 20.0, 24.0, 33.0, 57.0, 81.0, 121.0, 177.0, 352.0, 760.0, 1709.0, 5195.0, 19824.0, 134807.0, 3394674.0, 573729.0, 47341.0, 9940.0, 3078.0, 1181.0, 490.0, 213.0, 110.0, 87.0, 62.0, 36.0, 29.0, 22.0, 15.0, 13.0, 11.0, 6.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.875, -6.6771240234375, -6.479248046875, -6.2813720703125, -6.08349609375, -5.8856201171875, -5.687744140625, -5.4898681640625, -5.2919921875, -5.0941162109375, -4.896240234375, -4.6983642578125, -4.50048828125, -4.3026123046875, -4.104736328125, -3.9068603515625, -3.708984375, -3.5111083984375, -3.313232421875, -3.1153564453125, -2.91748046875, -2.7196044921875, -2.521728515625, -2.3238525390625, -2.1259765625, -1.9281005859375, -1.730224609375, -1.5323486328125, -1.33447265625, -1.1365966796875, -0.938720703125, -0.7408447265625, -0.54296875, -0.3450927734375, -0.147216796875, 0.0506591796875, 0.24853515625, 0.4464111328125, 0.644287109375, 0.8421630859375, 1.0400390625, 1.2379150390625, 1.435791015625, 1.6336669921875, 1.83154296875, 2.0294189453125, 2.227294921875, 2.4251708984375, 2.623046875, 2.8209228515625, 3.018798828125, 3.2166748046875, 3.41455078125, 3.6124267578125, 3.810302734375, 4.0081787109375, 4.2060546875, 4.4039306640625, 4.601806640625, 4.7996826171875, 4.99755859375, 5.1954345703125, 5.393310546875, 5.5911865234375, 5.7890625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 15.0, 20.0, 28.0, 36.0, 69.0, 89.0, 108.0, 86.0, 110.0, 107.0, 85.0, 89.0, 34.0, 35.0, 20.0, 17.0, 10.0, 7.0, 5.0, 2.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.02734375, -6.860626220703125, -6.69390869140625, -6.527191162109375, -6.3604736328125, -6.193756103515625, -6.02703857421875, -5.860321044921875, -5.693603515625, -5.526885986328125, -5.36016845703125, -5.193450927734375, -5.0267333984375, -4.860015869140625, -4.69329833984375, -4.526580810546875, -4.35986328125, -4.193145751953125, -4.02642822265625, -3.859710693359375, -3.6929931640625, -3.526275634765625, -3.35955810546875, -3.192840576171875, -3.026123046875, -2.859405517578125, -2.69268798828125, -2.525970458984375, -2.3592529296875, -2.192535400390625, -2.02581787109375, -1.859100341796875, -1.6923828125, -1.525665283203125, -1.35894775390625, -1.192230224609375, -1.0255126953125, -0.858795166015625, -0.69207763671875, -0.525360107421875, -0.358642578125, -0.191925048828125, -0.02520751953125, 0.141510009765625, 0.3082275390625, 0.474945068359375, 0.64166259765625, 0.808380126953125, 0.97509765625, 1.141815185546875, 1.30853271484375, 1.475250244140625, 1.6419677734375, 1.808685302734375, 1.97540283203125, 2.142120361328125, 2.308837890625, 2.475555419921875, 2.64227294921875, 2.808990478515625, 2.9757080078125, 3.142425537109375, 3.30914306640625, 3.475860595703125, 3.642578125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 26.0, 38.0, 70.0, 214.0, 1390.0, 572027.0, 3618297.0, 1784.0, 260.0, 101.0, 26.0, 18.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.90625, -39.07568359375, -38.2451171875, -37.41455078125, -36.583984375, -35.75341796875, -34.9228515625, -34.09228515625, -33.26171875, -32.43115234375, -31.6005859375, -30.77001953125, -29.939453125, -29.10888671875, -28.2783203125, -27.44775390625, -26.6171875, -25.78662109375, -24.9560546875, -24.12548828125, -23.294921875, -22.46435546875, -21.6337890625, -20.80322265625, -19.97265625, -19.14208984375, -18.3115234375, -17.48095703125, -16.650390625, -15.81982421875, -14.9892578125, -14.15869140625, -13.328125, -12.49755859375, -11.6669921875, -10.83642578125, -10.005859375, -9.17529296875, -8.3447265625, -7.51416015625, -6.68359375, -5.85302734375, -5.0224609375, -4.19189453125, -3.361328125, -2.53076171875, -1.7001953125, -0.86962890625, -0.0390625, 0.79150390625, 1.6220703125, 2.45263671875, 3.283203125, 4.11376953125, 4.9443359375, 5.77490234375, 6.60546875, 7.43603515625, 8.2666015625, 9.09716796875, 9.927734375, 10.75830078125, 11.5888671875, 12.41943359375, 13.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 11.0, 2.0, 8.0, 8.0, 12.0, 16.0, 20.0, 35.0, 33.0, 41.0, 54.0, 76.0, 84.0, 156.0, 204.0, 376.0, 787.0, 874.0, 411.0, 241.0, 201.0, 96.0, 83.0, 64.0, 54.0, 32.0, 23.0, 17.0, 14.0, 6.0, 5.0, 4.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1403121948242188, -1.1077728271484375, -1.0752334594726562, -1.042694091796875, -1.0101547241210938, -0.9776153564453125, -0.9450759887695312, -0.91253662109375, -0.8799972534179688, -0.8474578857421875, -0.8149185180664062, -0.782379150390625, -0.7498397827148438, -0.7173004150390625, -0.6847610473632812, -0.6522216796875, -0.6196823120117188, -0.5871429443359375, -0.5546035766601562, -0.522064208984375, -0.48952484130859375, -0.4569854736328125, -0.42444610595703125, -0.39190673828125, -0.35936737060546875, -0.3268280029296875, -0.29428863525390625, -0.261749267578125, -0.22920989990234375, -0.1966705322265625, -0.16413116455078125, -0.131591796875, -0.09905242919921875, -0.0665130615234375, -0.03397369384765625, -0.001434326171875, 0.03110504150390625, 0.0636444091796875, 0.09618377685546875, 0.12872314453125, 0.16126251220703125, 0.1938018798828125, 0.22634124755859375, 0.258880615234375, 0.29141998291015625, 0.3239593505859375, 0.35649871826171875, 0.3890380859375, 0.42157745361328125, 0.4541168212890625, 0.48665618896484375, 0.519195556640625, 0.5517349243164062, 0.5842742919921875, 0.6168136596679688, 0.64935302734375, 0.6818923950195312, 0.7144317626953125, 0.7469711303710938, 0.779510498046875, 0.8120498657226562, 0.8445892333984375, 0.8771286010742188, 0.90966796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 6.0, 2.0, 5.0, 9.0, 23.0, 33.0, 69.0, 109.0, 204.0, 222.0, 152.0, 74.0, 36.0, 21.0, 13.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.142258644104004, -8.839942932128906, -8.537628173828125, -8.235312461853027, -7.932997226715088, -7.630681991577148, -7.328366279602051, -7.026051044464111, -6.723735809326172, -6.421420574188232, -6.119105339050293, -5.816789627075195, -5.514474391937256, -5.212159156799316, -4.909843444824219, -4.607528209686279, -4.30521297454834, -4.0028977394104, -3.700582265853882, -3.3982667922973633, -3.095951557159424, -2.7936363220214844, -2.491320848464966, -2.1890053749084473, -1.8866901397705078, -1.5843747854232788, -1.2820594310760498, -0.9797440767288208, -0.6774287223815918, -0.3751133680343628, -0.07279801368713379, 0.22951745986938477, 0.5318336486816406, 0.8341490030288696, 1.1364643573760986, 1.4387797117233276, 1.7410950660705566, 2.043410301208496, 2.3457257747650146, 2.648041248321533, 2.9503564834594727, 3.252671718597412, 3.5549871921539307, 3.857302665710449, 4.159617900848389, 4.461933135986328, 4.764248847961426, 5.066564083099365, 5.368879318237305, 5.671194553375244, 5.973509788513184, 6.275825500488281, 6.578140735626221, 6.88045597076416, 7.182771682739258, 7.485086917877197, 7.787402153015137, 8.089717864990234, 8.392032623291016, 8.694348335266113, 8.996664047241211, 9.298978805541992, 9.60129451751709, 9.903610229492188, 10.205924987792969]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 15.0, 15.0, 27.0, 31.0, 38.0, 63.0, 95.0, 105.0, 103.0, 92.0, 93.0, 88.0, 69.0, 46.0, 49.0, 26.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.074833393096924, -6.884274482727051, -6.693715572357178, -6.5031561851501465, -6.312597274780273, -6.1220383644104, -5.931479454040527, -5.740920066833496, -5.550361156463623, -5.35980224609375, -5.169243335723877, -4.978683948516846, -4.788125038146973, -4.5975661277771, -4.407007217407227, -4.216447830200195, -4.0258893966674805, -3.8353304862976074, -3.6447713375091553, -3.4542124271392822, -3.26365327835083, -3.073094367980957, -2.882535457611084, -2.691976308822632, -2.5014171600341797, -2.3108582496643066, -2.1202991008758545, -1.9297401905059814, -1.7391810417175293, -1.5486221313476562, -1.3580631017684937, -1.167504072189331, -0.9769449234008789, -0.7863858938217163, -0.5958268642425537, -0.4052678942680359, -0.2147088646888733, -0.024149835109710693, 0.16640913486480713, 0.3569681644439697, 0.5475271940231323, 0.7380862236022949, 0.9286452531814575, 1.1192042827606201, 1.3097631931304932, 1.5003223419189453, 1.6908812522888184, 1.881440281867981, 2.0719993114471436, 2.2625582218170166, 2.4531173706054688, 2.643676280975342, 2.834235429763794, 3.024794340133667, 3.215353488922119, 3.405912399291992, 3.5964713096618652, 3.7870302200317383, 3.9775893688201904, 4.168148517608643, 4.358707427978516, 4.549266338348389, 4.739825248718262, 4.930384635925293, 5.120943546295166]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 16.0, 23.0, 40.0, 78.0, 194.0, 541.0, 1771.0, 15990.0, 1006834.0, 20107.0, 2002.0, 527.0, 196.0, 96.0, 48.0, 22.0, 18.0, 14.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.453125, -1.396209716796875, -1.33929443359375, -1.282379150390625, -1.2254638671875, -1.168548583984375, -1.11163330078125, -1.054718017578125, -0.997802734375, -0.940887451171875, -0.88397216796875, -0.827056884765625, -0.7701416015625, -0.713226318359375, -0.65631103515625, -0.599395751953125, -0.54248046875, -0.485565185546875, -0.42864990234375, -0.371734619140625, -0.3148193359375, -0.257904052734375, -0.20098876953125, -0.144073486328125, -0.087158203125, -0.030242919921875, 0.02667236328125, 0.083587646484375, 0.1405029296875, 0.197418212890625, 0.25433349609375, 0.311248779296875, 0.3681640625, 0.425079345703125, 0.48199462890625, 0.538909912109375, 0.5958251953125, 0.652740478515625, 0.70965576171875, 0.766571044921875, 0.823486328125, 0.880401611328125, 0.93731689453125, 0.994232177734375, 1.0511474609375, 1.108062744140625, 1.16497802734375, 1.221893310546875, 1.27880859375, 1.335723876953125, 1.39263916015625, 1.449554443359375, 1.5064697265625, 1.563385009765625, 1.62030029296875, 1.677215576171875, 1.734130859375, 1.791046142578125, 1.84796142578125, 1.904876708984375, 1.9617919921875, 2.018707275390625, 2.07562255859375, 2.132537841796875, 2.189453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 11.0, 11.0, 15.0, 33.0, 42.0, 63.0, 99.0, 126.0, 140.0, 127.0, 99.0, 90.0, 55.0, 31.0, 23.0, 16.0, 7.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.467803955078125, -5.31842041015625, -5.169036865234375, -5.0196533203125, -4.870269775390625, -4.72088623046875, -4.571502685546875, -4.422119140625, -4.272735595703125, -4.12335205078125, -3.973968505859375, -3.8245849609375, -3.675201416015625, -3.52581787109375, -3.376434326171875, -3.22705078125, -3.077667236328125, -2.92828369140625, -2.778900146484375, -2.6295166015625, -2.480133056640625, -2.33074951171875, -2.181365966796875, -2.031982421875, -1.882598876953125, -1.73321533203125, -1.583831787109375, -1.4344482421875, -1.285064697265625, -1.13568115234375, -0.986297607421875, -0.8369140625, -0.687530517578125, -0.53814697265625, -0.388763427734375, -0.2393798828125, -0.089996337890625, 0.05938720703125, 0.208770751953125, 0.358154296875, 0.507537841796875, 0.65692138671875, 0.806304931640625, 0.9556884765625, 1.105072021484375, 1.25445556640625, 1.403839111328125, 1.55322265625, 1.702606201171875, 1.85198974609375, 2.001373291015625, 2.1507568359375, 2.300140380859375, 2.44952392578125, 2.598907470703125, 2.748291015625, 2.897674560546875, 3.04705810546875, 3.196441650390625, 3.3458251953125, 3.495208740234375, 3.64459228515625, 3.793975830078125, 3.943359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 5.0, 5.0, 8.0, 11.0, 18.0, 17.0, 26.0, 37.0, 50.0, 68.0, 72.0, 111.0, 142.0, 193.0, 259.0, 421.0, 879.0, 4023.0, 45402.0, 653801.0, 319543.0, 19284.0, 2157.0, 691.0, 372.0, 241.0, 175.0, 158.0, 98.0, 71.0, 58.0, 37.0, 35.0, 32.0, 19.0, 11.0, 7.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.393798828125, -0.3828086853027344, -0.37181854248046875, -0.3608283996582031, -0.3498382568359375, -0.3388481140136719, -0.32785797119140625, -0.3168678283691406, -0.305877685546875, -0.2948875427246094, -0.28389739990234375, -0.2729072570800781, -0.2619171142578125, -0.2509269714355469, -0.23993682861328125, -0.22894668579101562, -0.21795654296875, -0.20696640014648438, -0.19597625732421875, -0.18498611450195312, -0.1739959716796875, -0.16300582885742188, -0.15201568603515625, -0.14102554321289062, -0.130035400390625, -0.11904525756835938, -0.10805511474609375, -0.09706497192382812, -0.0860748291015625, -0.07508468627929688, -0.06409454345703125, -0.053104400634765625, -0.0421142578125, -0.031124114990234375, -0.02013397216796875, -0.009143829345703125, 0.0018463134765625, 0.012836456298828125, 0.02382659912109375, 0.034816741943359375, 0.045806884765625, 0.056797027587890625, 0.06778717041015625, 0.07877731323242188, 0.0897674560546875, 0.10075759887695312, 0.11174774169921875, 0.12273788452148438, 0.13372802734375, 0.14471817016601562, 0.15570831298828125, 0.16669845581054688, 0.1776885986328125, 0.18867874145507812, 0.19966888427734375, 0.21065902709960938, 0.221649169921875, 0.23263931274414062, 0.24362945556640625, 0.2546195983886719, 0.2656097412109375, 0.2765998840332031, 0.28759002685546875, 0.2985801696777344, 0.3095703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 13.0, 10.0, 11.0, 22.0, 19.0, 22.0, 26.0, 41.0, 33.0, 37.0, 34.0, 47.0, 51.0, 40.0, 46.0, 55.0, 41.0, 46.0, 50.0, 40.0, 46.0, 40.0, 46.0, 18.0, 31.0, 25.0, 20.0, 16.0, 11.0, 17.0, 6.0, 6.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.92578125, -3.8170166015625, -3.708251953125, -3.5994873046875, -3.49072265625, -3.3819580078125, -3.273193359375, -3.1644287109375, -3.0556640625, -2.9468994140625, -2.838134765625, -2.7293701171875, -2.62060546875, -2.5118408203125, -2.403076171875, -2.2943115234375, -2.185546875, -2.0767822265625, -1.968017578125, -1.8592529296875, -1.75048828125, -1.6417236328125, -1.532958984375, -1.4241943359375, -1.3154296875, -1.2066650390625, -1.097900390625, -0.9891357421875, -0.88037109375, -0.7716064453125, -0.662841796875, -0.5540771484375, -0.4453125, -0.3365478515625, -0.227783203125, -0.1190185546875, -0.01025390625, 0.0985107421875, 0.207275390625, 0.3160400390625, 0.4248046875, 0.5335693359375, 0.642333984375, 0.7510986328125, 0.85986328125, 0.9686279296875, 1.077392578125, 1.1861572265625, 1.294921875, 1.4036865234375, 1.512451171875, 1.6212158203125, 1.72998046875, 1.8387451171875, 1.947509765625, 2.0562744140625, 2.1650390625, 2.2738037109375, 2.382568359375, 2.4913330078125, 2.60009765625, 2.7088623046875, 2.817626953125, 2.9263916015625, 3.03515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 19.0, 14.0, 19.0, 39.0, 43.0, 59.0, 90.0, 95.0, 152.0, 192.0, 311.0, 654.0, 1990.0, 15504.0, 847556.0, 172525.0, 6496.0, 1347.0, 463.0, 290.0, 173.0, 129.0, 86.0, 75.0, 50.0, 34.0, 27.0, 22.0, 14.0, 22.0, 8.0, 3.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12922382354736328, -0.12551307678222656, -0.12180233001708984, -0.11809158325195312, -0.1143808364868164, -0.11067008972167969, -0.10695934295654297, -0.10324859619140625, -0.09953784942626953, -0.09582710266113281, -0.0921163558959961, -0.08840560913085938, -0.08469486236572266, -0.08098411560058594, -0.07727336883544922, -0.0735626220703125, -0.06985187530517578, -0.06614112854003906, -0.062430381774902344, -0.058719635009765625, -0.055008888244628906, -0.05129814147949219, -0.04758739471435547, -0.04387664794921875, -0.04016590118408203, -0.03645515441894531, -0.032744407653808594, -0.029033660888671875, -0.025322914123535156, -0.021612167358398438, -0.01790142059326172, -0.014190673828125, -0.010479927062988281, -0.0067691802978515625, -0.0030584335327148438, 0.000652313232421875, 0.004363059997558594, 0.008073806762695312, 0.011784553527832031, 0.01549530029296875, 0.01920604705810547, 0.022916793823242188, 0.026627540588378906, 0.030338287353515625, 0.034049034118652344, 0.03775978088378906, 0.04147052764892578, 0.0451812744140625, 0.04889202117919922, 0.05260276794433594, 0.056313514709472656, 0.060024261474609375, 0.0637350082397461, 0.06744575500488281, 0.07115650177001953, 0.07486724853515625, 0.07857799530029297, 0.08228874206542969, 0.0859994888305664, 0.08971023559570312, 0.09342098236083984, 0.09713172912597656, 0.10084247589111328, 0.10455322265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 14.0, 18.0, 19.0, 45.0, 44.0, 69.0, 83.0, 115.0, 122.0, 114.0, 98.0, 85.0, 57.0, 29.0, 13.0, 21.0, 9.0, 7.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61611557006836e-05, -6.457231938838959e-05, -6.298348307609558e-05, -6.139464676380157e-05, -5.980581045150757e-05, -5.821697413921356e-05, -5.6628137826919556e-05, -5.503930151462555e-05, -5.345046520233154e-05, -5.186162889003754e-05, -5.027279257774353e-05, -4.8683956265449524e-05, -4.709511995315552e-05, -4.550628364086151e-05, -4.3917447328567505e-05, -4.23286110162735e-05, -4.073977470397949e-05, -3.9150938391685486e-05, -3.756210207939148e-05, -3.597326576709747e-05, -3.438442945480347e-05, -3.279559314250946e-05, -3.1206756830215454e-05, -2.9617920517921448e-05, -2.802908420562744e-05, -2.6440247893333435e-05, -2.485141158103943e-05, -2.3262575268745422e-05, -2.1673738956451416e-05, -2.008490264415741e-05, -1.8496066331863403e-05, -1.6907230019569397e-05, -1.531839370727539e-05, -1.3729557394981384e-05, -1.2140721082687378e-05, -1.0551884770393372e-05, -8.963048458099365e-06, -7.374212145805359e-06, -5.7853758335113525e-06, -4.196539521217346e-06, -2.60770320892334e-06, -1.0188668966293335e-06, 5.699694156646729e-07, 2.158805727958679e-06, 3.7476420402526855e-06, 5.336478352546692e-06, 6.925314664840698e-06, 8.514150977134705e-06, 1.0102987289428711e-05, 1.1691823601722717e-05, 1.3280659914016724e-05, 1.486949622631073e-05, 1.6458332538604736e-05, 1.8047168850898743e-05, 1.963600516319275e-05, 2.1224841475486755e-05, 2.2813677787780762e-05, 2.4402514100074768e-05, 2.5991350412368774e-05, 2.758018672466278e-05, 2.9169023036956787e-05, 3.0757859349250793e-05, 3.23466956615448e-05, 3.3935531973838806e-05, 3.552436828613281e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 13.0, 23.0, 46.0, 114.0, 251.0, 739.0, 3012.0, 23061.0, 960526.0, 54588.0, 4502.0, 1020.0, 331.0, 142.0, 69.0, 31.0, 25.0, 18.0, 12.0, 8.0, 6.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21875, -0.21083450317382812, -0.20291900634765625, -0.19500350952148438, -0.1870880126953125, -0.17917251586914062, -0.17125701904296875, -0.16334152221679688, -0.155426025390625, -0.14751052856445312, -0.13959503173828125, -0.13167953491210938, -0.1237640380859375, -0.11584854125976562, -0.10793304443359375, -0.10001754760742188, -0.09210205078125, -0.08418655395507812, -0.07627105712890625, -0.06835556030273438, -0.0604400634765625, -0.052524566650390625, -0.04460906982421875, -0.036693572998046875, -0.028778076171875, -0.020862579345703125, -0.01294708251953125, -0.005031585693359375, 0.0028839111328125, 0.010799407958984375, 0.01871490478515625, 0.026630401611328125, 0.0345458984375, 0.042461395263671875, 0.05037689208984375, 0.058292388916015625, 0.0662078857421875, 0.07412338256835938, 0.08203887939453125, 0.08995437622070312, 0.097869873046875, 0.10578536987304688, 0.11370086669921875, 0.12161636352539062, 0.1295318603515625, 0.13744735717773438, 0.14536285400390625, 0.15327835083007812, 0.16119384765625, 0.16910934448242188, 0.17702484130859375, 0.18494033813476562, 0.1928558349609375, 0.20077133178710938, 0.20868682861328125, 0.21660232543945312, 0.224517822265625, 0.23243331909179688, 0.24034881591796875, 0.24826431274414062, 0.2561798095703125, 0.2640953063964844, 0.27201080322265625, 0.2799263000488281, 0.287841796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 9.0, 11.0, 22.0, 24.0, 31.0, 65.0, 135.0, 213.0, 189.0, 94.0, 46.0, 33.0, 25.0, 15.0, 18.0, 4.0, 12.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014862060546875, -0.014307260513305664, -0.013752460479736328, -0.013197660446166992, -0.012642860412597656, -0.01208806037902832, -0.011533260345458984, -0.010978460311889648, -0.010423660278320312, -0.009868860244750977, -0.00931406021118164, -0.008759260177612305, -0.008204460144042969, -0.007649660110473633, -0.007094860076904297, -0.006540060043334961, -0.005985260009765625, -0.005430459976196289, -0.004875659942626953, -0.004320859909057617, -0.0037660598754882812, -0.0032112598419189453, -0.0026564598083496094, -0.0021016597747802734, -0.0015468597412109375, -0.0009920597076416016, -0.0004372596740722656, 0.00011754035949707031, 0.0006723403930664062, 0.0012271404266357422, 0.0017819404602050781, 0.002336740493774414, 0.00289154052734375, 0.003446340560913086, 0.004001140594482422, 0.004555940628051758, 0.005110740661621094, 0.00566554069519043, 0.006220340728759766, 0.0067751407623291016, 0.0073299407958984375, 0.007884740829467773, 0.00843954086303711, 0.008994340896606445, 0.009549140930175781, 0.010103940963745117, 0.010658740997314453, 0.011213541030883789, 0.011768341064453125, 0.012323141098022461, 0.012877941131591797, 0.013432741165161133, 0.013987541198730469, 0.014542341232299805, 0.01509714126586914, 0.015651941299438477, 0.016206741333007812, 0.01676154136657715, 0.017316341400146484, 0.01787114143371582, 0.018425941467285156, 0.018980741500854492, 0.019535541534423828, 0.020090341567993164, 0.0206451416015625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 29.0, 45.0, 96.0, 223.0, 285.0, 154.0, 70.0, 38.0, 12.0, 13.0, 2.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.319628715515137, -8.090072631835938, -7.86051607131958, -7.630959510803223, -7.401403427124023, -7.171846866607666, -6.942290306091309, -6.712734222412109, -6.483177661895752, -6.2536211013793945, -6.024065017700195, -5.794508457183838, -5.5649518966674805, -5.335395812988281, -5.105839252471924, -4.876282691955566, -4.646726608276367, -4.41717004776001, -4.1876139640808105, -3.958057403564453, -3.728501081466675, -3.4989447593688965, -3.269388198852539, -3.0398318767547607, -2.8102755546569824, -2.580719232559204, -2.351162910461426, -2.1216063499450684, -1.89205002784729, -1.6624937057495117, -1.4329372644424438, -1.203380823135376, -0.9738240242004395, -0.7442676424980164, -0.5147112607955933, -0.28515487909317017, -0.05559849739074707, 0.17395782470703125, 0.4035142660140991, 0.633070707321167, 0.8626270294189453, 1.0921833515167236, 1.3217397928237915, 1.5512962341308594, 1.7808525562286377, 2.010408878326416, 2.2399654388427734, 2.4695217609405518, 2.69907808303833, 2.9286344051361084, 3.1581907272338867, 3.387747287750244, 3.6173036098480225, 3.846859931945801, 4.076416492462158, 4.305973052978516, 4.535529136657715, 4.765085697174072, 4.9946417808532715, 5.224198341369629, 5.453754425048828, 5.6833109855651855, 5.912867546081543, 6.142423629760742, 6.3719801902771]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 22.0, 23.0, 28.0, 48.0, 78.0, 129.0, 127.0, 132.0, 113.0, 99.0, 68.0, 52.0, 33.0, 20.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.416303634643555, -5.270781517028809, -5.1252593994140625, -4.979737281799316, -4.83421516418457, -4.688693046569824, -4.543170928955078, -4.39764928817749, -4.252127170562744, -4.106605052947998, -3.961082935333252, -3.815560817718506, -3.670038938522339, -3.5245168209075928, -3.3789947032928467, -3.2334728240966797, -3.0879504680633545, -2.9424283504486084, -2.7969062328338623, -2.6513843536376953, -2.505862236022949, -2.360340118408203, -2.214818000793457, -2.069295883178711, -1.9237738847732544, -1.7782517671585083, -1.6327297687530518, -1.4872076511383057, -1.3416855335235596, -1.196163535118103, -1.050641417503357, -0.9051194190979004, -0.7595973014831543, -0.614075243473053, -0.4685531556606293, -0.32303106784820557, -0.17750900983810425, -0.03198695182800293, 0.11353516578674316, 0.2590571641921997, 0.4045792818069458, 0.5501013398170471, 0.6956233978271484, 0.8411455154418945, 0.9866675734519958, 1.1321896314620972, 1.2777117490768433, 1.4232337474822998, 1.568755865097046, 1.714277982711792, 1.8597999811172485, 2.005321979522705, 2.150844097137451, 2.2963662147521973, 2.4418883323669434, 2.5874104499816895, 2.7329325675964355, 2.8784546852111816, 3.0239768028259277, 3.169498920440674, 3.315020799636841, 3.460542917251587, 3.606065034866333, 3.7515869140625, 3.897109031677246]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 8.0, 16.0, 22.0, 53.0, 88.0, 162.0, 350.0, 782.0, 2258.0, 6334.0, 25270.0, 146881.0, 690872.0, 141034.0, 24570.0, 6246.0, 2154.0, 793.0, 322.0, 141.0, 82.0, 43.0, 17.0, 20.0, 12.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.51171875, -3.39654541015625, -3.2813720703125, -3.16619873046875, -3.051025390625, -2.93585205078125, -2.8206787109375, -2.70550537109375, -2.59033203125, -2.47515869140625, -2.3599853515625, -2.24481201171875, -2.129638671875, -2.01446533203125, -1.8992919921875, -1.78411865234375, -1.6689453125, -1.55377197265625, -1.4385986328125, -1.32342529296875, -1.208251953125, -1.09307861328125, -0.9779052734375, -0.86273193359375, -0.74755859375, -0.63238525390625, -0.5172119140625, -0.40203857421875, -0.286865234375, -0.17169189453125, -0.0565185546875, 0.05865478515625, 0.173828125, 0.28900146484375, 0.4041748046875, 0.51934814453125, 0.634521484375, 0.74969482421875, 0.8648681640625, 0.98004150390625, 1.09521484375, 1.21038818359375, 1.3255615234375, 1.44073486328125, 1.555908203125, 1.67108154296875, 1.7862548828125, 1.90142822265625, 2.0166015625, 2.13177490234375, 2.2469482421875, 2.36212158203125, 2.477294921875, 2.59246826171875, 2.7076416015625, 2.82281494140625, 2.93798828125, 3.05316162109375, 3.1683349609375, 3.28350830078125, 3.398681640625, 3.51385498046875, 3.6290283203125, 3.74420166015625, 3.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 16.0, 16.0, 28.0, 32.0, 52.0, 71.0, 108.0, 115.0, 96.0, 103.0, 102.0, 80.0, 55.0, 32.0, 35.0, 14.0, 8.0, 9.0, 2.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -8.9964599609375, -8.727294921875, -8.4581298828125, -8.18896484375, -7.9197998046875, -7.650634765625, -7.3814697265625, -7.1123046875, -6.8431396484375, -6.573974609375, -6.3048095703125, -6.03564453125, -5.7664794921875, -5.497314453125, -5.2281494140625, -4.958984375, -4.6898193359375, -4.420654296875, -4.1514892578125, -3.88232421875, -3.6131591796875, -3.343994140625, -3.0748291015625, -2.8056640625, -2.5364990234375, -2.267333984375, -1.9981689453125, -1.72900390625, -1.4598388671875, -1.190673828125, -0.9215087890625, -0.65234375, -0.3831787109375, -0.114013671875, 0.1551513671875, 0.42431640625, 0.6934814453125, 0.962646484375, 1.2318115234375, 1.5009765625, 1.7701416015625, 2.039306640625, 2.3084716796875, 2.57763671875, 2.8468017578125, 3.115966796875, 3.3851318359375, 3.654296875, 3.9234619140625, 4.192626953125, 4.4617919921875, 4.73095703125, 5.0001220703125, 5.269287109375, 5.5384521484375, 5.8076171875, 6.0767822265625, 6.345947265625, 6.6151123046875, 6.88427734375, 7.1534423828125, 7.422607421875, 7.6917724609375, 7.9609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 11.0, 13.0, 19.0, 14.0, 18.0, 23.0, 29.0, 32.0, 24.0, 23.0, 43.0, 46.0, 67.0, 212.0, 3767.0, 1012381.0, 30751.0, 572.0, 116.0, 58.0, 43.0, 36.0, 36.0, 29.0, 25.0, 32.0, 18.0, 14.0, 18.0, 12.0, 12.0, 6.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.125, -14.7012939453125, -14.277587890625, -13.8538818359375, -13.43017578125, -13.0064697265625, -12.582763671875, -12.1590576171875, -11.7353515625, -11.3116455078125, -10.887939453125, -10.4642333984375, -10.04052734375, -9.6168212890625, -9.193115234375, -8.7694091796875, -8.345703125, -7.9219970703125, -7.498291015625, -7.0745849609375, -6.65087890625, -6.2271728515625, -5.803466796875, -5.3797607421875, -4.9560546875, -4.5323486328125, -4.108642578125, -3.6849365234375, -3.26123046875, -2.8375244140625, -2.413818359375, -1.9901123046875, -1.56640625, -1.1427001953125, -0.718994140625, -0.2952880859375, 0.12841796875, 0.5521240234375, 0.975830078125, 1.3995361328125, 1.8232421875, 2.2469482421875, 2.670654296875, 3.0943603515625, 3.51806640625, 3.9417724609375, 4.365478515625, 4.7891845703125, 5.212890625, 5.6365966796875, 6.060302734375, 6.4840087890625, 6.90771484375, 7.3314208984375, 7.755126953125, 8.1788330078125, 8.6025390625, 9.0262451171875, 9.449951171875, 9.8736572265625, 10.29736328125, 10.7210693359375, 11.144775390625, 11.5684814453125, 11.9921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 9.0, 6.0, 11.0, 11.0, 15.0, 23.0, 19.0, 26.0, 19.0, 23.0, 39.0, 25.0, 32.0, 37.0, 38.0, 52.0, 43.0, 52.0, 40.0, 35.0, 58.0, 34.0, 47.0, 37.0, 29.0, 31.0, 25.0, 30.0, 28.0, 20.0, 17.0, 11.0, 11.0, 11.0, 6.0, 15.0, 5.0, 4.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.890625, -4.7554931640625, -4.620361328125, -4.4852294921875, -4.35009765625, -4.2149658203125, -4.079833984375, -3.9447021484375, -3.8095703125, -3.6744384765625, -3.539306640625, -3.4041748046875, -3.26904296875, -3.1339111328125, -2.998779296875, -2.8636474609375, -2.728515625, -2.5933837890625, -2.458251953125, -2.3231201171875, -2.18798828125, -2.0528564453125, -1.917724609375, -1.7825927734375, -1.6474609375, -1.5123291015625, -1.377197265625, -1.2420654296875, -1.10693359375, -0.9718017578125, -0.836669921875, -0.7015380859375, -0.56640625, -0.4312744140625, -0.296142578125, -0.1610107421875, -0.02587890625, 0.1092529296875, 0.244384765625, 0.3795166015625, 0.5146484375, 0.6497802734375, 0.784912109375, 0.9200439453125, 1.05517578125, 1.1903076171875, 1.325439453125, 1.4605712890625, 1.595703125, 1.7308349609375, 1.865966796875, 2.0010986328125, 2.13623046875, 2.2713623046875, 2.406494140625, 2.5416259765625, 2.6767578125, 2.8118896484375, 2.947021484375, 3.0821533203125, 3.21728515625, 3.3524169921875, 3.487548828125, 3.6226806640625, 3.7578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 10.0, 6.0, 18.0, 17.0, 52.0, 64.0, 136.0, 247.0, 568.0, 1527.0, 5046.0, 23871.0, 201854.0, 728683.0, 70499.0, 11336.0, 2753.0, 1002.0, 389.0, 201.0, 104.0, 62.0, 31.0, 19.0, 15.0, 8.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.6279296875, -1.584259033203125, -1.54058837890625, -1.496917724609375, -1.4532470703125, -1.409576416015625, -1.36590576171875, -1.322235107421875, -1.278564453125, -1.234893798828125, -1.19122314453125, -1.147552490234375, -1.1038818359375, -1.060211181640625, -1.01654052734375, -0.972869873046875, -0.92919921875, -0.885528564453125, -0.84185791015625, -0.798187255859375, -0.7545166015625, -0.710845947265625, -0.66717529296875, -0.623504638671875, -0.579833984375, -0.536163330078125, -0.49249267578125, -0.448822021484375, -0.4051513671875, -0.361480712890625, -0.31781005859375, -0.274139404296875, -0.23046875, -0.186798095703125, -0.14312744140625, -0.099456787109375, -0.0557861328125, -0.012115478515625, 0.03155517578125, 0.075225830078125, 0.118896484375, 0.162567138671875, 0.20623779296875, 0.249908447265625, 0.2935791015625, 0.337249755859375, 0.38092041015625, 0.424591064453125, 0.46826171875, 0.511932373046875, 0.55560302734375, 0.599273681640625, 0.6429443359375, 0.686614990234375, 0.73028564453125, 0.773956298828125, 0.817626953125, 0.861297607421875, 0.90496826171875, 0.948638916015625, 0.9923095703125, 1.035980224609375, 1.07965087890625, 1.123321533203125, 1.1669921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 12.0, 16.0, 22.0, 38.0, 48.0, 55.0, 67.0, 75.0, 104.0, 105.0, 87.0, 58.0, 60.0, 49.0, 27.0, 27.0, 28.0, 13.0, 10.0, 17.0, 10.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00015115737915039062, -0.00014696363359689713, -0.00014276988804340363, -0.00013857614248991013, -0.00013438239693641663, -0.00013018865138292313, -0.00012599490582942963, -0.00012180116027593613, -0.00011760741472244263, -0.00011341366916894913, -0.00010921992361545563, -0.00010502617806196213, -0.00010083243250846863, -9.663868695497513e-05, -9.244494140148163e-05, -8.825119584798813e-05, -8.405745029449463e-05, -7.986370474100113e-05, -7.566995918750763e-05, -7.147621363401413e-05, -6.728246808052063e-05, -6.308872252702713e-05, -5.889497697353363e-05, -5.470123142004013e-05, -5.050748586654663e-05, -4.631374031305313e-05, -4.211999475955963e-05, -3.792624920606613e-05, -3.373250365257263e-05, -2.9538758099079132e-05, -2.5345012545585632e-05, -2.1151266992092133e-05, -1.6957521438598633e-05, -1.2763775885105133e-05, -8.570030331611633e-06, -4.3762847781181335e-06, -1.825392246246338e-07, 4.011206328868866e-06, 8.204951882362366e-06, 1.2398697435855865e-05, 1.6592442989349365e-05, 2.0786188542842865e-05, 2.4979934096336365e-05, 2.9173679649829865e-05, 3.3367425203323364e-05, 3.7561170756816864e-05, 4.1754916310310364e-05, 4.5948661863803864e-05, 5.014240741729736e-05, 5.433615297079086e-05, 5.852989852428436e-05, 6.272364407777786e-05, 6.691738963127136e-05, 7.111113518476486e-05, 7.530488073825836e-05, 7.949862629175186e-05, 8.369237184524536e-05, 8.788611739873886e-05, 9.207986295223236e-05, 9.627360850572586e-05, 0.00010046735405921936, 0.00010466109961271286, 0.00010885484516620636, 0.00011304859071969986, 0.00011724233627319336]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 13.0, 13.0, 26.0, 35.0, 46.0, 75.0, 102.0, 196.0, 392.0, 885.0, 2099.0, 6110.0, 22624.0, 121482.0, 703657.0, 152688.0, 26844.0, 7010.0, 2269.0, 984.0, 411.0, 238.0, 126.0, 86.0, 43.0, 37.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.939453125, -0.90655517578125, -0.8736572265625, -0.84075927734375, -0.807861328125, -0.77496337890625, -0.7420654296875, -0.70916748046875, -0.67626953125, -0.64337158203125, -0.6104736328125, -0.57757568359375, -0.544677734375, -0.51177978515625, -0.4788818359375, -0.44598388671875, -0.4130859375, -0.38018798828125, -0.3472900390625, -0.31439208984375, -0.281494140625, -0.24859619140625, -0.2156982421875, -0.18280029296875, -0.14990234375, -0.11700439453125, -0.0841064453125, -0.05120849609375, -0.018310546875, 0.01458740234375, 0.0474853515625, 0.08038330078125, 0.11328125, 0.14617919921875, 0.1790771484375, 0.21197509765625, 0.244873046875, 0.27777099609375, 0.3106689453125, 0.34356689453125, 0.37646484375, 0.40936279296875, 0.4422607421875, 0.47515869140625, 0.508056640625, 0.54095458984375, 0.5738525390625, 0.60675048828125, 0.6396484375, 0.67254638671875, 0.7054443359375, 0.73834228515625, 0.771240234375, 0.80413818359375, 0.8370361328125, 0.86993408203125, 0.90283203125, 0.93572998046875, 0.9686279296875, 1.00152587890625, 1.034423828125, 1.06732177734375, 1.1002197265625, 1.13311767578125, 1.166015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 10.0, 15.0, 28.0, 25.0, 46.0, 68.0, 107.0, 152.0, 152.0, 128.0, 84.0, 44.0, 42.0, 31.0, 18.0, 7.0, 5.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5000381469726562, -0.4810333251953125, -0.46202850341796875, -0.443023681640625, -0.42401885986328125, -0.4050140380859375, -0.38600921630859375, -0.36700439453125, -0.34799957275390625, -0.3289947509765625, -0.30998992919921875, -0.290985107421875, -0.27198028564453125, -0.2529754638671875, -0.23397064208984375, -0.2149658203125, -0.19596099853515625, -0.1769561767578125, -0.15795135498046875, -0.138946533203125, -0.11994171142578125, -0.1009368896484375, -0.08193206787109375, -0.06292724609375, -0.04392242431640625, -0.0249176025390625, -0.00591278076171875, 0.013092041015625, 0.03209686279296875, 0.0511016845703125, 0.07010650634765625, 0.089111328125, 0.10811614990234375, 0.1271209716796875, 0.14612579345703125, 0.165130615234375, 0.18413543701171875, 0.2031402587890625, 0.22214508056640625, 0.24114990234375, 0.26015472412109375, 0.2791595458984375, 0.29816436767578125, 0.317169189453125, 0.33617401123046875, 0.3551788330078125, 0.37418365478515625, 0.3931884765625, 0.41219329833984375, 0.4311981201171875, 0.45020294189453125, 0.469207763671875, 0.48821258544921875, 0.5072174072265625, 0.5262222290039062, 0.54522705078125, 0.5642318725585938, 0.5832366943359375, 0.6022415161132812, 0.621246337890625, 0.6402511596679688, 0.6592559814453125, 0.6782608032226562, 0.697265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 34.0, 185.0, 526.0, 197.0, 35.0, 13.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-55.455902099609375, -54.43771743774414, -53.41952896118164, -52.401344299316406, -51.383155822753906, -50.36497116088867, -49.34678649902344, -48.32859802246094, -47.3104133605957, -46.29222869873047, -45.27404022216797, -44.255855560302734, -43.2376708984375, -42.219482421875, -41.201297760009766, -40.183109283447266, -39.16492462158203, -38.1467399597168, -37.1285514831543, -36.11036682128906, -35.09217834472656, -34.07399368286133, -33.055809020996094, -32.037620544433594, -31.01943588256836, -30.001249313354492, -28.983062744140625, -27.96487808227539, -26.946691513061523, -25.928504943847656, -24.910320281982422, -23.892133712768555, -22.873950958251953, -21.855764389038086, -20.83757781982422, -19.819393157958984, -18.801206588745117, -17.78302001953125, -16.764835357666016, -15.746648788452148, -14.728461265563965, -13.710275650024414, -12.692089080810547, -11.67390251159668, -10.655716896057129, -9.637531280517578, -8.619344711303711, -7.601158618927002, -6.582972526550293, -5.564786434173584, -4.546600341796875, -3.528414249420166, -2.510228157043457, -1.492042064666748, -0.47385597229003906, 0.5443301200866699, 1.562516212463379, 2.580702304840088, 3.598888397216797, 4.617074489593506, 5.635260581970215, 6.653446674346924, 7.671632766723633, 8.6898193359375, 9.70800495147705]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 13.0, 8.0, 13.0, 15.0, 26.0, 31.0, 34.0, 46.0, 47.0, 58.0, 58.0, 63.0, 69.0, 68.0, 57.0, 53.0, 49.0, 58.0, 40.0, 23.0, 28.0, 25.0, 27.0, 25.0, 11.0, 8.0, 9.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.137054443359375, -8.83527660369873, -8.533498764038086, -8.231721878051758, -7.929944038391113, -7.628166198730469, -7.326388835906982, -7.024611473083496, -6.722833633422852, -6.421055793762207, -6.119278430938721, -5.817501068115234, -5.51572322845459, -5.213945388793945, -4.912168025970459, -4.610390663146973, -4.308612823486328, -4.006834983825684, -3.7050576210021973, -3.403280019760132, -3.1015024185180664, -2.799724817276001, -2.4979472160339355, -2.19616961479187, -1.8943920135498047, -1.5926144123077393, -1.2908368110656738, -0.9890592098236084, -0.687281608581543, -0.38550400733947754, -0.08372640609741211, 0.21805119514465332, 0.5198287963867188, 0.8216063976287842, 1.1233839988708496, 1.425161600112915, 1.7269392013549805, 2.028716802597046, 2.3304944038391113, 2.6322720050811768, 2.934049606323242, 3.2358272075653076, 3.537604808807373, 3.8393824100494385, 4.141160011291504, 4.442937850952148, 4.744715213775635, 5.046492576599121, 5.348270416259766, 5.65004825592041, 5.9518256187438965, 6.253602981567383, 6.555380821228027, 6.857158660888672, 7.158936023712158, 7.4607133865356445, 7.762491226196289, 8.064269065856934, 8.366046905517578, 8.667823791503906, 8.96960163116455, 9.271379470825195, 9.573156356811523, 9.874934196472168, 10.176712036132812]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 11.0, 8.0, 14.0, 12.0, 8.0, 21.0, 16.0, 26.0, 34.0, 41.0, 44.0, 74.0, 155.0, 642.0, 3474.0, 42414.0, 3751925.0, 380710.0, 12305.0, 1595.0, 368.0, 115.0, 62.0, 34.0, 25.0, 26.0, 26.0, 22.0, 10.0, 10.0, 5.0, 7.0, 12.0, 6.0, 8.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1015625, -8.7738037109375, -8.446044921875, -8.1182861328125, -7.79052734375, -7.4627685546875, -7.135009765625, -6.8072509765625, -6.4794921875, -6.1517333984375, -5.823974609375, -5.4962158203125, -5.16845703125, -4.8406982421875, -4.512939453125, -4.1851806640625, -3.857421875, -3.5296630859375, -3.201904296875, -2.8741455078125, -2.54638671875, -2.2186279296875, -1.890869140625, -1.5631103515625, -1.2353515625, -0.9075927734375, -0.579833984375, -0.2520751953125, 0.07568359375, 0.4034423828125, 0.731201171875, 1.0589599609375, 1.38671875, 1.7144775390625, 2.042236328125, 2.3699951171875, 2.69775390625, 3.0255126953125, 3.353271484375, 3.6810302734375, 4.0087890625, 4.3365478515625, 4.664306640625, 4.9920654296875, 5.31982421875, 5.6475830078125, 5.975341796875, 6.3031005859375, 6.630859375, 6.9586181640625, 7.286376953125, 7.6141357421875, 7.94189453125, 8.2696533203125, 8.597412109375, 8.9251708984375, 9.2529296875, 9.5806884765625, 9.908447265625, 10.2362060546875, 10.56396484375, 10.8917236328125, 11.219482421875, 11.5472412109375, 11.875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 7.0, 9.0, 12.0, 20.0, 42.0, 64.0, 67.0, 101.0, 119.0, 133.0, 128.0, 98.0, 73.0, 49.0, 22.0, 29.0, 14.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.25, -7.07904052734375, -6.9080810546875, -6.73712158203125, -6.566162109375, -6.39520263671875, -6.2242431640625, -6.05328369140625, -5.88232421875, -5.71136474609375, -5.5404052734375, -5.36944580078125, -5.198486328125, -5.02752685546875, -4.8565673828125, -4.68560791015625, -4.5146484375, -4.34368896484375, -4.1727294921875, -4.00177001953125, -3.830810546875, -3.65985107421875, -3.4888916015625, -3.31793212890625, -3.14697265625, -2.97601318359375, -2.8050537109375, -2.63409423828125, -2.463134765625, -2.29217529296875, -2.1212158203125, -1.95025634765625, -1.779296875, -1.60833740234375, -1.4373779296875, -1.26641845703125, -1.095458984375, -0.92449951171875, -0.7535400390625, -0.58258056640625, -0.41162109375, -0.24066162109375, -0.0697021484375, 0.10125732421875, 0.272216796875, 0.44317626953125, 0.6141357421875, 0.78509521484375, 0.9560546875, 1.12701416015625, 1.2979736328125, 1.46893310546875, 1.639892578125, 1.81085205078125, 1.9818115234375, 2.15277099609375, 2.32373046875, 2.49468994140625, 2.6656494140625, 2.83660888671875, 3.007568359375, 3.17852783203125, 3.3494873046875, 3.52044677734375, 3.69140625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 18.0, 17.0, 55.0, 183.0, 956.0, 308804.0, 3882414.0, 1484.0, 207.0, 70.0, 29.0, 15.0, 12.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.171875, -27.2939453125, -26.416015625, -25.5380859375, -24.66015625, -23.7822265625, -22.904296875, -22.0263671875, -21.1484375, -20.2705078125, -19.392578125, -18.5146484375, -17.63671875, -16.7587890625, -15.880859375, -15.0029296875, -14.125, -13.2470703125, -12.369140625, -11.4912109375, -10.61328125, -9.7353515625, -8.857421875, -7.9794921875, -7.1015625, -6.2236328125, -5.345703125, -4.4677734375, -3.58984375, -2.7119140625, -1.833984375, -0.9560546875, -0.078125, 0.7998046875, 1.677734375, 2.5556640625, 3.43359375, 4.3115234375, 5.189453125, 6.0673828125, 6.9453125, 7.8232421875, 8.701171875, 9.5791015625, 10.45703125, 11.3349609375, 12.212890625, 13.0908203125, 13.96875, 14.8466796875, 15.724609375, 16.6025390625, 17.48046875, 18.3583984375, 19.236328125, 20.1142578125, 20.9921875, 21.8701171875, 22.748046875, 23.6259765625, 24.50390625, 25.3818359375, 26.259765625, 27.1376953125, 28.015625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 12.0, 23.0, 38.0, 59.0, 71.0, 92.0, 130.0, 186.0, 315.0, 608.0, 967.0, 533.0, 314.0, 218.0, 128.0, 95.0, 74.0, 39.0, 29.0, 24.0, 18.0, 13.0, 11.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.002532958984375, -0.96600341796875, -0.929473876953125, -0.8929443359375, -0.856414794921875, -0.81988525390625, -0.783355712890625, -0.746826171875, -0.710296630859375, -0.67376708984375, -0.637237548828125, -0.6007080078125, -0.564178466796875, -0.52764892578125, -0.491119384765625, -0.45458984375, -0.418060302734375, -0.38153076171875, -0.345001220703125, -0.3084716796875, -0.271942138671875, -0.23541259765625, -0.198883056640625, -0.162353515625, -0.125823974609375, -0.08929443359375, -0.052764892578125, -0.0162353515625, 0.020294189453125, 0.05682373046875, 0.093353271484375, 0.1298828125, 0.166412353515625, 0.20294189453125, 0.239471435546875, 0.2760009765625, 0.312530517578125, 0.34906005859375, 0.385589599609375, 0.422119140625, 0.458648681640625, 0.49517822265625, 0.531707763671875, 0.5682373046875, 0.604766845703125, 0.64129638671875, 0.677825927734375, 0.71435546875, 0.750885009765625, 0.78741455078125, 0.823944091796875, 0.8604736328125, 0.897003173828125, 0.93353271484375, 0.970062255859375, 1.006591796875, 1.043121337890625, 1.07965087890625, 1.116180419921875, 1.1527099609375, 1.189239501953125, 1.22576904296875, 1.262298583984375, 1.298828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 18.0, 23.0, 32.0, 53.0, 84.0, 113.0, 144.0, 138.0, 126.0, 72.0, 65.0, 37.0, 15.0, 16.0, 12.0, 7.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.720313549041748, -4.545834064483643, -4.371354579925537, -4.196875095367432, -4.022396087646484, -3.8479163646698, -3.6734371185302734, -3.498957633972168, -3.3244781494140625, -3.149998664855957, -2.9755191802978516, -2.801039934158325, -2.6265604496002197, -2.4520809650421143, -2.277601718902588, -2.1031222343444824, -1.928642749786377, -1.7541632652282715, -1.5796838998794556, -1.4052045345306396, -1.2307250499725342, -1.0562455654144287, -0.8817662000656128, -0.7072868347167969, -0.5328073501586914, -0.3583279252052307, -0.18384850025177002, -0.009369075298309326, 0.16511034965515137, 0.33958977460861206, 0.5140691995620728, 0.6885485649108887, 0.8630285263061523, 1.0375080108642578, 1.2119873762130737, 1.3864667415618896, 1.5609462261199951, 1.7354257106781006, 1.9099050760269165, 2.0843844413757324, 2.258863925933838, 2.4333434104919434, 2.607822895050049, 2.782302141189575, 2.9567816257476807, 3.131261110305786, 3.3057403564453125, 3.480219841003418, 3.6546993255615234, 3.829178810119629, 4.003658294677734, 4.17813777923584, 4.352617263793945, 4.527096271514893, 4.701575756072998, 4.8760552406311035, 5.050534725189209, 5.2250142097473145, 5.39949369430542, 5.573973178863525, 5.748452186584473, 5.922931671142578, 6.097411155700684, 6.271890640258789, 6.4463701248168945]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 6.0, 16.0, 29.0, 42.0, 60.0, 53.0, 93.0, 84.0, 111.0, 95.0, 90.0, 67.0, 78.0, 49.0, 31.0, 22.0, 25.0, 15.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.394373416900635, -6.220241546630859, -6.046109199523926, -5.87197732925415, -5.697845458984375, -5.523713111877441, -5.349581241607666, -5.175449371337891, -5.001317024230957, -4.827185153961182, -4.653052806854248, -4.478920936584473, -4.304789066314697, -4.130657196044922, -3.9565248489379883, -3.782392978668213, -3.6082611083984375, -3.434128999710083, -3.2599971294403076, -3.085865020751953, -2.9117331504821777, -2.7376010417938232, -2.5634689331054688, -2.3893370628356934, -2.215204954147339, -2.0410728454589844, -1.866940975189209, -1.6928088665008545, -1.5186768770217896, -1.3445448875427246, -1.1704127788543701, -0.9962807893753052, -0.8221492767333984, -0.6480172872543335, -0.4738852381706238, -0.29975318908691406, -0.12562119960784912, 0.04851078987121582, 0.2226428985595703, 0.39677488803863525, 0.5709068775177002, 0.7450388669967651, 0.9191709160804749, 1.0933029651641846, 1.2674349546432495, 1.4415669441223145, 1.615699052810669, 1.7898310422897339, 1.9639630317687988, 2.1380951404571533, 2.3122270107269287, 2.486359119415283, 2.6604909896850586, 2.834623098373413, 3.0087552070617676, 3.182887077331543, 3.3570191860198975, 3.531151294708252, 3.7052831649780273, 3.879415273666382, 4.053547382354736, 4.227679252624512, 4.401811599731445, 4.575943470001221, 4.750075340270996]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 13.0, 12.0, 14.0, 25.0, 43.0, 87.0, 179.0, 514.0, 1607.0, 14641.0, 980156.0, 47379.0, 2697.0, 671.0, 239.0, 111.0, 65.0, 31.0, 21.0, 21.0, 8.0, 6.0, 4.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3971710205078125, -1.356842041015625, -1.3165130615234375, -1.27618408203125, -1.2358551025390625, -1.195526123046875, -1.1551971435546875, -1.1148681640625, -1.0745391845703125, -1.034210205078125, -0.9938812255859375, -0.95355224609375, -0.9132232666015625, -0.872894287109375, -0.8325653076171875, -0.792236328125, -0.7519073486328125, -0.711578369140625, -0.6712493896484375, -0.63092041015625, -0.5905914306640625, -0.550262451171875, -0.5099334716796875, -0.4696044921875, -0.4292755126953125, -0.388946533203125, -0.3486175537109375, -0.30828857421875, -0.2679595947265625, -0.227630615234375, -0.1873016357421875, -0.14697265625, -0.1066436767578125, -0.066314697265625, -0.0259857177734375, 0.01434326171875, 0.0546722412109375, 0.095001220703125, 0.1353302001953125, 0.1756591796875, 0.2159881591796875, 0.256317138671875, 0.2966461181640625, 0.33697509765625, 0.3773040771484375, 0.417633056640625, 0.4579620361328125, 0.498291015625, 0.5386199951171875, 0.578948974609375, 0.6192779541015625, 0.65960693359375, 0.6999359130859375, 0.740264892578125, 0.7805938720703125, 0.8209228515625, 0.8612518310546875, 0.901580810546875, 0.9419097900390625, 0.98223876953125, 1.0225677490234375, 1.062896728515625, 1.1032257080078125, 1.1435546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 10.0, 13.0, 30.0, 46.0, 76.0, 79.0, 104.0, 129.0, 105.0, 113.0, 89.0, 55.0, 40.0, 28.0, 21.0, 15.0, 8.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.4813232421875, -4.353271484375, -4.2252197265625, -4.09716796875, -3.9691162109375, -3.841064453125, -3.7130126953125, -3.5849609375, -3.4569091796875, -3.328857421875, -3.2008056640625, -3.07275390625, -2.9447021484375, -2.816650390625, -2.6885986328125, -2.560546875, -2.4324951171875, -2.304443359375, -2.1763916015625, -2.04833984375, -1.9202880859375, -1.792236328125, -1.6641845703125, -1.5361328125, -1.4080810546875, -1.280029296875, -1.1519775390625, -1.02392578125, -0.8958740234375, -0.767822265625, -0.6397705078125, -0.51171875, -0.3836669921875, -0.255615234375, -0.1275634765625, 0.00048828125, 0.1285400390625, 0.256591796875, 0.3846435546875, 0.5126953125, 0.6407470703125, 0.768798828125, 0.8968505859375, 1.02490234375, 1.1529541015625, 1.281005859375, 1.4090576171875, 1.537109375, 1.6651611328125, 1.793212890625, 1.9212646484375, 2.04931640625, 2.1773681640625, 2.305419921875, 2.4334716796875, 2.5615234375, 2.6895751953125, 2.817626953125, 2.9456787109375, 3.07373046875, 3.2017822265625, 3.329833984375, 3.4578857421875, 3.5859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 15.0, 14.0, 22.0, 21.0, 37.0, 55.0, 65.0, 60.0, 99.0, 145.0, 199.0, 308.0, 449.0, 941.0, 3785.0, 40511.0, 622197.0, 354332.0, 20653.0, 2556.0, 721.0, 405.0, 281.0, 180.0, 114.0, 78.0, 64.0, 57.0, 38.0, 25.0, 22.0, 9.0, 20.0, 13.0, 12.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.384521484375, -0.37380218505859375, -0.3630828857421875, -0.35236358642578125, -0.341644287109375, -0.33092498779296875, -0.3202056884765625, -0.30948638916015625, -0.29876708984375, -0.28804779052734375, -0.2773284912109375, -0.26660919189453125, -0.255889892578125, -0.24517059326171875, -0.2344512939453125, -0.22373199462890625, -0.2130126953125, -0.20229339599609375, -0.1915740966796875, -0.18085479736328125, -0.170135498046875, -0.15941619873046875, -0.1486968994140625, -0.13797760009765625, -0.12725830078125, -0.11653900146484375, -0.1058197021484375, -0.09510040283203125, -0.084381103515625, -0.07366180419921875, -0.0629425048828125, -0.05222320556640625, -0.04150390625, -0.03078460693359375, -0.0200653076171875, -0.00934600830078125, 0.001373291015625, 0.01209259033203125, 0.0228118896484375, 0.03353118896484375, 0.04425048828125, 0.05496978759765625, 0.0656890869140625, 0.07640838623046875, 0.087127685546875, 0.09784698486328125, 0.1085662841796875, 0.11928558349609375, 0.1300048828125, 0.14072418212890625, 0.1514434814453125, 0.16216278076171875, 0.172882080078125, 0.18360137939453125, 0.1943206787109375, 0.20503997802734375, 0.21575927734375, 0.22647857666015625, 0.2371978759765625, 0.24791717529296875, 0.258636474609375, 0.26935577392578125, 0.2800750732421875, 0.29079437255859375, 0.301513671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 11.0, 6.0, 20.0, 11.0, 11.0, 18.0, 22.0, 32.0, 32.0, 32.0, 29.0, 48.0, 44.0, 38.0, 37.0, 41.0, 54.0, 43.0, 55.0, 50.0, 38.0, 43.0, 48.0, 34.0, 33.0, 25.0, 22.0, 16.0, 11.0, 11.0, 13.0, 13.0, 7.0, 13.0, 4.0, 5.0, 4.0, 5.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.39453125, -3.292022705078125, -3.18951416015625, -3.087005615234375, -2.9844970703125, -2.881988525390625, -2.77947998046875, -2.676971435546875, -2.574462890625, -2.471954345703125, -2.36944580078125, -2.266937255859375, -2.1644287109375, -2.061920166015625, -1.95941162109375, -1.856903076171875, -1.75439453125, -1.651885986328125, -1.54937744140625, -1.446868896484375, -1.3443603515625, -1.241851806640625, -1.13934326171875, -1.036834716796875, -0.934326171875, -0.831817626953125, -0.72930908203125, -0.626800537109375, -0.5242919921875, -0.421783447265625, -0.31927490234375, -0.216766357421875, -0.1142578125, -0.011749267578125, 0.09075927734375, 0.193267822265625, 0.2957763671875, 0.398284912109375, 0.50079345703125, 0.603302001953125, 0.705810546875, 0.808319091796875, 0.91082763671875, 1.013336181640625, 1.1158447265625, 1.218353271484375, 1.32086181640625, 1.423370361328125, 1.52587890625, 1.628387451171875, 1.73089599609375, 1.833404541015625, 1.9359130859375, 2.038421630859375, 2.14093017578125, 2.243438720703125, 2.345947265625, 2.448455810546875, 2.55096435546875, 2.653472900390625, 2.7559814453125, 2.858489990234375, 2.96099853515625, 3.063507080078125, 3.166015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 18.0, 16.0, 31.0, 22.0, 40.0, 65.0, 78.0, 96.0, 208.0, 351.0, 838.0, 3102.0, 78108.0, 951016.0, 11870.0, 1404.0, 503.0, 248.0, 164.0, 94.0, 72.0, 51.0, 28.0, 17.0, 20.0, 6.0, 15.0, 7.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10089111328125, -0.09673404693603516, -0.09257698059082031, -0.08841991424560547, -0.08426284790039062, -0.08010578155517578, -0.07594871520996094, -0.0717916488647461, -0.06763458251953125, -0.0634775161743164, -0.05932044982910156, -0.05516338348388672, -0.051006317138671875, -0.04684925079345703, -0.04269218444824219, -0.038535118103027344, -0.0343780517578125, -0.030220985412597656, -0.026063919067382812, -0.02190685272216797, -0.017749786376953125, -0.013592720031738281, -0.009435653686523438, -0.005278587341308594, -0.00112152099609375, 0.0030355453491210938, 0.0071926116943359375, 0.011349678039550781, 0.015506744384765625, 0.01966381072998047, 0.023820877075195312, 0.027977943420410156, 0.032135009765625, 0.036292076110839844, 0.04044914245605469, 0.04460620880126953, 0.048763275146484375, 0.05292034149169922, 0.05707740783691406, 0.061234474182128906, 0.06539154052734375, 0.0695486068725586, 0.07370567321777344, 0.07786273956298828, 0.08201980590820312, 0.08617687225341797, 0.09033393859863281, 0.09449100494384766, 0.0986480712890625, 0.10280513763427734, 0.10696220397949219, 0.11111927032470703, 0.11527633666992188, 0.11943340301513672, 0.12359046936035156, 0.1277475357055664, 0.13190460205078125, 0.1360616683959961, 0.14021873474121094, 0.14437580108642578, 0.14853286743164062, 0.15268993377685547, 0.1568470001220703, 0.16100406646728516, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 1.0, 7.0, 11.0, 12.0, 12.0, 11.0, 8.0, 23.0, 29.0, 22.0, 36.0, 43.0, 50.0, 64.0, 72.0, 78.0, 75.0, 60.0, 59.0, 53.0, 53.0, 44.0, 30.0, 23.0, 25.0, 24.0, 13.0, 8.0, 7.0, 2.0, 6.0, 0.0, 6.0, 6.0, 1.0, 4.0, 0.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.47955322265625e-05, -2.3974105715751648e-05, -2.3152679204940796e-05, -2.2331252694129944e-05, -2.1509826183319092e-05, -2.068839967250824e-05, -1.9866973161697388e-05, -1.9045546650886536e-05, -1.8224120140075684e-05, -1.740269362926483e-05, -1.658126711845398e-05, -1.5759840607643127e-05, -1.4938414096832275e-05, -1.4116987586021423e-05, -1.3295561075210571e-05, -1.247413456439972e-05, -1.1652708053588867e-05, -1.0831281542778015e-05, -1.0009855031967163e-05, -9.188428521156311e-06, -8.367002010345459e-06, -7.545575499534607e-06, -6.724148988723755e-06, -5.902722477912903e-06, -5.081295967102051e-06, -4.259869456291199e-06, -3.4384429454803467e-06, -2.6170164346694946e-06, -1.7955899238586426e-06, -9.741634130477905e-07, -1.5273690223693848e-07, 6.686896085739136e-07, 1.4901161193847656e-06, 2.3115426301956177e-06, 3.1329691410064697e-06, 3.954395651817322e-06, 4.775822162628174e-06, 5.597248673439026e-06, 6.418675184249878e-06, 7.24010169506073e-06, 8.061528205871582e-06, 8.882954716682434e-06, 9.704381227493286e-06, 1.0525807738304138e-05, 1.134723424911499e-05, 1.2168660759925842e-05, 1.2990087270736694e-05, 1.3811513781547546e-05, 1.4632940292358398e-05, 1.545436680316925e-05, 1.6275793313980103e-05, 1.7097219824790955e-05, 1.7918646335601807e-05, 1.874007284641266e-05, 1.956149935722351e-05, 2.0382925868034363e-05, 2.1204352378845215e-05, 2.2025778889656067e-05, 2.284720540046692e-05, 2.366863191127777e-05, 2.4490058422088623e-05, 2.5311484932899475e-05, 2.6132911443710327e-05, 2.695433795452118e-05, 2.777576446533203e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 4.0, 6.0, 9.0, 15.0, 20.0, 25.0, 48.0, 74.0, 114.0, 189.0, 350.0, 673.0, 1288.0, 2848.0, 7322.0, 27330.0, 260808.0, 683601.0, 46311.0, 10461.0, 3718.0, 1532.0, 770.0, 421.0, 250.0, 148.0, 69.0, 43.0, 25.0, 26.0, 13.0, 10.0, 11.0, 5.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.0767812728881836, -0.07372856140136719, -0.07067584991455078, -0.06762313842773438, -0.06457042694091797, -0.06151771545410156, -0.058465003967285156, -0.05541229248046875, -0.052359580993652344, -0.04930686950683594, -0.04625415802001953, -0.043201446533203125, -0.04014873504638672, -0.03709602355957031, -0.034043312072753906, -0.0309906005859375, -0.027937889099121094, -0.024885177612304688, -0.02183246612548828, -0.018779754638671875, -0.01572704315185547, -0.012674331665039062, -0.009621620178222656, -0.00656890869140625, -0.0035161972045898438, -0.0004634857177734375, 0.0025892257690429688, 0.005641937255859375, 0.008694648742675781, 0.011747360229492188, 0.014800071716308594, 0.017852783203125, 0.020905494689941406, 0.023958206176757812, 0.02701091766357422, 0.030063629150390625, 0.03311634063720703, 0.03616905212402344, 0.039221763610839844, 0.04227447509765625, 0.045327186584472656, 0.04837989807128906, 0.05143260955810547, 0.054485321044921875, 0.05753803253173828, 0.06059074401855469, 0.0636434555053711, 0.0666961669921875, 0.0697488784790039, 0.07280158996582031, 0.07585430145263672, 0.07890701293945312, 0.08195972442626953, 0.08501243591308594, 0.08806514739990234, 0.09111785888671875, 0.09417057037353516, 0.09722328186035156, 0.10027599334716797, 0.10332870483398438, 0.10638141632080078, 0.10943412780761719, 0.1124868392944336, 0.11553955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 12.0, 11.0, 5.0, 12.0, 24.0, 40.0, 68.0, 116.0, 222.0, 208.0, 117.0, 52.0, 22.0, 19.0, 20.0, 8.0, 10.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.033660888671875, -0.032837629318237305, -0.03201436996459961, -0.031191110610961914, -0.03036785125732422, -0.029544591903686523, -0.028721332550048828, -0.027898073196411133, -0.027074813842773438, -0.026251554489135742, -0.025428295135498047, -0.02460503578186035, -0.023781776428222656, -0.02295851707458496, -0.022135257720947266, -0.02131199836730957, -0.020488739013671875, -0.01966547966003418, -0.018842220306396484, -0.01801896095275879, -0.017195701599121094, -0.0163724422454834, -0.015549182891845703, -0.014725923538208008, -0.013902664184570312, -0.013079404830932617, -0.012256145477294922, -0.011432886123657227, -0.010609626770019531, -0.009786367416381836, -0.00896310806274414, -0.008139848709106445, -0.00731658935546875, -0.006493330001831055, -0.005670070648193359, -0.004846811294555664, -0.004023551940917969, -0.0032002925872802734, -0.002377033233642578, -0.0015537738800048828, -0.0007305145263671875, 9.274482727050781e-05, 0.0009160041809082031, 0.0017392635345458984, 0.0025625228881835938, 0.003385782241821289, 0.004209041595458984, 0.00503230094909668, 0.005855560302734375, 0.00667881965637207, 0.007502079010009766, 0.008325338363647461, 0.009148597717285156, 0.009971857070922852, 0.010795116424560547, 0.011618375778198242, 0.012441635131835938, 0.013264894485473633, 0.014088153839111328, 0.014911413192749023, 0.01573467254638672, 0.016557931900024414, 0.01738119125366211, 0.018204450607299805, 0.0190277099609375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 14.0, 32.0, 44.0, 75.0, 157.0, 184.0, 199.0, 105.0, 69.0, 33.0, 24.0, 14.0, 6.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.593433856964111, -5.445555686950684, -5.297677516937256, -5.149799823760986, -5.001921653747559, -4.854043483734131, -4.706165313720703, -4.558287143707275, -4.410408973693848, -4.26253080368042, -4.114652633666992, -3.9667747020721436, -3.818896770477295, -3.671018600463867, -3.5231404304504395, -3.3752622604370117, -3.227384567260742, -3.0795063972473145, -2.931628465652466, -2.783750295639038, -2.6358723640441895, -2.4879941940307617, -2.340116024017334, -2.1922378540039062, -2.0443599224090576, -1.8964818716049194, -1.7486038208007812, -1.6007256507873535, -1.4528475999832153, -1.3049695491790771, -1.1570913791656494, -1.0092133283615112, -0.8613357543945312, -0.7134577035903931, -0.5655795931816101, -0.41770151257514954, -0.26982343196868896, -0.12194538116455078, 0.025932729244232178, 0.17381083965301514, 0.3216888904571533, 0.4695669710636139, 0.6174450516700745, 0.7653231620788574, 0.9132012128829956, 1.0610792636871338, 1.2089574337005615, 1.3568354845046997, 1.504713535308838, 1.652591586112976, 1.8004696369171143, 1.948347806930542, 2.0962257385253906, 2.2441039085388184, 2.391982078552246, 2.539860248565674, 2.6877381801605225, 2.83561635017395, 2.983494281768799, 3.1313724517822266, 3.2792506217956543, 3.427128553390503, 3.5750067234039307, 3.7228846549987793, 3.870762825012207]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 12.0, 13.0, 28.0, 49.0, 71.0, 90.0, 108.0, 140.0, 127.0, 103.0, 77.0, 56.0, 36.0, 26.0, 20.0, 11.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.927026271820068, -4.793264865875244, -4.659503936767578, -4.525742530822754, -4.39198112487793, -4.2582197189331055, -4.1244587898254395, -3.9906973838806152, -3.85693621635437, -3.723175048828125, -3.589413642883301, -3.4556524753570557, -3.3218913078308105, -3.1881299018859863, -3.054368734359741, -2.920607566833496, -2.786846160888672, -2.6530849933624268, -2.5193235874176025, -2.3855624198913574, -2.251801013946533, -2.118039846420288, -1.984278678894043, -1.8505173921585083, -1.7167561054229736, -1.582994818687439, -1.4492335319519043, -1.3154723644256592, -1.1817110776901245, -1.0479497909545898, -0.9141885638237, -0.7804273366928101, -0.6466658115386963, -0.5129045248031616, -0.37914329767227173, -0.24538204073905945, -0.11162078380584717, 0.0221405029296875, 0.1559017300605774, 0.2896629571914673, 0.42342424392700195, 0.5571855306625366, 0.6909467577934265, 0.8247079849243164, 0.9584692716598511, 1.0922305583953857, 1.2259917259216309, 1.3597530126571655, 1.4935142993927002, 1.6272755861282349, 1.7610368728637695, 1.8947980403900146, 2.0285592079162598, 2.162320613861084, 2.296081781387329, 2.429842948913574, 2.5636043548583984, 2.6973655223846436, 2.8311269283294678, 2.964888095855713, 3.098649501800537, 3.2324106693267822, 3.3661718368530273, 3.4999332427978516, 3.6336944103240967]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 21.0, 21.0, 30.0, 33.0, 42.0, 58.0, 122.0, 145.0, 265.0, 388.0, 579.0, 988.0, 1563.0, 2900.0, 5627.0, 11268.0, 25556.0, 66094.0, 210112.0, 441694.0, 178331.0, 57838.0, 22922.0, 10078.0, 5081.0, 2707.0, 1510.0, 907.0, 568.0, 312.0, 238.0, 139.0, 98.0, 80.0, 56.0, 36.0, 39.0, 33.0, 14.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.548828125, -2.467742919921875, -2.38665771484375, -2.305572509765625, -2.2244873046875, -2.143402099609375, -2.06231689453125, -1.981231689453125, -1.900146484375, -1.819061279296875, -1.73797607421875, -1.656890869140625, -1.5758056640625, -1.494720458984375, -1.41363525390625, -1.332550048828125, -1.25146484375, -1.170379638671875, -1.08929443359375, -1.008209228515625, -0.9271240234375, -0.846038818359375, -0.76495361328125, -0.683868408203125, -0.602783203125, -0.521697998046875, -0.44061279296875, -0.359527587890625, -0.2784423828125, -0.197357177734375, -0.11627197265625, -0.035186767578125, 0.0458984375, 0.126983642578125, 0.20806884765625, 0.289154052734375, 0.3702392578125, 0.451324462890625, 0.53240966796875, 0.613494873046875, 0.694580078125, 0.775665283203125, 0.85675048828125, 0.937835693359375, 1.0189208984375, 1.100006103515625, 1.18109130859375, 1.262176513671875, 1.34326171875, 1.424346923828125, 1.50543212890625, 1.586517333984375, 1.6676025390625, 1.748687744140625, 1.82977294921875, 1.910858154296875, 1.991943359375, 2.073028564453125, 2.15411376953125, 2.235198974609375, 2.3162841796875, 2.397369384765625, 2.47845458984375, 2.559539794921875, 2.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 13.0, 11.0, 10.0, 28.0, 34.0, 40.0, 59.0, 79.0, 106.0, 130.0, 112.0, 87.0, 82.0, 51.0, 46.0, 33.0, 16.0, 17.0, 14.0, 8.0, 8.0, 7.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.93939208984375, -8.6834716796875, -8.42755126953125, -8.171630859375, -7.91571044921875, -7.6597900390625, -7.40386962890625, -7.14794921875, -6.89202880859375, -6.6361083984375, -6.38018798828125, -6.124267578125, -5.86834716796875, -5.6124267578125, -5.35650634765625, -5.1005859375, -4.84466552734375, -4.5887451171875, -4.33282470703125, -4.076904296875, -3.82098388671875, -3.5650634765625, -3.30914306640625, -3.05322265625, -2.79730224609375, -2.5413818359375, -2.28546142578125, -2.029541015625, -1.77362060546875, -1.5177001953125, -1.26177978515625, -1.005859375, -0.74993896484375, -0.4940185546875, -0.23809814453125, 0.017822265625, 0.27374267578125, 0.5296630859375, 0.78558349609375, 1.04150390625, 1.29742431640625, 1.5533447265625, 1.80926513671875, 2.065185546875, 2.32110595703125, 2.5770263671875, 2.83294677734375, 3.0888671875, 3.34478759765625, 3.6007080078125, 3.85662841796875, 4.112548828125, 4.36846923828125, 4.6243896484375, 4.88031005859375, 5.13623046875, 5.39215087890625, 5.6480712890625, 5.90399169921875, 6.159912109375, 6.41583251953125, 6.6717529296875, 6.92767333984375, 7.18359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 2.0, 6.0, 4.0, 7.0, 16.0, 7.0, 15.0, 16.0, 24.0, 17.0, 25.0, 38.0, 36.0, 32.0, 33.0, 66.0, 84.0, 160.0, 754.0, 9691.0, 903580.0, 130462.0, 2618.0, 359.0, 98.0, 76.0, 33.0, 31.0, 46.0, 24.0, 30.0, 34.0, 16.0, 25.0, 9.0, 11.0, 19.0, 4.0, 11.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.4765625, -14.0604248046875, -13.644287109375, -13.2281494140625, -12.81201171875, -12.3958740234375, -11.979736328125, -11.5635986328125, -11.1474609375, -10.7313232421875, -10.315185546875, -9.8990478515625, -9.48291015625, -9.0667724609375, -8.650634765625, -8.2344970703125, -7.818359375, -7.4022216796875, -6.986083984375, -6.5699462890625, -6.15380859375, -5.7376708984375, -5.321533203125, -4.9053955078125, -4.4892578125, -4.0731201171875, -3.656982421875, -3.2408447265625, -2.82470703125, -2.4085693359375, -1.992431640625, -1.5762939453125, -1.16015625, -0.7440185546875, -0.327880859375, 0.0882568359375, 0.50439453125, 0.9205322265625, 1.336669921875, 1.7528076171875, 2.1689453125, 2.5850830078125, 3.001220703125, 3.4173583984375, 3.83349609375, 4.2496337890625, 4.665771484375, 5.0819091796875, 5.498046875, 5.9141845703125, 6.330322265625, 6.7464599609375, 7.16259765625, 7.5787353515625, 7.994873046875, 8.4110107421875, 8.8271484375, 9.2432861328125, 9.659423828125, 10.0755615234375, 10.49169921875, 10.9078369140625, 11.323974609375, 11.7401123046875, 12.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 5.0, 3.0, 4.0, 10.0, 8.0, 7.0, 13.0, 14.0, 19.0, 18.0, 27.0, 20.0, 14.0, 43.0, 31.0, 34.0, 38.0, 48.0, 37.0, 35.0, 38.0, 31.0, 48.0, 33.0, 38.0, 31.0, 36.0, 41.0, 37.0, 25.0, 29.0, 29.0, 28.0, 17.0, 13.0, 19.0, 14.0, 15.0, 12.0, 8.0, 4.0, 8.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.32415771484375, -4.1834716796875, -4.04278564453125, -3.902099609375, -3.76141357421875, -3.6207275390625, -3.48004150390625, -3.33935546875, -3.19866943359375, -3.0579833984375, -2.91729736328125, -2.776611328125, -2.63592529296875, -2.4952392578125, -2.35455322265625, -2.2138671875, -2.07318115234375, -1.9324951171875, -1.79180908203125, -1.651123046875, -1.51043701171875, -1.3697509765625, -1.22906494140625, -1.08837890625, -0.94769287109375, -0.8070068359375, -0.66632080078125, -0.525634765625, -0.38494873046875, -0.2442626953125, -0.10357666015625, 0.037109375, 0.17779541015625, 0.3184814453125, 0.45916748046875, 0.599853515625, 0.74053955078125, 0.8812255859375, 1.02191162109375, 1.16259765625, 1.30328369140625, 1.4439697265625, 1.58465576171875, 1.725341796875, 1.86602783203125, 2.0067138671875, 2.14739990234375, 2.2880859375, 2.42877197265625, 2.5694580078125, 2.71014404296875, 2.850830078125, 2.99151611328125, 3.1322021484375, 3.27288818359375, 3.41357421875, 3.55426025390625, 3.6949462890625, 3.83563232421875, 3.976318359375, 4.11700439453125, 4.2576904296875, 4.39837646484375, 4.5390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 9.0, 9.0, 10.0, 11.0, 31.0, 35.0, 63.0, 82.0, 130.0, 194.0, 348.0, 630.0, 1248.0, 2883.0, 8048.0, 26874.0, 111628.0, 439180.0, 344895.0, 81006.0, 20042.0, 6313.0, 2399.0, 1046.0, 543.0, 337.0, 174.0, 112.0, 67.0, 47.0, 29.0, 31.0, 15.0, 15.0, 16.0, 15.0, 8.0, 6.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.033203125, -1.0044174194335938, -0.9756317138671875, -0.9468460083007812, -0.918060302734375, -0.8892745971679688, -0.8604888916015625, -0.8317031860351562, -0.80291748046875, -0.7741317749023438, -0.7453460693359375, -0.7165603637695312, -0.687774658203125, -0.6589889526367188, -0.6302032470703125, -0.6014175415039062, -0.5726318359375, -0.5438461303710938, -0.5150604248046875, -0.48627471923828125, -0.457489013671875, -0.42870330810546875, -0.3999176025390625, -0.37113189697265625, -0.34234619140625, -0.31356048583984375, -0.2847747802734375, -0.25598907470703125, -0.227203369140625, -0.19841766357421875, -0.1696319580078125, -0.14084625244140625, -0.112060546875, -0.08327484130859375, -0.0544891357421875, -0.02570343017578125, 0.003082275390625, 0.03186798095703125, 0.0606536865234375, 0.08943939208984375, 0.11822509765625, 0.14701080322265625, 0.1757965087890625, 0.20458221435546875, 0.233367919921875, 0.26215362548828125, 0.2909393310546875, 0.31972503662109375, 0.3485107421875, 0.37729644775390625, 0.4060821533203125, 0.43486785888671875, 0.463653564453125, 0.49243927001953125, 0.5212249755859375, 0.5500106811523438, 0.57879638671875, 0.6075820922851562, 0.6363677978515625, 0.6651535034179688, 0.693939208984375, 0.7227249145507812, 0.7515106201171875, 0.7802963256835938, 0.80908203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 15.0, 18.0, 26.0, 24.0, 18.0, 39.0, 21.0, 46.0, 48.0, 54.0, 52.0, 61.0, 58.0, 73.0, 63.0, 40.0, 52.0, 52.0, 41.0, 26.0, 29.0, 24.0, 16.0, 11.0, 15.0, 12.0, 14.0, 1.0, 5.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.00014317035675048828, -0.00013899803161621094, -0.0001348257064819336, -0.00013065338134765625, -0.0001264810562133789, -0.00012230873107910156, -0.00011813640594482422, -0.00011396408081054688, -0.00010979175567626953, -0.00010561943054199219, -0.00010144710540771484, -9.72747802734375e-05, -9.310245513916016e-05, -8.893013000488281e-05, -8.475780487060547e-05, -8.058547973632812e-05, -7.641315460205078e-05, -7.224082946777344e-05, -6.80685043334961e-05, -6.389617919921875e-05, -5.9723854064941406e-05, -5.555152893066406e-05, -5.137920379638672e-05, -4.7206878662109375e-05, -4.303455352783203e-05, -3.886222839355469e-05, -3.4689903259277344e-05, -3.0517578125e-05, -2.6345252990722656e-05, -2.2172927856445312e-05, -1.800060272216797e-05, -1.3828277587890625e-05, -9.655952453613281e-06, -5.4836273193359375e-06, -1.3113021850585938e-06, 2.86102294921875e-06, 7.033348083496094e-06, 1.1205673217773438e-05, 1.537799835205078e-05, 1.9550323486328125e-05, 2.372264862060547e-05, 2.7894973754882812e-05, 3.2067298889160156e-05, 3.62396240234375e-05, 4.0411949157714844e-05, 4.458427429199219e-05, 4.875659942626953e-05, 5.2928924560546875e-05, 5.710124969482422e-05, 6.127357482910156e-05, 6.54458999633789e-05, 6.961822509765625e-05, 7.37905502319336e-05, 7.796287536621094e-05, 8.213520050048828e-05, 8.630752563476562e-05, 9.047985076904297e-05, 9.465217590332031e-05, 9.882450103759766e-05, 0.000102996826171875, 0.00010716915130615234, 0.00011134147644042969, 0.00011551380157470703, 0.00011968612670898438]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 15.0, 16.0, 51.0, 56.0, 74.0, 106.0, 135.0, 225.0, 394.0, 713.0, 1331.0, 2862.0, 6634.0, 17497.0, 55064.0, 190215.0, 444170.0, 227452.0, 66559.0, 20812.0, 7534.0, 3185.0, 1445.0, 767.0, 436.0, 250.0, 152.0, 105.0, 73.0, 63.0, 28.0, 33.0, 20.0, 16.0, 14.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6909942626953125, -0.667633056640625, -0.6442718505859375, -0.62091064453125, -0.5975494384765625, -0.574188232421875, -0.5508270263671875, -0.5274658203125, -0.5041046142578125, -0.480743408203125, -0.4573822021484375, -0.43402099609375, -0.4106597900390625, -0.387298583984375, -0.3639373779296875, -0.340576171875, -0.3172149658203125, -0.293853759765625, -0.2704925537109375, -0.24713134765625, -0.2237701416015625, -0.200408935546875, -0.1770477294921875, -0.1536865234375, -0.1303253173828125, -0.106964111328125, -0.0836029052734375, -0.06024169921875, -0.0368804931640625, -0.013519287109375, 0.0098419189453125, 0.033203125, 0.0565643310546875, 0.079925537109375, 0.1032867431640625, 0.12664794921875, 0.1500091552734375, 0.173370361328125, 0.1967315673828125, 0.2200927734375, 0.2434539794921875, 0.266815185546875, 0.2901763916015625, 0.31353759765625, 0.3368988037109375, 0.360260009765625, 0.3836212158203125, 0.406982421875, 0.4303436279296875, 0.453704833984375, 0.4770660400390625, 0.50042724609375, 0.5237884521484375, 0.547149658203125, 0.5705108642578125, 0.5938720703125, 0.6172332763671875, 0.640594482421875, 0.6639556884765625, 0.68731689453125, 0.7106781005859375, 0.734039306640625, 0.7574005126953125, 0.78076171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 12.0, 8.0, 10.0, 11.0, 14.0, 24.0, 31.0, 19.0, 31.0, 36.0, 24.0, 27.0, 32.0, 52.0, 56.0, 56.0, 63.0, 46.0, 63.0, 36.0, 45.0, 34.0, 36.0, 38.0, 33.0, 25.0, 24.0, 19.0, 19.0, 17.0, 13.0, 11.0, 7.0, 10.0, 4.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.360107421875, -0.3492851257324219, -0.33846282958984375, -0.3276405334472656, -0.3168182373046875, -0.3059959411621094, -0.29517364501953125, -0.2843513488769531, -0.273529052734375, -0.2627067565917969, -0.25188446044921875, -0.24106216430664062, -0.2302398681640625, -0.21941757202148438, -0.20859527587890625, -0.19777297973632812, -0.18695068359375, -0.17612838745117188, -0.16530609130859375, -0.15448379516601562, -0.1436614990234375, -0.13283920288085938, -0.12201690673828125, -0.11119461059570312, -0.100372314453125, -0.08955001831054688, -0.07872772216796875, -0.06790542602539062, -0.0570831298828125, -0.046260833740234375, -0.03543853759765625, -0.024616241455078125, -0.0137939453125, -0.002971649169921875, 0.00785064697265625, 0.018672943115234375, 0.0294952392578125, 0.040317535400390625, 0.05113983154296875, 0.061962127685546875, 0.072784423828125, 0.08360671997070312, 0.09442901611328125, 0.10525131225585938, 0.1160736083984375, 0.12689590454101562, 0.13771820068359375, 0.14854049682617188, 0.15936279296875, 0.17018508911132812, 0.18100738525390625, 0.19182968139648438, 0.2026519775390625, 0.21347427368164062, 0.22429656982421875, 0.23511886596679688, 0.245941162109375, 0.2567634582519531, 0.26758575439453125, 0.2784080505371094, 0.2892303466796875, 0.3000526428222656, 0.31087493896484375, 0.3216972351074219, 0.33251953125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 8.0, 6.0, 13.0, 22.0, 38.0, 74.0, 125.0, 143.0, 167.0, 140.0, 83.0, 67.0, 37.0, 21.0, 15.0, 10.0, 0.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4451904296875, -9.169502258300781, -8.893815040588379, -8.618127822875977, -8.342439651489258, -8.066751480102539, -7.791064262390137, -7.515376567840576, -7.239688873291016, -6.964001178741455, -6.6883134841918945, -6.412625789642334, -6.136938095092773, -5.861250400543213, -5.585562705993652, -5.309875011444092, -5.034187316894531, -4.758499622344971, -4.48281192779541, -4.20712423324585, -3.931436538696289, -3.6557488441467285, -3.380061149597168, -3.1043734550476074, -2.828685760498047, -2.5529980659484863, -2.277310371398926, -2.0016226768493652, -1.7259349822998047, -1.4502472877502441, -1.1745595932006836, -0.898871898651123, -0.6231842041015625, -0.34749650955200195, -0.0718088150024414, 0.20387887954711914, 0.4795665740966797, 0.7552542686462402, 1.0309419631958008, 1.3066296577453613, 1.5823173522949219, 1.8580050468444824, 2.133692741394043, 2.4093804359436035, 2.685068130493164, 2.9607558250427246, 3.236443519592285, 3.5121312141418457, 3.7878189086914062, 4.063506603240967, 4.339194297790527, 4.614881992340088, 4.890569686889648, 5.166257381439209, 5.4419450759887695, 5.71763277053833, 5.993320465087891, 6.269008159637451, 6.544695854187012, 6.820383548736572, 7.096071243286133, 7.371758937835693, 7.647446632385254, 7.9231343269348145, 8.198822021484375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 9.0, 3.0, 6.0, 6.0, 11.0, 14.0, 18.0, 20.0, 18.0, 30.0, 31.0, 42.0, 39.0, 49.0, 60.0, 60.0, 41.0, 42.0, 65.0, 56.0, 62.0, 55.0, 35.0, 32.0, 27.0, 22.0, 29.0, 31.0, 17.0, 22.0, 6.0, 13.0, 6.0, 8.0, 3.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.960089683532715, -10.629469871520996, -10.298850059509277, -9.968230247497559, -9.63761043548584, -9.306990623474121, -8.976370811462402, -8.645751953125, -8.315132141113281, -7.9845123291015625, -7.653892517089844, -7.323272705078125, -6.992652893066406, -6.6620330810546875, -6.331413745880127, -6.000793933868408, -5.670173645019531, -5.3395538330078125, -5.008934020996094, -4.678314208984375, -4.347694396972656, -4.0170745849609375, -3.686455249786377, -3.355835437774658, -3.0252156257629395, -2.6945958137512207, -2.363976001739502, -2.0333564281463623, -1.7027366161346436, -1.3721168041229248, -1.0414971113204956, -0.7108774185180664, -0.38025665283203125, -0.049636900424957275, 0.2809828519821167, 0.6116026043891907, 0.9422223567962646, 1.2728421688079834, 1.6034618616104126, 1.9340815544128418, 2.2647013664245605, 2.5953211784362793, 2.925940990447998, 3.2565605640411377, 3.5871803760528564, 3.917800188064575, 4.248419761657715, 4.579039573669434, 4.909659385681152, 5.240279197692871, 5.57089900970459, 5.901518821716309, 6.232138633728027, 6.562758445739746, 6.893377780914307, 7.223997592926025, 7.554617404937744, 7.885237216949463, 8.215856552124023, 8.546476364135742, 8.877096176147461, 9.20771598815918, 9.538335800170898, 9.868955612182617, 10.199575424194336]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 11.0, 11.0, 13.0, 25.0, 35.0, 42.0, 88.0, 109.0, 169.0, 255.0, 397.0, 646.0, 1199.0, 2344.0, 5146.0, 12345.0, 36239.0, 152473.0, 2058517.0, 1728635.0, 139049.0, 33906.0, 11915.0, 5117.0, 2498.0, 1163.0, 696.0, 447.0, 276.0, 183.0, 107.0, 77.0, 39.0, 33.0, 24.0, 9.0, 14.0, 8.0, 7.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.320556640625, -3.21337890625, -3.106201171875, -2.9990234375, -2.891845703125, -2.78466796875, -2.677490234375, -2.5703125, -2.463134765625, -2.35595703125, -2.248779296875, -2.1416015625, -2.034423828125, -1.92724609375, -1.820068359375, -1.712890625, -1.605712890625, -1.49853515625, -1.391357421875, -1.2841796875, -1.177001953125, -1.06982421875, -0.962646484375, -0.85546875, -0.748291015625, -0.64111328125, -0.533935546875, -0.4267578125, -0.319580078125, -0.21240234375, -0.105224609375, 0.001953125, 0.109130859375, 0.21630859375, 0.323486328125, 0.4306640625, 0.537841796875, 0.64501953125, 0.752197265625, 0.859375, 0.966552734375, 1.07373046875, 1.180908203125, 1.2880859375, 1.395263671875, 1.50244140625, 1.609619140625, 1.716796875, 1.823974609375, 1.93115234375, 2.038330078125, 2.1455078125, 2.252685546875, 2.35986328125, 2.467041015625, 2.57421875, 2.681396484375, 2.78857421875, 2.895751953125, 3.0029296875, 3.110107421875, 3.21728515625, 3.324462890625, 3.431640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 7.0, 13.0, 17.0, 24.0, 37.0, 63.0, 78.0, 110.0, 110.0, 145.0, 114.0, 78.0, 63.0, 38.0, 35.0, 20.0, 16.0, 14.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.49609375, -6.326171875, -6.15625, -5.986328125, -5.81640625, -5.646484375, -5.4765625, -5.306640625, -5.13671875, -4.966796875, -4.796875, -4.626953125, -4.45703125, -4.287109375, -4.1171875, -3.947265625, -3.77734375, -3.607421875, -3.4375, -3.267578125, -3.09765625, -2.927734375, -2.7578125, -2.587890625, -2.41796875, -2.248046875, -2.078125, -1.908203125, -1.73828125, -1.568359375, -1.3984375, -1.228515625, -1.05859375, -0.888671875, -0.71875, -0.548828125, -0.37890625, -0.208984375, -0.0390625, 0.130859375, 0.30078125, 0.470703125, 0.640625, 0.810546875, 0.98046875, 1.150390625, 1.3203125, 1.490234375, 1.66015625, 1.830078125, 2.0, 2.169921875, 2.33984375, 2.509765625, 2.6796875, 2.849609375, 3.01953125, 3.189453125, 3.359375, 3.529296875, 3.69921875, 3.869140625, 4.0390625, 4.208984375, 4.37890625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 14.0, 18.0, 32.0, 58.0, 93.0, 152.0, 424.0, 3227.0, 502408.0, 3681468.0, 5352.0, 572.0, 194.0, 85.0, 58.0, 37.0, 20.0, 16.0, 13.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.078125, -14.576904296875, -14.07568359375, -13.574462890625, -13.0732421875, -12.572021484375, -12.07080078125, -11.569580078125, -11.068359375, -10.567138671875, -10.06591796875, -9.564697265625, -9.0634765625, -8.562255859375, -8.06103515625, -7.559814453125, -7.05859375, -6.557373046875, -6.05615234375, -5.554931640625, -5.0537109375, -4.552490234375, -4.05126953125, -3.550048828125, -3.048828125, -2.547607421875, -2.04638671875, -1.545166015625, -1.0439453125, -0.542724609375, -0.04150390625, 0.459716796875, 0.9609375, 1.462158203125, 1.96337890625, 2.464599609375, 2.9658203125, 3.467041015625, 3.96826171875, 4.469482421875, 4.970703125, 5.471923828125, 5.97314453125, 6.474365234375, 6.9755859375, 7.476806640625, 7.97802734375, 8.479248046875, 8.98046875, 9.481689453125, 9.98291015625, 10.484130859375, 10.9853515625, 11.486572265625, 11.98779296875, 12.489013671875, 12.990234375, 13.491455078125, 13.99267578125, 14.493896484375, 14.9951171875, 15.496337890625, 15.99755859375, 16.498779296875, 17.0]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 9.0, 14.0, 19.0, 29.0, 33.0, 38.0, 49.0, 90.0, 128.0, 172.0, 312.0, 589.0, 1110.0, 565.0, 313.0, 175.0, 106.0, 74.0, 56.0, 47.0, 37.0, 25.0, 21.0, 9.0, 10.0, 6.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.849609375, -0.8175048828125, -0.785400390625, -0.7532958984375, -0.72119140625, -0.6890869140625, -0.656982421875, -0.6248779296875, -0.5927734375, -0.5606689453125, -0.528564453125, -0.4964599609375, -0.46435546875, -0.4322509765625, -0.400146484375, -0.3680419921875, -0.3359375, -0.3038330078125, -0.271728515625, -0.2396240234375, -0.20751953125, -0.1754150390625, -0.143310546875, -0.1112060546875, -0.0791015625, -0.0469970703125, -0.014892578125, 0.0172119140625, 0.04931640625, 0.0814208984375, 0.113525390625, 0.1456298828125, 0.177734375, 0.2098388671875, 0.241943359375, 0.2740478515625, 0.30615234375, 0.3382568359375, 0.370361328125, 0.4024658203125, 0.4345703125, 0.4666748046875, 0.498779296875, 0.5308837890625, 0.56298828125, 0.5950927734375, 0.627197265625, 0.6593017578125, 0.69140625, 0.7235107421875, 0.755615234375, 0.7877197265625, 0.81982421875, 0.8519287109375, 0.884033203125, 0.9161376953125, 0.9482421875, 0.9803466796875, 1.012451171875, 1.0445556640625, 1.07666015625, 1.1087646484375, 1.140869140625, 1.1729736328125, 1.205078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 17.0, 23.0, 44.0, 78.0, 100.0, 166.0, 150.0, 112.0, 104.0, 56.0, 40.0, 24.0, 15.0, 10.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.421330451965332, -5.24224853515625, -5.063167095184326, -4.884085178375244, -4.70500373840332, -4.525921821594238, -4.346839904785156, -4.167757987976074, -3.9886765480041504, -3.8095948696136475, -3.6305131912231445, -3.4514312744140625, -3.2723495960235596, -3.0932679176330566, -2.9141860008239746, -2.7351043224334717, -2.5560226440429688, -2.376940965652466, -2.197859287261963, -2.018777370452881, -1.839695692062378, -1.660614013671875, -1.4815322160720825, -1.30245041847229, -1.123368740081787, -0.9442870020866394, -0.7652052640914917, -0.586123526096344, -0.4070417881011963, -0.22796005010604858, -0.04887831211090088, 0.1302034854888916, 0.30928564071655273, 0.48836737871170044, 0.6674491167068481, 0.8465308547019958, 1.0256125926971436, 1.2046942710876465, 1.383776068687439, 1.5628578662872314, 1.7419395446777344, 1.9210212230682373, 2.1001029014587402, 2.2791848182678223, 2.458266496658325, 2.637348175048828, 2.81643009185791, 2.995511770248413, 3.174593448638916, 3.353675127029419, 3.532756805419922, 3.711838722229004, 3.890920400619507, 4.07000207901001, 4.249083995819092, 4.428165435791016, 4.607247352600098, 4.78632926940918, 4.9654107093811035, 5.1444926261901855, 5.323574066162109, 5.502655982971191, 5.681737899780273, 5.8608198165893555, 6.039901256561279]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 12.0, 12.0, 27.0, 28.0, 39.0, 64.0, 65.0, 80.0, 75.0, 91.0, 84.0, 76.0, 78.0, 59.0, 54.0, 37.0, 18.0, 21.0, 15.0, 14.0, 13.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.287173748016357, -5.141117095947266, -4.995060443878174, -4.849003791809082, -4.702946662902832, -4.55689001083374, -4.410833358764648, -4.264776706695557, -4.118720054626465, -3.972663402557373, -3.8266067504882812, -3.6805498600006104, -3.5344932079315186, -3.3884365558624268, -3.242379665374756, -3.096323013305664, -2.9502663612365723, -2.8042097091674805, -2.6581530570983887, -2.5120961666107178, -2.366039514541626, -2.219982862472534, -2.0739259719848633, -1.9278693199157715, -1.7818126678466797, -1.635756015777588, -1.4896992444992065, -1.3436424732208252, -1.1975858211517334, -1.0515291690826416, -0.9054723978042603, -0.7594156265258789, -0.6133584976196289, -0.46730178594589233, -0.32124507427215576, -0.1751883625984192, -0.029131650924682617, 0.11692506074905396, 0.2629817724227905, 0.4090385437011719, 0.5550951957702637, 0.7011519074440002, 0.8472086191177368, 0.9932653307914734, 1.13932204246521, 1.2853786945343018, 1.431435465812683, 1.5774922370910645, 1.7235488891601562, 1.869605541229248, 2.01566219329834, 2.1617190837860107, 2.3077757358551025, 2.4538323879241943, 2.5998892784118652, 2.745945930480957, 2.892002582550049, 3.0380592346191406, 3.1841158866882324, 3.3301727771759033, 3.476229429244995, 3.622286081314087, 3.768342971801758, 3.9143996238708496, 4.060456275939941]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 23.0, 23.0, 56.0, 94.0, 191.0, 373.0, 1004.0, 3102.0, 17310.0, 329059.0, 662840.0, 28047.0, 4240.0, 1249.0, 453.0, 200.0, 116.0, 60.0, 23.0, 22.0, 20.0, 7.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.492919921875, -0.4759864807128906, -0.45905303955078125, -0.4421195983886719, -0.4251861572265625, -0.4082527160644531, -0.39131927490234375, -0.3743858337402344, -0.357452392578125, -0.3405189514160156, -0.32358551025390625, -0.3066520690917969, -0.2897186279296875, -0.2727851867675781, -0.25585174560546875, -0.23891830444335938, -0.22198486328125, -0.20505142211914062, -0.18811798095703125, -0.17118453979492188, -0.1542510986328125, -0.13731765747070312, -0.12038421630859375, -0.10345077514648438, -0.086517333984375, -0.06958389282226562, -0.05265045166015625, -0.035717010498046875, -0.0187835693359375, -0.001850128173828125, 0.01508331298828125, 0.032016754150390625, 0.0489501953125, 0.06588363647460938, 0.08281707763671875, 0.09975051879882812, 0.1166839599609375, 0.13361740112304688, 0.15055084228515625, 0.16748428344726562, 0.184417724609375, 0.20135116577148438, 0.21828460693359375, 0.23521804809570312, 0.2521514892578125, 0.2690849304199219, 0.28601837158203125, 0.3029518127441406, 0.31988525390625, 0.3368186950683594, 0.35375213623046875, 0.3706855773925781, 0.3876190185546875, 0.4045524597167969, 0.42148590087890625, 0.4384193420410156, 0.455352783203125, 0.4722862243652344, 0.48921966552734375, 0.5061531066894531, 0.5230865478515625, 0.5400199890136719, 0.5569534301757812, 0.5738868713378906, 0.5908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 9.0, 18.0, 26.0, 48.0, 56.0, 99.0, 94.0, 108.0, 127.0, 113.0, 65.0, 57.0, 44.0, 28.0, 25.0, 18.0, 9.0, 12.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.91351318359375, -3.7918701171875, -3.67022705078125, -3.548583984375, -3.42694091796875, -3.3052978515625, -3.18365478515625, -3.06201171875, -2.94036865234375, -2.8187255859375, -2.69708251953125, -2.575439453125, -2.45379638671875, -2.3321533203125, -2.21051025390625, -2.0888671875, -1.96722412109375, -1.8455810546875, -1.72393798828125, -1.602294921875, -1.48065185546875, -1.3590087890625, -1.23736572265625, -1.11572265625, -0.99407958984375, -0.8724365234375, -0.75079345703125, -0.629150390625, -0.50750732421875, -0.3858642578125, -0.26422119140625, -0.142578125, -0.02093505859375, 0.1007080078125, 0.22235107421875, 0.343994140625, 0.46563720703125, 0.5872802734375, 0.70892333984375, 0.83056640625, 0.95220947265625, 1.0738525390625, 1.19549560546875, 1.317138671875, 1.43878173828125, 1.5604248046875, 1.68206787109375, 1.8037109375, 1.92535400390625, 2.0469970703125, 2.16864013671875, 2.290283203125, 2.41192626953125, 2.5335693359375, 2.65521240234375, 2.77685546875, 2.89849853515625, 3.0201416015625, 3.14178466796875, 3.263427734375, 3.38507080078125, 3.5067138671875, 3.62835693359375, 3.75]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 8.0, 4.0, 4.0, 4.0, 6.0, 8.0, 10.0, 12.0, 14.0, 21.0, 26.0, 30.0, 41.0, 48.0, 65.0, 85.0, 119.0, 151.0, 256.0, 412.0, 821.0, 2903.0, 19390.0, 216499.0, 701208.0, 92551.0, 10062.0, 1908.0, 677.0, 372.0, 220.0, 140.0, 97.0, 75.0, 47.0, 50.0, 49.0, 29.0, 27.0, 26.0, 16.0, 14.0, 11.0, 7.0, 7.0, 9.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.3056640625, -0.2964935302734375, -0.287322998046875, -0.2781524658203125, -0.26898193359375, -0.2598114013671875, -0.250640869140625, -0.2414703369140625, -0.2322998046875, -0.2231292724609375, -0.213958740234375, -0.2047882080078125, -0.19561767578125, -0.1864471435546875, -0.177276611328125, -0.1681060791015625, -0.158935546875, -0.1497650146484375, -0.140594482421875, -0.1314239501953125, -0.12225341796875, -0.1130828857421875, -0.103912353515625, -0.0947418212890625, -0.0855712890625, -0.0764007568359375, -0.067230224609375, -0.0580596923828125, -0.04888916015625, -0.0397186279296875, -0.030548095703125, -0.0213775634765625, -0.01220703125, -0.0030364990234375, 0.006134033203125, 0.0153045654296875, 0.02447509765625, 0.0336456298828125, 0.042816162109375, 0.0519866943359375, 0.0611572265625, 0.0703277587890625, 0.079498291015625, 0.0886688232421875, 0.09783935546875, 0.1070098876953125, 0.116180419921875, 0.1253509521484375, 0.134521484375, 0.1436920166015625, 0.152862548828125, 0.1620330810546875, 0.17120361328125, 0.1803741455078125, 0.189544677734375, 0.1987152099609375, 0.2078857421875, 0.2170562744140625, 0.226226806640625, 0.2353973388671875, 0.24456787109375, 0.2537384033203125, 0.262908935546875, 0.2720794677734375, 0.28125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 8.0, 15.0, 13.0, 9.0, 13.0, 19.0, 23.0, 33.0, 35.0, 22.0, 42.0, 33.0, 47.0, 55.0, 46.0, 47.0, 49.0, 32.0, 39.0, 41.0, 53.0, 29.0, 38.0, 33.0, 32.0, 31.0, 24.0, 23.0, 15.0, 15.0, 17.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.228515625, -3.118865966796875, -3.00921630859375, -2.899566650390625, -2.7899169921875, -2.680267333984375, -2.57061767578125, -2.460968017578125, -2.351318359375, -2.241668701171875, -2.13201904296875, -2.022369384765625, -1.9127197265625, -1.803070068359375, -1.69342041015625, -1.583770751953125, -1.47412109375, -1.364471435546875, -1.25482177734375, -1.145172119140625, -1.0355224609375, -0.925872802734375, -0.81622314453125, -0.706573486328125, -0.596923828125, -0.487274169921875, -0.37762451171875, -0.267974853515625, -0.1583251953125, -0.048675537109375, 0.06097412109375, 0.170623779296875, 0.2802734375, 0.389923095703125, 0.49957275390625, 0.609222412109375, 0.7188720703125, 0.828521728515625, 0.93817138671875, 1.047821044921875, 1.157470703125, 1.267120361328125, 1.37677001953125, 1.486419677734375, 1.5960693359375, 1.705718994140625, 1.81536865234375, 1.925018310546875, 2.03466796875, 2.144317626953125, 2.25396728515625, 2.363616943359375, 2.4732666015625, 2.582916259765625, 2.69256591796875, 2.802215576171875, 2.911865234375, 3.021514892578125, 3.13116455078125, 3.240814208984375, 3.3504638671875, 3.460113525390625, 3.56976318359375, 3.679412841796875, 3.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 26.0, 27.0, 65.0, 109.0, 271.0, 1052.0, 102597.0, 942429.0, 1327.0, 339.0, 119.0, 71.0, 34.0, 17.0, 15.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43359375, -0.4204826354980469, -0.40737152099609375, -0.3942604064941406, -0.3811492919921875, -0.3680381774902344, -0.35492706298828125, -0.3418159484863281, -0.328704833984375, -0.3155937194824219, -0.30248260498046875, -0.2893714904785156, -0.2762603759765625, -0.2631492614746094, -0.25003814697265625, -0.23692703247070312, -0.22381591796875, -0.21070480346679688, -0.19759368896484375, -0.18448257446289062, -0.1713714599609375, -0.15826034545898438, -0.14514923095703125, -0.13203811645507812, -0.118927001953125, -0.10581588745117188, -0.09270477294921875, -0.07959365844726562, -0.0664825439453125, -0.053371429443359375, -0.04026031494140625, -0.027149200439453125, -0.0140380859375, -0.000926971435546875, 0.01218414306640625, 0.025295257568359375, 0.0384063720703125, 0.051517486572265625, 0.06462860107421875, 0.07773971557617188, 0.090850830078125, 0.10396194458007812, 0.11707305908203125, 0.13018417358398438, 0.1432952880859375, 0.15640640258789062, 0.16951751708984375, 0.18262863159179688, 0.19573974609375, 0.20885086059570312, 0.22196197509765625, 0.23507308959960938, 0.2481842041015625, 0.2612953186035156, 0.27440643310546875, 0.2875175476074219, 0.300628662109375, 0.3137397766113281, 0.32685089111328125, 0.3399620056152344, 0.3530731201171875, 0.3661842346191406, 0.37929534912109375, 0.3924064636230469, 0.405517578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 15.0, 20.0, 34.0, 64.0, 116.0, 173.0, 189.0, 141.0, 80.0, 44.0, 24.0, 24.0, 15.0, 17.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.854534149169922e-05, -6.659794598817825e-05, -6.465055048465729e-05, -6.270315498113632e-05, -6.0755759477615356e-05, -5.880836397409439e-05, -5.6860968470573425e-05, -5.491357296705246e-05, -5.2966177463531494e-05, -5.101878196001053e-05, -4.907138645648956e-05, -4.71239909529686e-05, -4.517659544944763e-05, -4.3229199945926666e-05, -4.12818044424057e-05, -3.9334408938884735e-05, -3.738701343536377e-05, -3.5439617931842804e-05, -3.349222242832184e-05, -3.154482692480087e-05, -2.9597431421279907e-05, -2.765003591775894e-05, -2.5702640414237976e-05, -2.375524491071701e-05, -2.1807849407196045e-05, -1.986045390367508e-05, -1.7913058400154114e-05, -1.5965662896633148e-05, -1.4018267393112183e-05, -1.2070871889591217e-05, -1.0123476386070251e-05, -8.176080882549286e-06, -6.22868537902832e-06, -4.281289875507355e-06, -2.333894371986389e-06, -3.864988684654236e-07, 1.560896635055542e-06, 3.5082921385765076e-06, 5.455687642097473e-06, 7.403083145618439e-06, 9.350478649139404e-06, 1.129787415266037e-05, 1.3245269656181335e-05, 1.5192665159702301e-05, 1.7140060663223267e-05, 1.9087456166744232e-05, 2.1034851670265198e-05, 2.2982247173786163e-05, 2.492964267730713e-05, 2.6877038180828094e-05, 2.882443368434906e-05, 3.0771829187870026e-05, 3.271922469139099e-05, 3.466662019491196e-05, 3.661401569843292e-05, 3.856141120195389e-05, 4.0508806705474854e-05, 4.245620220899582e-05, 4.4403597712516785e-05, 4.635099321603775e-05, 4.8298388719558716e-05, 5.024578422307968e-05, 5.219317972660065e-05, 5.414057523012161e-05, 5.608797073364258e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 12.0, 11.0, 13.0, 15.0, 39.0, 84.0, 218.0, 619.0, 2915.0, 74654.0, 962355.0, 6172.0, 916.0, 280.0, 112.0, 58.0, 27.0, 21.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41943359375, -0.4078407287597656, -0.39624786376953125, -0.3846549987792969, -0.3730621337890625, -0.3614692687988281, -0.34987640380859375, -0.3382835388183594, -0.326690673828125, -0.3150978088378906, -0.30350494384765625, -0.2919120788574219, -0.2803192138671875, -0.2687263488769531, -0.25713348388671875, -0.24554061889648438, -0.23394775390625, -0.22235488891601562, -0.21076202392578125, -0.19916915893554688, -0.1875762939453125, -0.17598342895507812, -0.16439056396484375, -0.15279769897460938, -0.141204833984375, -0.12961196899414062, -0.11801910400390625, -0.10642623901367188, -0.0948333740234375, -0.08324050903320312, -0.07164764404296875, -0.060054779052734375, -0.0484619140625, -0.036869049072265625, -0.02527618408203125, -0.013683319091796875, -0.0020904541015625, 0.009502410888671875, 0.02109527587890625, 0.032688140869140625, 0.044281005859375, 0.055873870849609375, 0.06746673583984375, 0.07905960083007812, 0.0906524658203125, 0.10224533081054688, 0.11383819580078125, 0.12543106079101562, 0.13702392578125, 0.14861679077148438, 0.16020965576171875, 0.17180252075195312, 0.1833953857421875, 0.19498825073242188, 0.20658111572265625, 0.21817398071289062, 0.229766845703125, 0.24135971069335938, 0.25295257568359375, 0.2645454406738281, 0.2761383056640625, 0.2877311706542969, 0.29932403564453125, 0.3109169006347656, 0.322509765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 0.0, 4.0, 6.0, 12.0, 12.0, 18.0, 25.0, 33.0, 132.0, 415.0, 181.0, 71.0, 33.0, 13.0, 15.0, 7.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054351806640625, -0.0525212287902832, -0.050690650939941406, -0.04886007308959961, -0.04702949523925781, -0.045198917388916016, -0.04336833953857422, -0.04153776168823242, -0.039707183837890625, -0.03787660598754883, -0.03604602813720703, -0.034215450286865234, -0.03238487243652344, -0.03055429458618164, -0.028723716735839844, -0.026893138885498047, -0.02506256103515625, -0.023231983184814453, -0.021401405334472656, -0.01957082748413086, -0.017740249633789062, -0.015909671783447266, -0.014079093933105469, -0.012248516082763672, -0.010417938232421875, -0.008587360382080078, -0.006756782531738281, -0.004926204681396484, -0.0030956268310546875, -0.0012650489807128906, 0.0005655288696289062, 0.002396106719970703, 0.0042266845703125, 0.006057262420654297, 0.007887840270996094, 0.00971841812133789, 0.011548995971679688, 0.013379573822021484, 0.015210151672363281, 0.017040729522705078, 0.018871307373046875, 0.020701885223388672, 0.02253246307373047, 0.024363040924072266, 0.026193618774414062, 0.02802419662475586, 0.029854774475097656, 0.03168535232543945, 0.03351593017578125, 0.03534650802612305, 0.037177085876464844, 0.03900766372680664, 0.04083824157714844, 0.042668819427490234, 0.04449939727783203, 0.04632997512817383, 0.048160552978515625, 0.04999113082885742, 0.05182170867919922, 0.053652286529541016, 0.05548286437988281, 0.05731344223022461, 0.059144020080566406, 0.0609745979309082, 0.06280517578125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 6.0, 8.0, 9.0, 21.0, 41.0, 71.0, 126.0, 203.0, 176.0, 141.0, 78.0, 38.0, 21.0, 14.0, 13.0, 5.0, 7.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.707956790924072, -4.5609540939331055, -4.4139509201049805, -4.2669477462768555, -4.119945049285889, -3.9729421138763428, -3.825939178466797, -3.678936243057251, -3.531933307647705, -3.384930372238159, -3.2379274368286133, -3.0909245014190674, -2.9439215660095215, -2.7969186305999756, -2.6499156951904297, -2.502912759780884, -2.355909824371338, -2.208906888961792, -2.061903953552246, -1.9149010181427002, -1.7678980827331543, -1.6208951473236084, -1.4738922119140625, -1.3268892765045166, -1.1798863410949707, -1.0328834056854248, -0.8858804702758789, -0.738877534866333, -0.5918745994567871, -0.4448716640472412, -0.2978687286376953, -0.15086579322814941, -0.0038628578186035156, 0.14314007759094238, 0.2901430130004883, 0.4371459484100342, 0.5841488838195801, 0.731151819229126, 0.8781547546386719, 1.0251576900482178, 1.1721606254577637, 1.3191635608673096, 1.4661664962768555, 1.6131694316864014, 1.7601723670959473, 1.9071753025054932, 2.054178237915039, 2.201181173324585, 2.348184108734131, 2.4951870441436768, 2.6421899795532227, 2.7891929149627686, 2.9361958503723145, 3.0831987857818604, 3.2302017211914062, 3.377204656600952, 3.524207592010498, 3.671210527420044, 3.81821346282959, 3.9652163982391357, 4.112219333648682, 4.259222030639648, 4.406225204467773, 4.553228378295898, 4.700231075286865]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 18.0, 26.0, 37.0, 50.0, 64.0, 96.0, 92.0, 116.0, 105.0, 97.0, 78.0, 59.0, 33.0, 26.0, 20.0, 15.0, 8.0, 13.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.16665506362915, -4.053471088409424, -3.940286636352539, -3.8271026611328125, -3.713918447494507, -3.600734233856201, -3.4875502586364746, -3.374366044998169, -3.2611818313598633, -3.1479976177215576, -3.034813404083252, -2.9216294288635254, -2.8084452152252197, -2.695261001586914, -2.5820770263671875, -2.468892812728882, -2.355708599090576, -2.2425243854522705, -2.129340171813965, -2.0161561965942383, -1.9029719829559326, -1.789787769317627, -1.6766036748886108, -1.5634195804595947, -1.450235366821289, -1.3370511531829834, -1.2238670587539673, -1.1106829643249512, -0.9974987506866455, -0.8843145966529846, -0.7711304426193237, -0.6579462885856628, -0.544762134552002, -0.43157798051834106, -0.3183938264846802, -0.2052096724510193, -0.0920255184173584, 0.02115863561630249, 0.13434278964996338, 0.24752694368362427, 0.36071109771728516, 0.47389525175094604, 0.5870794057846069, 0.7002635598182678, 0.8134477138519287, 0.9266318678855896, 1.0398160219192505, 1.1530001163482666, 1.2661843299865723, 1.379368543624878, 1.492552638053894, 1.6057367324829102, 1.7189209461212158, 1.8321051597595215, 1.9452892541885376, 2.0584733486175537, 2.1716575622558594, 2.284841775894165, 2.3980259895324707, 2.5112099647521973, 2.624394178390503, 2.7375783920288086, 2.850762367248535, 2.963946580886841, 3.0771307945251465]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 9.0, 14.0, 18.0, 32.0, 42.0, 58.0, 130.0, 206.0, 699.0, 2366.0, 9859.0, 58700.0, 534805.0, 388478.0, 42334.0, 7747.0, 1945.0, 569.0, 243.0, 104.0, 50.0, 44.0, 15.0, 13.0, 13.0, 18.0, 11.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.34375, -5.206451416015625, -5.06915283203125, -4.931854248046875, -4.7945556640625, -4.657257080078125, -4.51995849609375, -4.382659912109375, -4.245361328125, -4.108062744140625, -3.97076416015625, -3.833465576171875, -3.6961669921875, -3.558868408203125, -3.42156982421875, -3.284271240234375, -3.14697265625, -3.009674072265625, -2.87237548828125, -2.735076904296875, -2.5977783203125, -2.460479736328125, -2.32318115234375, -2.185882568359375, -2.048583984375, -1.911285400390625, -1.77398681640625, -1.636688232421875, -1.4993896484375, -1.362091064453125, -1.22479248046875, -1.087493896484375, -0.9501953125, -0.812896728515625, -0.67559814453125, -0.538299560546875, -0.4010009765625, -0.263702392578125, -0.12640380859375, 0.010894775390625, 0.148193359375, 0.285491943359375, 0.42279052734375, 0.560089111328125, 0.6973876953125, 0.834686279296875, 0.97198486328125, 1.109283447265625, 1.24658203125, 1.383880615234375, 1.52117919921875, 1.658477783203125, 1.7957763671875, 1.933074951171875, 2.07037353515625, 2.207672119140625, 2.344970703125, 2.482269287109375, 2.61956787109375, 2.756866455078125, 2.8941650390625, 3.031463623046875, 3.16876220703125, 3.306060791015625, 3.443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 8.0, 14.0, 29.0, 42.0, 75.0, 133.0, 175.0, 185.0, 134.0, 83.0, 43.0, 29.0, 19.0, 8.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-20.234375, -19.82220458984375, -19.4100341796875, -18.99786376953125, -18.585693359375, -18.17352294921875, -17.7613525390625, -17.34918212890625, -16.93701171875, -16.52484130859375, -16.1126708984375, -15.70050048828125, -15.288330078125, -14.87615966796875, -14.4639892578125, -14.05181884765625, -13.6396484375, -13.22747802734375, -12.8153076171875, -12.40313720703125, -11.990966796875, -11.57879638671875, -11.1666259765625, -10.75445556640625, -10.34228515625, -9.93011474609375, -9.5179443359375, -9.10577392578125, -8.693603515625, -8.28143310546875, -7.8692626953125, -7.45709228515625, -7.044921875, -6.63275146484375, -6.2205810546875, -5.80841064453125, -5.396240234375, -4.98406982421875, -4.5718994140625, -4.15972900390625, -3.74755859375, -3.33538818359375, -2.9232177734375, -2.51104736328125, -2.098876953125, -1.68670654296875, -1.2745361328125, -0.86236572265625, -0.4501953125, -0.03802490234375, 0.3741455078125, 0.78631591796875, 1.198486328125, 1.61065673828125, 2.0228271484375, 2.43499755859375, 2.84716796875, 3.25933837890625, 3.6715087890625, 4.08367919921875, 4.495849609375, 4.90802001953125, 5.3201904296875, 5.73236083984375, 6.14453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 11.0, 22.0, 16.0, 23.0, 24.0, 29.0, 39.0, 61.0, 61.0, 81.0, 103.0, 140.0, 336.0, 1275.0, 13816.0, 736234.0, 287578.0, 6944.0, 847.0, 286.0, 133.0, 95.0, 74.0, 62.0, 58.0, 49.0, 27.0, 23.0, 19.0, 20.0, 14.0, 14.0, 9.0, 8.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.92999267578125, -7.6959228515625, -7.46185302734375, -7.227783203125, -6.99371337890625, -6.7596435546875, -6.52557373046875, -6.29150390625, -6.05743408203125, -5.8233642578125, -5.58929443359375, -5.355224609375, -5.12115478515625, -4.8870849609375, -4.65301513671875, -4.4189453125, -4.18487548828125, -3.9508056640625, -3.71673583984375, -3.482666015625, -3.24859619140625, -3.0145263671875, -2.78045654296875, -2.54638671875, -2.31231689453125, -2.0782470703125, -1.84417724609375, -1.610107421875, -1.37603759765625, -1.1419677734375, -0.90789794921875, -0.673828125, -0.43975830078125, -0.2056884765625, 0.02838134765625, 0.262451171875, 0.49652099609375, 0.7305908203125, 0.96466064453125, 1.19873046875, 1.43280029296875, 1.6668701171875, 1.90093994140625, 2.135009765625, 2.36907958984375, 2.6031494140625, 2.83721923828125, 3.0712890625, 3.30535888671875, 3.5394287109375, 3.77349853515625, 4.007568359375, 4.24163818359375, 4.4757080078125, 4.70977783203125, 4.94384765625, 5.17791748046875, 5.4119873046875, 5.64605712890625, 5.880126953125, 6.11419677734375, 6.3482666015625, 6.58233642578125, 6.81640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 5.0, 11.0, 11.0, 9.0, 19.0, 24.0, 25.0, 32.0, 31.0, 36.0, 31.0, 30.0, 46.0, 54.0, 58.0, 47.0, 50.0, 57.0, 40.0, 56.0, 38.0, 33.0, 37.0, 32.0, 33.0, 34.0, 23.0, 6.0, 16.0, 15.0, 11.0, 16.0, 7.0, 8.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9610595703125, -5.781494140625, -5.6019287109375, -5.42236328125, -5.2427978515625, -5.063232421875, -4.8836669921875, -4.7041015625, -4.5245361328125, -4.344970703125, -4.1654052734375, -3.98583984375, -3.8062744140625, -3.626708984375, -3.4471435546875, -3.267578125, -3.0880126953125, -2.908447265625, -2.7288818359375, -2.54931640625, -2.3697509765625, -2.190185546875, -2.0106201171875, -1.8310546875, -1.6514892578125, -1.471923828125, -1.2923583984375, -1.11279296875, -0.9332275390625, -0.753662109375, -0.5740966796875, -0.39453125, -0.2149658203125, -0.035400390625, 0.1441650390625, 0.32373046875, 0.5032958984375, 0.682861328125, 0.8624267578125, 1.0419921875, 1.2215576171875, 1.401123046875, 1.5806884765625, 1.76025390625, 1.9398193359375, 2.119384765625, 2.2989501953125, 2.478515625, 2.6580810546875, 2.837646484375, 3.0172119140625, 3.19677734375, 3.3763427734375, 3.555908203125, 3.7354736328125, 3.9150390625, 4.0946044921875, 4.274169921875, 4.4537353515625, 4.63330078125, 4.8128662109375, 4.992431640625, 5.1719970703125, 5.3515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 8.0, 20.0, 23.0, 28.0, 46.0, 71.0, 99.0, 130.0, 223.0, 351.0, 546.0, 958.0, 1801.0, 3995.0, 9184.0, 25557.0, 89091.0, 349610.0, 406424.0, 110080.0, 30522.0, 10558.0, 4304.0, 2131.0, 1125.0, 584.0, 362.0, 233.0, 155.0, 84.0, 62.0, 45.0, 35.0, 19.0, 21.0, 14.0, 12.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62158203125, -0.6002044677734375, -0.578826904296875, -0.5574493408203125, -0.53607177734375, -0.5146942138671875, -0.493316650390625, -0.4719390869140625, -0.4505615234375, -0.4291839599609375, -0.407806396484375, -0.3864288330078125, -0.36505126953125, -0.3436737060546875, -0.322296142578125, -0.3009185791015625, -0.279541015625, -0.2581634521484375, -0.236785888671875, -0.2154083251953125, -0.19403076171875, -0.1726531982421875, -0.151275634765625, -0.1298980712890625, -0.1085205078125, -0.0871429443359375, -0.065765380859375, -0.0443878173828125, -0.02301025390625, -0.0016326904296875, 0.019744873046875, 0.0411224365234375, 0.0625, 0.0838775634765625, 0.105255126953125, 0.1266326904296875, 0.14801025390625, 0.1693878173828125, 0.190765380859375, 0.2121429443359375, 0.2335205078125, 0.2548980712890625, 0.276275634765625, 0.2976531982421875, 0.31903076171875, 0.3404083251953125, 0.361785888671875, 0.3831634521484375, 0.404541015625, 0.4259185791015625, 0.447296142578125, 0.4686737060546875, 0.49005126953125, 0.5114288330078125, 0.532806396484375, 0.5541839599609375, 0.5755615234375, 0.5969390869140625, 0.618316650390625, 0.6396942138671875, 0.66107177734375, 0.6824493408203125, 0.703826904296875, 0.7252044677734375, 0.74658203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 15.0, 13.0, 16.0, 13.0, 22.0, 16.0, 20.0, 27.0, 29.0, 59.0, 63.0, 59.0, 67.0, 83.0, 70.0, 70.0, 69.0, 51.0, 45.0, 44.0, 30.0, 27.0, 12.0, 19.0, 12.0, 10.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.0001506805419921875, -0.0001467997208237648, -0.0001429188996553421, -0.0001390380784869194, -0.0001351572573184967, -0.000131276436150074, -0.0001273956149816513, -0.0001235147938132286, -0.00011963397264480591, -0.00011575315147638321, -0.00011187233030796051, -0.00010799150913953781, -0.00010411068797111511, -0.00010022986680269241, -9.634904563426971e-05, -9.246822446584702e-05, -8.858740329742432e-05, -8.470658212900162e-05, -8.082576096057892e-05, -7.694493979215622e-05, -7.306411862373352e-05, -6.918329745531082e-05, -6.530247628688812e-05, -6.142165511846542e-05, -5.7540833950042725e-05, -5.3660012781620026e-05, -4.977919161319733e-05, -4.589837044477463e-05, -4.201754927635193e-05, -3.813672810792923e-05, -3.425590693950653e-05, -3.0375085771083832e-05, -2.6494264602661133e-05, -2.2613443434238434e-05, -1.8732622265815735e-05, -1.4851801097393036e-05, -1.0970979928970337e-05, -7.090158760547638e-06, -3.209337592124939e-06, 6.7148357629776e-07, 4.552304744720459e-06, 8.433125913143158e-06, 1.2313947081565857e-05, 1.6194768249988556e-05, 2.0075589418411255e-05, 2.3956410586833954e-05, 2.7837231755256653e-05, 3.171805292367935e-05, 3.559887409210205e-05, 3.947969526052475e-05, 4.336051642894745e-05, 4.724133759737015e-05, 5.112215876579285e-05, 5.5002979934215546e-05, 5.8883801102638245e-05, 6.276462227106094e-05, 6.664544343948364e-05, 7.052626460790634e-05, 7.440708577632904e-05, 7.828790694475174e-05, 8.216872811317444e-05, 8.604954928159714e-05, 8.993037045001984e-05, 9.381119161844254e-05, 9.769201278686523e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 14.0, 19.0, 29.0, 60.0, 93.0, 133.0, 231.0, 411.0, 888.0, 2141.0, 5887.0, 21092.0, 125070.0, 649186.0, 200632.0, 30300.0, 7507.0, 2590.0, 1078.0, 522.0, 300.0, 143.0, 76.0, 46.0, 35.0, 20.0, 13.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.912017822265625, -0.87774658203125, -0.843475341796875, -0.8092041015625, -0.774932861328125, -0.74066162109375, -0.706390380859375, -0.672119140625, -0.637847900390625, -0.60357666015625, -0.569305419921875, -0.5350341796875, -0.500762939453125, -0.46649169921875, -0.432220458984375, -0.39794921875, -0.363677978515625, -0.32940673828125, -0.295135498046875, -0.2608642578125, -0.226593017578125, -0.19232177734375, -0.158050537109375, -0.123779296875, -0.089508056640625, -0.05523681640625, -0.020965576171875, 0.0133056640625, 0.047576904296875, 0.08184814453125, 0.116119384765625, 0.150390625, 0.184661865234375, 0.21893310546875, 0.253204345703125, 0.2874755859375, 0.321746826171875, 0.35601806640625, 0.390289306640625, 0.424560546875, 0.458831787109375, 0.49310302734375, 0.527374267578125, 0.5616455078125, 0.595916748046875, 0.63018798828125, 0.664459228515625, 0.69873046875, 0.733001708984375, 0.76727294921875, 0.801544189453125, 0.8358154296875, 0.870086669921875, 0.90435791015625, 0.938629150390625, 0.972900390625, 1.007171630859375, 1.04144287109375, 1.075714111328125, 1.1099853515625, 1.144256591796875, 1.17852783203125, 1.212799072265625, 1.2470703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 3.0, 9.0, 8.0, 14.0, 22.0, 20.0, 28.0, 32.0, 31.0, 63.0, 80.0, 80.0, 84.0, 70.0, 74.0, 77.0, 51.0, 62.0, 29.0, 41.0, 24.0, 21.0, 19.0, 13.0, 8.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.505859375, -0.4915199279785156, -0.47718048095703125, -0.4628410339355469, -0.4485015869140625, -0.4341621398925781, -0.41982269287109375, -0.4054832458496094, -0.391143798828125, -0.3768043518066406, -0.36246490478515625, -0.3481254577636719, -0.3337860107421875, -0.3194465637207031, -0.30510711669921875, -0.2907676696777344, -0.27642822265625, -0.2620887756347656, -0.24774932861328125, -0.23340988159179688, -0.2190704345703125, -0.20473098754882812, -0.19039154052734375, -0.17605209350585938, -0.161712646484375, -0.14737319946289062, -0.13303375244140625, -0.11869430541992188, -0.1043548583984375, -0.09001541137695312, -0.07567596435546875, -0.061336517333984375, -0.0469970703125, -0.032657623291015625, -0.01831817626953125, -0.003978729248046875, 0.0103607177734375, 0.024700164794921875, 0.03903961181640625, 0.053379058837890625, 0.067718505859375, 0.08205795288085938, 0.09639739990234375, 0.11073684692382812, 0.1250762939453125, 0.13941574096679688, 0.15375518798828125, 0.16809463500976562, 0.18243408203125, 0.19677352905273438, 0.21111297607421875, 0.22545242309570312, 0.2397918701171875, 0.2541313171386719, 0.26847076416015625, 0.2828102111816406, 0.297149658203125, 0.3114891052246094, 0.32582855224609375, 0.3401679992675781, 0.3545074462890625, 0.3688468933105469, 0.38318634033203125, 0.3975257873535156, 0.411865234375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 6.0, 21.0, 63.0, 197.0, 344.0, 212.0, 82.0, 35.0, 17.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.076003074645996, -7.522428512573242, -6.96885347366333, -6.415278911590576, -5.861703872680664, -5.30812931060791, -4.754554748535156, -4.200980186462402, -3.6474051475524902, -3.0938303470611572, -2.540255546569824, -1.9866809844970703, -1.4331061840057373, -0.8795313835144043, -0.3259568214416504, 0.22761797904968262, 0.7811927795410156, 1.3347675800323486, 1.888342261314392, 2.4419169425964355, 2.9954917430877686, 3.5490665435791016, 4.1026411056518555, 4.656215667724609, 5.2097907066345215, 5.763365268707275, 6.3169403076171875, 6.870514869689941, 7.424089431762695, 7.977664470672607, 8.531238555908203, 9.084814071655273, 9.638389587402344, 10.191964149475098, 10.745538711547852, 11.299114227294922, 11.852688789367676, 12.40626335144043, 12.959837913513184, 13.513412475585938, 14.066987991333008, 14.620562553405762, 15.174137115478516, 15.727712631225586, 16.281286239624023, 16.834861755371094, 17.38843536376953, 17.9420108795166, 18.495586395263672, 19.049161911010742, 19.60273551940918, 20.15631103515625, 20.709884643554688, 21.263460159301758, 21.817035675048828, 22.370609283447266, 22.924182891845703, 23.477758407592773, 24.03133201599121, 24.58490753173828, 25.13848114013672, 25.69205665588379, 26.24563217163086, 26.799205780029297, 27.352781295776367]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 14.0, 15.0, 9.0, 28.0, 35.0, 36.0, 45.0, 57.0, 57.0, 74.0, 54.0, 71.0, 66.0, 71.0, 73.0, 58.0, 50.0, 39.0, 32.0, 24.0, 28.0, 17.0, 14.0, 12.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.78019905090332, -17.322389602661133, -16.864580154418945, -16.406770706176758, -15.948962211608887, -15.4911527633667, -15.033343315124512, -14.575533866882324, -14.117724418640137, -13.65991497039795, -13.202105522155762, -12.74429702758789, -12.286487579345703, -11.828678131103516, -11.370868682861328, -10.91305923461914, -10.455249786376953, -9.997440338134766, -9.539630889892578, -9.08182144165039, -8.62401294708252, -8.166203498840332, -7.7083940505981445, -7.250584602355957, -6.792776107788086, -6.334966659545898, -5.877157688140869, -5.419348239898682, -4.961538791656494, -4.503729820251465, -4.045920372009277, -3.58811092376709, -3.1303014755249023, -2.672492265701294, -2.2146828174591064, -1.756873607635498, -1.2990642786026, -0.8412549495697021, -0.38344573974609375, 0.07436370849609375, 0.5321729183197021, 0.9899822473526001, 1.447791576385498, 1.9056007862091064, 2.363409996032715, 2.8212194442749023, 3.2790286540985107, 3.7368381023406982, 4.194647312164307, 4.652456760406494, 5.110265731811523, 5.568075180053711, 6.025884628295898, 6.483694076538086, 6.941503047943115, 7.399312496185303, 7.857121467590332, 8.31493091583252, 8.772740364074707, 9.230548858642578, 9.688358306884766, 10.146167755126953, 10.60397720336914, 11.061786651611328, 11.519596099853516]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 11.0, 6.0, 20.0, 12.0, 25.0, 35.0, 52.0, 68.0, 126.0, 183.0, 345.0, 638.0, 1642.0, 4855.0, 20155.0, 161195.0, 3690687.0, 277232.0, 27255.0, 5952.0, 2039.0, 764.0, 351.0, 201.0, 113.0, 90.0, 55.0, 41.0, 29.0, 24.0, 14.0, 17.0, 14.0, 9.0, 5.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.23828125, -5.08233642578125, -4.9263916015625, -4.77044677734375, -4.614501953125, -4.45855712890625, -4.3026123046875, -4.14666748046875, -3.99072265625, -3.83477783203125, -3.6788330078125, -3.52288818359375, -3.366943359375, -3.21099853515625, -3.0550537109375, -2.89910888671875, -2.7431640625, -2.58721923828125, -2.4312744140625, -2.27532958984375, -2.119384765625, -1.96343994140625, -1.8074951171875, -1.65155029296875, -1.49560546875, -1.33966064453125, -1.1837158203125, -1.02777099609375, -0.871826171875, -0.71588134765625, -0.5599365234375, -0.40399169921875, -0.248046875, -0.09210205078125, 0.0638427734375, 0.21978759765625, 0.375732421875, 0.53167724609375, 0.6876220703125, 0.84356689453125, 0.99951171875, 1.15545654296875, 1.3114013671875, 1.46734619140625, 1.623291015625, 1.77923583984375, 1.9351806640625, 2.09112548828125, 2.2470703125, 2.40301513671875, 2.5589599609375, 2.71490478515625, 2.870849609375, 3.02679443359375, 3.1827392578125, 3.33868408203125, 3.49462890625, 3.65057373046875, 3.8065185546875, 3.96246337890625, 4.118408203125, 4.27435302734375, 4.4302978515625, 4.58624267578125, 4.7421875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 11.0, 11.0, 21.0, 22.0, 28.0, 65.0, 66.0, 83.0, 100.0, 115.0, 102.0, 111.0, 75.0, 55.0, 43.0, 29.0, 25.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.24700927734375, -5.0916748046875, -4.93634033203125, -4.781005859375, -4.62567138671875, -4.4703369140625, -4.31500244140625, -4.15966796875, -4.00433349609375, -3.8489990234375, -3.69366455078125, -3.538330078125, -3.38299560546875, -3.2276611328125, -3.07232666015625, -2.9169921875, -2.76165771484375, -2.6063232421875, -2.45098876953125, -2.295654296875, -2.14031982421875, -1.9849853515625, -1.82965087890625, -1.67431640625, -1.51898193359375, -1.3636474609375, -1.20831298828125, -1.052978515625, -0.89764404296875, -0.7423095703125, -0.58697509765625, -0.431640625, -0.27630615234375, -0.1209716796875, 0.03436279296875, 0.189697265625, 0.34503173828125, 0.5003662109375, 0.65570068359375, 0.81103515625, 0.96636962890625, 1.1217041015625, 1.27703857421875, 1.432373046875, 1.58770751953125, 1.7430419921875, 1.89837646484375, 2.0537109375, 2.20904541015625, 2.3643798828125, 2.51971435546875, 2.675048828125, 2.83038330078125, 2.9857177734375, 3.14105224609375, 3.29638671875, 3.45172119140625, 3.6070556640625, 3.76239013671875, 3.917724609375, 4.07305908203125, 4.2283935546875, 4.38372802734375, 4.5390625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 5.0, 10.0, 9.0, 15.0, 9.0, 16.0, 30.0, 46.0, 55.0, 94.0, 145.0, 241.0, 710.0, 3420.0, 40744.0, 4011846.0, 128973.0, 6085.0, 1024.0, 346.0, 145.0, 70.0, 51.0, 34.0, 32.0, 23.0, 10.0, 11.0, 9.0, 12.0, 7.0, 6.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7421875, -9.45263671875, -9.1630859375, -8.87353515625, -8.583984375, -8.29443359375, -8.0048828125, -7.71533203125, -7.42578125, -7.13623046875, -6.8466796875, -6.55712890625, -6.267578125, -5.97802734375, -5.6884765625, -5.39892578125, -5.109375, -4.81982421875, -4.5302734375, -4.24072265625, -3.951171875, -3.66162109375, -3.3720703125, -3.08251953125, -2.79296875, -2.50341796875, -2.2138671875, -1.92431640625, -1.634765625, -1.34521484375, -1.0556640625, -0.76611328125, -0.4765625, -0.18701171875, 0.1025390625, 0.39208984375, 0.681640625, 0.97119140625, 1.2607421875, 1.55029296875, 1.83984375, 2.12939453125, 2.4189453125, 2.70849609375, 2.998046875, 3.28759765625, 3.5771484375, 3.86669921875, 4.15625, 4.44580078125, 4.7353515625, 5.02490234375, 5.314453125, 5.60400390625, 5.8935546875, 6.18310546875, 6.47265625, 6.76220703125, 7.0517578125, 7.34130859375, 7.630859375, 7.92041015625, 8.2099609375, 8.49951171875, 8.7890625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 7.0, 4.0, 4.0, 19.0, 12.0, 13.0, 27.0, 26.0, 44.0, 49.0, 50.0, 75.0, 110.0, 158.0, 262.0, 480.0, 1117.0, 582.0, 304.0, 183.0, 116.0, 105.0, 55.0, 57.0, 46.0, 30.0, 31.0, 14.0, 19.0, 12.0, 5.0, 11.0, 3.0, 4.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6170501708984375, -0.592987060546875, -0.5689239501953125, -0.54486083984375, -0.5207977294921875, -0.496734619140625, -0.4726715087890625, -0.4486083984375, -0.4245452880859375, -0.400482177734375, -0.3764190673828125, -0.35235595703125, -0.3282928466796875, -0.304229736328125, -0.2801666259765625, -0.256103515625, -0.2320404052734375, -0.207977294921875, -0.1839141845703125, -0.15985107421875, -0.1357879638671875, -0.111724853515625, -0.0876617431640625, -0.0635986328125, -0.0395355224609375, -0.015472412109375, 0.0085906982421875, 0.03265380859375, 0.0567169189453125, 0.080780029296875, 0.1048431396484375, 0.12890625, 0.1529693603515625, 0.177032470703125, 0.2010955810546875, 0.22515869140625, 0.2492218017578125, 0.273284912109375, 0.2973480224609375, 0.3214111328125, 0.3454742431640625, 0.369537353515625, 0.3936004638671875, 0.41766357421875, 0.4417266845703125, 0.465789794921875, 0.4898529052734375, 0.513916015625, 0.5379791259765625, 0.562042236328125, 0.5861053466796875, 0.61016845703125, 0.6342315673828125, 0.658294677734375, 0.6823577880859375, 0.7064208984375, 0.7304840087890625, 0.754547119140625, 0.7786102294921875, 0.80267333984375, 0.8267364501953125, 0.850799560546875, 0.8748626708984375, 0.89892578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 17.0, 21.0, 40.0, 68.0, 152.0, 172.0, 186.0, 123.0, 78.0, 48.0, 26.0, 13.0, 12.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.059237003326416, -6.852049827575684, -6.644863128662109, -6.437675952911377, -6.2304887771606445, -6.023301601409912, -5.81611442565918, -5.6089277267456055, -5.401740550994873, -5.194553375244141, -4.987366676330566, -4.780179500579834, -4.572992324829102, -4.365805149078369, -4.158617973327637, -3.9514312744140625, -3.74424409866333, -3.5370569229125977, -3.3298699855804443, -3.122683048248291, -2.9154958724975586, -2.708308696746826, -2.501121759414673, -2.2939348220825195, -2.086747646331787, -1.8795605897903442, -1.6723735332489014, -1.4651864767074585, -1.2579994201660156, -1.0508123636245728, -0.8436253070831299, -0.636438250541687, -0.42925071716308594, -0.22206366062164307, -0.014876604080200195, 0.19231045246124268, 0.39949750900268555, 0.6066845655441284, 0.8138716220855713, 1.0210586786270142, 1.228245735168457, 1.4354327917099, 1.6426198482513428, 1.8498069047927856, 2.0569939613342285, 2.264181137084961, 2.4713680744171143, 2.6785550117492676, 2.8857421875, 3.0929293632507324, 3.3001163005828857, 3.507303237915039, 3.7144904136657715, 3.921677589416504, 4.128864288330078, 4.3360514640808105, 4.543238639831543, 4.750425815582275, 4.957612991333008, 5.164799690246582, 5.3719868659973145, 5.579174041748047, 5.786360740661621, 5.9935479164123535, 6.200735092163086]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 10.0, 11.0, 14.0, 17.0, 30.0, 40.0, 49.0, 49.0, 75.0, 83.0, 88.0, 83.0, 103.0, 63.0, 68.0, 65.0, 39.0, 29.0, 21.0, 13.0, 15.0, 9.0, 11.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.132678031921387, -4.987570285797119, -4.842462539672852, -4.697354793548584, -4.552247047424316, -4.407139301300049, -4.262031555175781, -4.1169233322143555, -3.971815824508667, -3.8267080783843994, -3.681600332260132, -3.5364925861358643, -3.3913846015930176, -3.24627685546875, -3.1011691093444824, -2.956061363220215, -2.8109536170959473, -2.6658458709716797, -2.520738124847412, -2.3756303787231445, -2.230522632598877, -2.0854148864746094, -1.9403069019317627, -1.7951991558074951, -1.6500914096832275, -1.50498366355896, -1.3598759174346924, -1.2147680521011353, -1.0696603059768677, -0.9245525598526001, -0.7794447541236877, -0.6343369483947754, -0.4892292022705078, -0.34412142634391785, -0.19901365041732788, -0.053905874490737915, 0.09120190143585205, 0.23630964756011963, 0.381417453289032, 0.5265252590179443, 0.6716330051422119, 0.8167407512664795, 0.9618485569953918, 1.1069563627243042, 1.2520641088485718, 1.3971718549728394, 1.5422797203063965, 1.687387466430664, 1.8324952125549316, 1.9776029586791992, 2.122710704803467, 2.2678184509277344, 2.412926197052002, 2.5580339431762695, 2.703141927719116, 2.848249673843384, 2.9933574199676514, 3.138465166091919, 3.2835729122161865, 3.428680658340454, 3.573788642883301, 3.7188963890075684, 3.864004135131836, 4.0091118812561035, 4.154219627380371]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 7.0, 10.0, 8.0, 17.0, 33.0, 39.0, 72.0, 128.0, 224.0, 386.0, 862.0, 2158.0, 6433.0, 27595.0, 249993.0, 671332.0, 70686.0, 12372.0, 3584.0, 1288.0, 573.0, 284.0, 162.0, 99.0, 55.0, 26.0, 25.0, 22.0, 10.0, 14.0, 5.0, 10.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.4443359375, -0.43271636962890625, -0.4210968017578125, -0.40947723388671875, -0.397857666015625, -0.38623809814453125, -0.3746185302734375, -0.36299896240234375, -0.35137939453125, -0.33975982666015625, -0.3281402587890625, -0.31652069091796875, -0.304901123046875, -0.29328155517578125, -0.2816619873046875, -0.27004241943359375, -0.2584228515625, -0.24680328369140625, -0.2351837158203125, -0.22356414794921875, -0.211944580078125, -0.20032501220703125, -0.1887054443359375, -0.17708587646484375, -0.16546630859375, -0.15384674072265625, -0.1422271728515625, -0.13060760498046875, -0.118988037109375, -0.10736846923828125, -0.0957489013671875, -0.08412933349609375, -0.072509765625, -0.06089019775390625, -0.0492706298828125, -0.03765106201171875, -0.026031494140625, -0.01441192626953125, -0.0027923583984375, 0.00882720947265625, 0.02044677734375, 0.03206634521484375, 0.0436859130859375, 0.05530548095703125, 0.066925048828125, 0.07854461669921875, 0.0901641845703125, 0.10178375244140625, 0.1134033203125, 0.12502288818359375, 0.1366424560546875, 0.14826202392578125, 0.159881591796875, 0.17150115966796875, 0.1831207275390625, 0.19474029541015625, 0.20635986328125, 0.21797943115234375, 0.2295989990234375, 0.24121856689453125, 0.252838134765625, 0.26445770263671875, 0.2760772705078125, 0.28769683837890625, 0.29931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 13.0, 26.0, 37.0, 41.0, 59.0, 74.0, 104.0, 117.0, 123.0, 109.0, 97.0, 50.0, 52.0, 25.0, 18.0, 11.0, 11.0, 11.0, 5.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.614105224609375, -4.48602294921875, -4.357940673828125, -4.2298583984375, -4.101776123046875, -3.97369384765625, -3.845611572265625, -3.717529296875, -3.589447021484375, -3.46136474609375, -3.333282470703125, -3.2052001953125, -3.077117919921875, -2.94903564453125, -2.820953369140625, -2.69287109375, -2.564788818359375, -2.43670654296875, -2.308624267578125, -2.1805419921875, -2.052459716796875, -1.92437744140625, -1.796295166015625, -1.668212890625, -1.540130615234375, -1.41204833984375, -1.283966064453125, -1.1558837890625, -1.027801513671875, -0.89971923828125, -0.771636962890625, -0.6435546875, -0.515472412109375, -0.38739013671875, -0.259307861328125, -0.1312255859375, -0.003143310546875, 0.12493896484375, 0.253021240234375, 0.381103515625, 0.509185791015625, 0.63726806640625, 0.765350341796875, 0.8934326171875, 1.021514892578125, 1.14959716796875, 1.277679443359375, 1.40576171875, 1.533843994140625, 1.66192626953125, 1.790008544921875, 1.9180908203125, 2.046173095703125, 2.17425537109375, 2.302337646484375, 2.430419921875, 2.558502197265625, 2.68658447265625, 2.814666748046875, 2.9427490234375, 3.070831298828125, 3.19891357421875, 3.326995849609375, 3.455078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 17.0, 15.0, 14.0, 22.0, 29.0, 39.0, 56.0, 83.0, 131.0, 203.0, 364.0, 757.0, 2969.0, 34023.0, 692449.0, 300210.0, 13762.0, 1932.0, 587.0, 284.0, 156.0, 112.0, 87.0, 45.0, 46.0, 36.0, 26.0, 13.0, 13.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3572883605957031, -0.34397125244140625, -0.3306541442871094, -0.3173370361328125, -0.3040199279785156, -0.29070281982421875, -0.2773857116699219, -0.264068603515625, -0.2507514953613281, -0.23743438720703125, -0.22411727905273438, -0.2108001708984375, -0.19748306274414062, -0.18416595458984375, -0.17084884643554688, -0.15753173828125, -0.14421463012695312, -0.13089752197265625, -0.11758041381835938, -0.1042633056640625, -0.09094619750976562, -0.07762908935546875, -0.06431198120117188, -0.050994873046875, -0.037677764892578125, -0.02436065673828125, -0.011043548583984375, 0.0022735595703125, 0.015590667724609375, 0.02890777587890625, 0.042224884033203125, 0.0555419921875, 0.06885910034179688, 0.08217620849609375, 0.09549331665039062, 0.1088104248046875, 0.12212753295898438, 0.13544464111328125, 0.14876174926757812, 0.162078857421875, 0.17539596557617188, 0.18871307373046875, 0.20203018188476562, 0.2153472900390625, 0.22866439819335938, 0.24198150634765625, 0.2552986145019531, 0.26861572265625, 0.2819328308105469, 0.29524993896484375, 0.3085670471191406, 0.3218841552734375, 0.3352012634277344, 0.34851837158203125, 0.3618354797363281, 0.375152587890625, 0.3884696960449219, 0.40178680419921875, 0.4151039123535156, 0.4284210205078125, 0.4417381286621094, 0.45505523681640625, 0.4683723449707031, 0.481689453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 7.0, 6.0, 7.0, 6.0, 13.0, 12.0, 17.0, 16.0, 29.0, 37.0, 36.0, 32.0, 34.0, 49.0, 43.0, 63.0, 40.0, 57.0, 76.0, 37.0, 53.0, 46.0, 51.0, 40.0, 43.0, 36.0, 26.0, 17.0, 15.0, 16.0, 9.0, 5.0, 7.0, 4.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.73828125, -4.5946044921875, -4.450927734375, -4.3072509765625, -4.16357421875, -4.0198974609375, -3.876220703125, -3.7325439453125, -3.5888671875, -3.4451904296875, -3.301513671875, -3.1578369140625, -3.01416015625, -2.8704833984375, -2.726806640625, -2.5831298828125, -2.439453125, -2.2957763671875, -2.152099609375, -2.0084228515625, -1.86474609375, -1.7210693359375, -1.577392578125, -1.4337158203125, -1.2900390625, -1.1463623046875, -1.002685546875, -0.8590087890625, -0.71533203125, -0.5716552734375, -0.427978515625, -0.2843017578125, -0.140625, 0.0030517578125, 0.146728515625, 0.2904052734375, 0.43408203125, 0.5777587890625, 0.721435546875, 0.8651123046875, 1.0087890625, 1.1524658203125, 1.296142578125, 1.4398193359375, 1.58349609375, 1.7271728515625, 1.870849609375, 2.0145263671875, 2.158203125, 2.3018798828125, 2.445556640625, 2.5892333984375, 2.73291015625, 2.8765869140625, 3.020263671875, 3.1639404296875, 3.3076171875, 3.4512939453125, 3.594970703125, 3.7386474609375, 3.88232421875, 4.0260009765625, 4.169677734375, 4.3133544921875, 4.45703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 11.0, 5.0, 10.0, 16.0, 12.0, 33.0, 27.0, 53.0, 94.0, 182.0, 434.0, 1999.0, 128660.0, 913221.0, 2740.0, 531.0, 197.0, 105.0, 61.0, 36.0, 28.0, 11.0, 11.0, 13.0, 10.0, 6.0, 7.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.382080078125, -0.37230491638183594, -0.3625297546386719, -0.3527545928955078, -0.34297943115234375, -0.3332042694091797, -0.3234291076660156, -0.31365394592285156, -0.3038787841796875, -0.29410362243652344, -0.2843284606933594, -0.2745532989501953, -0.26477813720703125, -0.2550029754638672, -0.24522781372070312, -0.23545265197753906, -0.225677490234375, -0.21590232849121094, -0.20612716674804688, -0.1963520050048828, -0.18657684326171875, -0.1768016815185547, -0.16702651977539062, -0.15725135803222656, -0.1474761962890625, -0.13770103454589844, -0.12792587280273438, -0.11815071105957031, -0.10837554931640625, -0.09860038757324219, -0.08882522583007812, -0.07905006408691406, -0.06927490234375, -0.05949974060058594, -0.049724578857421875, -0.03994941711425781, -0.03017425537109375, -0.020399093627929688, -0.010623931884765625, -0.0008487701416015625, 0.0089263916015625, 0.018701553344726562, 0.028476715087890625, 0.03825187683105469, 0.04802703857421875, 0.05780220031738281, 0.06757736206054688, 0.07735252380371094, 0.087127685546875, 0.09690284729003906, 0.10667800903320312, 0.11645317077636719, 0.12622833251953125, 0.1360034942626953, 0.14577865600585938, 0.15555381774902344, 0.1653289794921875, 0.17510414123535156, 0.18487930297851562, 0.1946544647216797, 0.20442962646484375, 0.2142047882080078, 0.22397994995117188, 0.23375511169433594, 0.2435302734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 6.0, 1.0, 8.0, 16.0, 10.0, 13.0, 16.0, 32.0, 33.0, 41.0, 53.0, 54.0, 78.0, 109.0, 89.0, 81.0, 59.0, 53.0, 44.0, 34.0, 27.0, 28.0, 28.0, 21.0, 8.0, 11.0, 11.0, 8.0, 4.0, 5.0, 1.0, 0.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2961368560791016e-05, -3.194250166416168e-05, -3.092363476753235e-05, -2.9904767870903015e-05, -2.888590097427368e-05, -2.7867034077644348e-05, -2.6848167181015015e-05, -2.582930028438568e-05, -2.4810433387756348e-05, -2.3791566491127014e-05, -2.277269959449768e-05, -2.1753832697868347e-05, -2.0734965801239014e-05, -1.971609890460968e-05, -1.8697232007980347e-05, -1.7678365111351013e-05, -1.665949821472168e-05, -1.5640631318092346e-05, -1.4621764421463013e-05, -1.360289752483368e-05, -1.2584030628204346e-05, -1.1565163731575012e-05, -1.0546296834945679e-05, -9.527429938316345e-06, -8.508563041687012e-06, -7.489696145057678e-06, -6.470829248428345e-06, -5.451962351799011e-06, -4.433095455169678e-06, -3.4142285585403442e-06, -2.3953616619110107e-06, -1.3764947652816772e-06, -3.5762786865234375e-07, 6.612390279769897e-07, 1.6801059246063232e-06, 2.6989728212356567e-06, 3.7178397178649902e-06, 4.736706614494324e-06, 5.755573511123657e-06, 6.774440407752991e-06, 7.793307304382324e-06, 8.812174201011658e-06, 9.831041097640991e-06, 1.0849907994270325e-05, 1.1868774890899658e-05, 1.2887641787528992e-05, 1.3906508684158325e-05, 1.4925375580787659e-05, 1.5944242477416992e-05, 1.6963109374046326e-05, 1.798197627067566e-05, 1.9000843167304993e-05, 2.0019710063934326e-05, 2.103857696056366e-05, 2.2057443857192993e-05, 2.3076310753822327e-05, 2.409517765045166e-05, 2.5114044547080994e-05, 2.6132911443710327e-05, 2.715177834033966e-05, 2.8170645236968994e-05, 2.9189512133598328e-05, 3.020837903022766e-05, 3.1227245926856995e-05, 3.224611282348633e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 10.0, 18.0, 19.0, 31.0, 55.0, 106.0, 246.0, 759.0, 3293.0, 39317.0, 977987.0, 23145.0, 2495.0, 616.0, 207.0, 93.0, 51.0, 33.0, 14.0, 15.0, 7.0, 5.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.30224609375, -0.29346466064453125, -0.2846832275390625, -0.27590179443359375, -0.267120361328125, -0.25833892822265625, -0.2495574951171875, -0.24077606201171875, -0.23199462890625, -0.22321319580078125, -0.2144317626953125, -0.20565032958984375, -0.196868896484375, -0.18808746337890625, -0.1793060302734375, -0.17052459716796875, -0.1617431640625, -0.15296173095703125, -0.1441802978515625, -0.13539886474609375, -0.126617431640625, -0.11783599853515625, -0.1090545654296875, -0.10027313232421875, -0.09149169921875, -0.08271026611328125, -0.0739288330078125, -0.06514739990234375, -0.056365966796875, -0.04758453369140625, -0.0388031005859375, -0.03002166748046875, -0.021240234375, -0.01245880126953125, -0.0036773681640625, 0.00510406494140625, 0.013885498046875, 0.02266693115234375, 0.0314483642578125, 0.04022979736328125, 0.04901123046875, 0.05779266357421875, 0.0665740966796875, 0.07535552978515625, 0.084136962890625, 0.09291839599609375, 0.1016998291015625, 0.11048126220703125, 0.1192626953125, 0.12804412841796875, 0.1368255615234375, 0.14560699462890625, 0.154388427734375, 0.16316986083984375, 0.1719512939453125, 0.18073272705078125, 0.18951416015625, 0.19829559326171875, 0.2070770263671875, 0.21585845947265625, 0.224639892578125, 0.23342132568359375, 0.2422027587890625, 0.25098419189453125, 0.259765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 6.0, 13.0, 9.0, 18.0, 9.0, 24.0, 51.0, 108.0, 269.0, 238.0, 93.0, 56.0, 22.0, 13.0, 17.0, 7.0, 11.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042510986328125, -0.041086673736572266, -0.03966236114501953, -0.0382380485534668, -0.03681373596191406, -0.03538942337036133, -0.033965110778808594, -0.03254079818725586, -0.031116485595703125, -0.02969217300415039, -0.028267860412597656, -0.026843547821044922, -0.025419235229492188, -0.023994922637939453, -0.02257061004638672, -0.021146297454833984, -0.01972198486328125, -0.018297672271728516, -0.01687335968017578, -0.015449047088623047, -0.014024734497070312, -0.012600421905517578, -0.011176109313964844, -0.00975179672241211, -0.008327484130859375, -0.006903171539306641, -0.005478858947753906, -0.004054546356201172, -0.0026302337646484375, -0.0012059211730957031, 0.00021839141845703125, 0.0016427040100097656, 0.0030670166015625, 0.004491329193115234, 0.005915641784667969, 0.007339954376220703, 0.008764266967773438, 0.010188579559326172, 0.011612892150878906, 0.01303720474243164, 0.014461517333984375, 0.01588582992553711, 0.017310142517089844, 0.018734455108642578, 0.020158767700195312, 0.021583080291748047, 0.02300739288330078, 0.024431705474853516, 0.02585601806640625, 0.027280330657958984, 0.02870464324951172, 0.030128955841064453, 0.03155326843261719, 0.03297758102416992, 0.034401893615722656, 0.03582620620727539, 0.037250518798828125, 0.03867483139038086, 0.040099143981933594, 0.04152345657348633, 0.04294776916503906, 0.0443720817565918, 0.04579639434814453, 0.047220706939697266, 0.04864501953125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 9.0, 10.0, 25.0, 38.0, 93.0, 198.0, 225.0, 194.0, 87.0, 41.0, 26.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8823747634887695, -5.711939811706543, -5.541504859924316, -5.37106990814209, -5.200634956359863, -5.030200481414795, -4.859765529632568, -4.689330577850342, -4.518895626068115, -4.348460674285889, -4.178025722503662, -4.0075907707214355, -3.837156057357788, -3.6667211055755615, -3.496286392211914, -3.3258514404296875, -3.155416488647461, -2.9849815368652344, -2.814546585083008, -2.6441118717193604, -2.473676919937134, -2.3032419681549072, -2.1328072547912598, -1.9623723030090332, -1.7919373512268066, -1.62150239944458, -1.451067566871643, -1.280632734298706, -1.1101977825164795, -0.9397628903388977, -0.7693279981613159, -0.5988931655883789, -0.42845869064331055, -0.25802379846572876, -0.08758890628814697, 0.08284598588943481, 0.2532808780670166, 0.4237157702445984, 0.5941506624221802, 0.7645854949951172, 0.9350204467773438, 1.1054553985595703, 1.2758902311325073, 1.4463250637054443, 1.616760015487671, 1.7871949672698975, 1.9576297998428345, 2.1280646324157715, 2.298499584197998, 2.4689345359802246, 2.639369487762451, 2.8098042011260986, 2.980239152908325, 3.1506741046905518, 3.321108818054199, 3.491543769836426, 3.6619787216186523, 3.832413673400879, 4.0028486251831055, 4.173283576965332, 4.343718528747559, 4.514153003692627, 4.6845879554748535, 4.85502290725708, 5.025457859039307]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 21.0, 16.0, 41.0, 49.0, 65.0, 73.0, 106.0, 103.0, 113.0, 104.0, 81.0, 59.0, 43.0, 30.0, 20.0, 13.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.253957748413086, -4.1391191482543945, -4.024280548095703, -3.909442186355591, -3.7946035861968994, -3.679764986038208, -3.5649266242980957, -3.4500880241394043, -3.335249423980713, -3.2204108238220215, -3.10557222366333, -2.9907338619232178, -2.8758952617645264, -2.761056661605835, -2.6462182998657227, -2.5313796997070312, -2.41654109954834, -2.3017024993896484, -2.186863899230957, -2.0720255374908447, -1.9571869373321533, -1.842348337173462, -1.72750985622406, -1.6126713752746582, -1.4978327751159668, -1.3829941749572754, -1.2681556940078735, -1.1533172130584717, -1.0384786128997803, -0.9236400723457336, -0.808801531791687, -0.6939629912376404, -0.5791242122650146, -0.464285671710968, -0.3494471311569214, -0.23460859060287476, -0.11977005004882812, -0.004931509494781494, 0.10990703105926514, 0.22474557161331177, 0.3395841121673584, 0.45442265272140503, 0.5692611932754517, 0.6840997338294983, 0.7989382743835449, 0.9137768149375916, 1.0286153554916382, 1.14345383644104, 1.2582924365997314, 1.3731310367584229, 1.4879695177078247, 1.6028079986572266, 1.717646598815918, 1.8324851989746094, 1.9473236799240112, 2.062162160873413, 2.1770007610321045, 2.291839361190796, 2.406677722930908, 2.5215163230895996, 2.636354923248291, 2.7511935234069824, 2.866032123565674, 2.980870485305786, 3.0957090854644775]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 13.0, 29.0, 76.0, 132.0, 358.0, 1330.0, 10804.0, 485835.0, 536622.0, 11331.0, 1404.0, 336.0, 126.0, 63.0, 30.0, 9.0, 15.0, 10.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.20391845703125, -5.9742431640625, -5.74456787109375, -5.514892578125, -5.28521728515625, -5.0555419921875, -4.82586669921875, -4.59619140625, -4.36651611328125, -4.1368408203125, -3.90716552734375, -3.677490234375, -3.44781494140625, -3.2181396484375, -2.98846435546875, -2.7587890625, -2.52911376953125, -2.2994384765625, -2.06976318359375, -1.840087890625, -1.61041259765625, -1.3807373046875, -1.15106201171875, -0.92138671875, -0.69171142578125, -0.4620361328125, -0.23236083984375, -0.002685546875, 0.22698974609375, 0.4566650390625, 0.68634033203125, 0.916015625, 1.14569091796875, 1.3753662109375, 1.60504150390625, 1.834716796875, 2.06439208984375, 2.2940673828125, 2.52374267578125, 2.75341796875, 2.98309326171875, 3.2127685546875, 3.44244384765625, 3.672119140625, 3.90179443359375, 4.1314697265625, 4.36114501953125, 4.5908203125, 4.82049560546875, 5.0501708984375, 5.27984619140625, 5.509521484375, 5.73919677734375, 5.9688720703125, 6.19854736328125, 6.42822265625, 6.65789794921875, 6.8875732421875, 7.11724853515625, 7.346923828125, 7.57659912109375, 7.8062744140625, 8.03594970703125, 8.265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 15.0, 26.0, 65.0, 124.0, 227.0, 268.0, 154.0, 64.0, 24.0, 19.0, 13.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -31.452880859375, -30.81201171875, -30.171142578125, -29.5302734375, -28.889404296875, -28.24853515625, -27.607666015625, -26.966796875, -26.325927734375, -25.68505859375, -25.044189453125, -24.4033203125, -23.762451171875, -23.12158203125, -22.480712890625, -21.83984375, -21.198974609375, -20.55810546875, -19.917236328125, -19.2763671875, -18.635498046875, -17.99462890625, -17.353759765625, -16.712890625, -16.072021484375, -15.43115234375, -14.790283203125, -14.1494140625, -13.508544921875, -12.86767578125, -12.226806640625, -11.5859375, -10.945068359375, -10.30419921875, -9.663330078125, -9.0224609375, -8.381591796875, -7.74072265625, -7.099853515625, -6.458984375, -5.818115234375, -5.17724609375, -4.536376953125, -3.8955078125, -3.254638671875, -2.61376953125, -1.972900390625, -1.33203125, -0.691162109375, -0.05029296875, 0.590576171875, 1.2314453125, 1.872314453125, 2.51318359375, 3.154052734375, 3.794921875, 4.435791015625, 5.07666015625, 5.717529296875, 6.3583984375, 6.999267578125, 7.64013671875, 8.281005859375, 8.921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 6.0, 20.0, 15.0, 20.0, 29.0, 57.0, 76.0, 121.0, 225.0, 478.0, 1382.0, 6399.0, 88194.0, 879927.0, 63851.0, 5588.0, 1209.0, 431.0, 198.0, 115.0, 63.0, 45.0, 39.0, 23.0, 12.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.532470703125, -4.39697265625, -4.261474609375, -4.1259765625, -3.990478515625, -3.85498046875, -3.719482421875, -3.583984375, -3.448486328125, -3.31298828125, -3.177490234375, -3.0419921875, -2.906494140625, -2.77099609375, -2.635498046875, -2.5, -2.364501953125, -2.22900390625, -2.093505859375, -1.9580078125, -1.822509765625, -1.68701171875, -1.551513671875, -1.416015625, -1.280517578125, -1.14501953125, -1.009521484375, -0.8740234375, -0.738525390625, -0.60302734375, -0.467529296875, -0.33203125, -0.196533203125, -0.06103515625, 0.074462890625, 0.2099609375, 0.345458984375, 0.48095703125, 0.616455078125, 0.751953125, 0.887451171875, 1.02294921875, 1.158447265625, 1.2939453125, 1.429443359375, 1.56494140625, 1.700439453125, 1.8359375, 1.971435546875, 2.10693359375, 2.242431640625, 2.3779296875, 2.513427734375, 2.64892578125, 2.784423828125, 2.919921875, 3.055419921875, 3.19091796875, 3.326416015625, 3.4619140625, 3.597412109375, 3.73291015625, 3.868408203125, 4.00390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 9.0, 7.0, 16.0, 20.0, 15.0, 26.0, 26.0, 33.0, 27.0, 28.0, 40.0, 48.0, 50.0, 58.0, 47.0, 53.0, 62.0, 63.0, 47.0, 42.0, 39.0, 43.0, 35.0, 24.0, 28.0, 21.0, 13.0, 17.0, 14.0, 17.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.85546875, -7.634521484375, -7.41357421875, -7.192626953125, -6.9716796875, -6.750732421875, -6.52978515625, -6.308837890625, -6.087890625, -5.866943359375, -5.64599609375, -5.425048828125, -5.2041015625, -4.983154296875, -4.76220703125, -4.541259765625, -4.3203125, -4.099365234375, -3.87841796875, -3.657470703125, -3.4365234375, -3.215576171875, -2.99462890625, -2.773681640625, -2.552734375, -2.331787109375, -2.11083984375, -1.889892578125, -1.6689453125, -1.447998046875, -1.22705078125, -1.006103515625, -0.78515625, -0.564208984375, -0.34326171875, -0.122314453125, 0.0986328125, 0.319580078125, 0.54052734375, 0.761474609375, 0.982421875, 1.203369140625, 1.42431640625, 1.645263671875, 1.8662109375, 2.087158203125, 2.30810546875, 2.529052734375, 2.75, 2.970947265625, 3.19189453125, 3.412841796875, 3.6337890625, 3.854736328125, 4.07568359375, 4.296630859375, 4.517578125, 4.738525390625, 4.95947265625, 5.180419921875, 5.4013671875, 5.622314453125, 5.84326171875, 6.064208984375, 6.28515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 10.0, 4.0, 7.0, 7.0, 8.0, 8.0, 26.0, 41.0, 54.0, 87.0, 138.0, 252.0, 463.0, 956.0, 2028.0, 4962.0, 16019.0, 74633.0, 509867.0, 363708.0, 54674.0, 12805.0, 4212.0, 1785.0, 781.0, 395.0, 218.0, 147.0, 83.0, 53.0, 40.0, 24.0, 15.0, 7.0, 12.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8388671875, -0.8125762939453125, -0.786285400390625, -0.7599945068359375, -0.73370361328125, -0.7074127197265625, -0.681121826171875, -0.6548309326171875, -0.6285400390625, -0.6022491455078125, -0.575958251953125, -0.5496673583984375, -0.52337646484375, -0.4970855712890625, -0.470794677734375, -0.4445037841796875, -0.418212890625, -0.3919219970703125, -0.365631103515625, -0.3393402099609375, -0.31304931640625, -0.2867584228515625, -0.260467529296875, -0.2341766357421875, -0.2078857421875, -0.1815948486328125, -0.155303955078125, -0.1290130615234375, -0.10272216796875, -0.0764312744140625, -0.050140380859375, -0.0238494873046875, 0.00244140625, 0.0287322998046875, 0.055023193359375, 0.0813140869140625, 0.10760498046875, 0.1338958740234375, 0.160186767578125, 0.1864776611328125, 0.2127685546875, 0.2390594482421875, 0.265350341796875, 0.2916412353515625, 0.31793212890625, 0.3442230224609375, 0.370513916015625, 0.3968048095703125, 0.423095703125, 0.4493865966796875, 0.475677490234375, 0.5019683837890625, 0.52825927734375, 0.5545501708984375, 0.580841064453125, 0.6071319580078125, 0.6334228515625, 0.6597137451171875, 0.686004638671875, 0.7122955322265625, 0.73858642578125, 0.7648773193359375, 0.791168212890625, 0.8174591064453125, 0.84375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 18.0, 32.0, 29.0, 45.0, 70.0, 106.0, 117.0, 133.0, 114.0, 80.0, 62.0, 40.0, 36.0, 26.0, 13.0, 14.0, 17.0, 5.0, 7.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001277923583984375, -0.0001221001148223877, -0.00011640787124633789, -0.00011071562767028809, -0.00010502338409423828, -9.933114051818848e-05, -9.363889694213867e-05, -8.794665336608887e-05, -8.225440979003906e-05, -7.656216621398926e-05, -7.086992263793945e-05, -6.517767906188965e-05, -5.9485435485839844e-05, -5.379319190979004e-05, -4.8100948333740234e-05, -4.240870475769043e-05, -3.6716461181640625e-05, -3.102421760559082e-05, -2.5331974029541016e-05, -1.963973045349121e-05, -1.3947486877441406e-05, -8.255243301391602e-06, -2.562999725341797e-06, 3.129243850708008e-06, 8.821487426757812e-06, 1.4513731002807617e-05, 2.0205974578857422e-05, 2.5898218154907227e-05, 3.159046173095703e-05, 3.7282705307006836e-05, 4.297494888305664e-05, 4.8667192459106445e-05, 5.435943603515625e-05, 6.0051679611206055e-05, 6.574392318725586e-05, 7.143616676330566e-05, 7.712841033935547e-05, 8.282065391540527e-05, 8.851289749145508e-05, 9.420514106750488e-05, 9.989738464355469e-05, 0.00010558962821960449, 0.0001112818717956543, 0.0001169741153717041, 0.0001226663589477539, 0.0001283586025238037, 0.00013405084609985352, 0.00013974308967590332, 0.00014543533325195312, 0.00015112757682800293, 0.00015681982040405273, 0.00016251206398010254, 0.00016820430755615234, 0.00017389655113220215, 0.00017958879470825195, 0.00018528103828430176, 0.00019097328186035156, 0.00019666552543640137, 0.00020235776901245117, 0.00020805001258850098, 0.00021374225616455078, 0.00021943449974060059, 0.0002251267433166504, 0.0002308189868927002, 0.00023651123046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 8.0, 17.0, 20.0, 43.0, 73.0, 178.0, 339.0, 1100.0, 5205.0, 61074.0, 898416.0, 74366.0, 5804.0, 1194.0, 394.0, 137.0, 96.0, 36.0, 22.0, 11.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4159088134765625, -1.358184814453125, -1.3004608154296875, -1.24273681640625, -1.1850128173828125, -1.127288818359375, -1.0695648193359375, -1.0118408203125, -0.9541168212890625, -0.896392822265625, -0.8386688232421875, -0.78094482421875, -0.7232208251953125, -0.665496826171875, -0.6077728271484375, -0.550048828125, -0.4923248291015625, -0.434600830078125, -0.3768768310546875, -0.31915283203125, -0.2614288330078125, -0.203704833984375, -0.1459808349609375, -0.0882568359375, -0.0305328369140625, 0.027191162109375, 0.0849151611328125, 0.14263916015625, 0.2003631591796875, 0.258087158203125, 0.3158111572265625, 0.37353515625, 0.4312591552734375, 0.488983154296875, 0.5467071533203125, 0.60443115234375, 0.6621551513671875, 0.719879150390625, 0.7776031494140625, 0.8353271484375, 0.8930511474609375, 0.950775146484375, 1.0084991455078125, 1.06622314453125, 1.1239471435546875, 1.181671142578125, 1.2393951416015625, 1.297119140625, 1.3548431396484375, 1.412567138671875, 1.4702911376953125, 1.52801513671875, 1.5857391357421875, 1.643463134765625, 1.7011871337890625, 1.7589111328125, 1.8166351318359375, 1.874359130859375, 1.9320831298828125, 1.98980712890625, 2.0475311279296875, 2.105255126953125, 2.1629791259765625, 2.220703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 16.0, 12.0, 15.0, 30.0, 30.0, 29.0, 50.0, 72.0, 65.0, 101.0, 114.0, 108.0, 87.0, 54.0, 51.0, 41.0, 34.0, 15.0, 13.0, 16.0, 9.0, 3.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5673828125, -0.5504837036132812, -0.5335845947265625, -0.5166854858398438, -0.499786376953125, -0.48288726806640625, -0.4659881591796875, -0.44908905029296875, -0.43218994140625, -0.41529083251953125, -0.3983917236328125, -0.38149261474609375, -0.364593505859375, -0.34769439697265625, -0.3307952880859375, -0.31389617919921875, -0.2969970703125, -0.28009796142578125, -0.2631988525390625, -0.24629974365234375, -0.229400634765625, -0.21250152587890625, -0.1956024169921875, -0.17870330810546875, -0.16180419921875, -0.14490509033203125, -0.1280059814453125, -0.11110687255859375, -0.094207763671875, -0.07730865478515625, -0.0604095458984375, -0.04351043701171875, -0.026611328125, -0.00971221923828125, 0.0071868896484375, 0.02408599853515625, 0.040985107421875, 0.05788421630859375, 0.0747833251953125, 0.09168243408203125, 0.10858154296875, 0.12548065185546875, 0.1423797607421875, 0.15927886962890625, 0.176177978515625, 0.19307708740234375, 0.2099761962890625, 0.22687530517578125, 0.2437744140625, 0.26067352294921875, 0.2775726318359375, 0.29447174072265625, 0.311370849609375, 0.32826995849609375, 0.3451690673828125, 0.36206817626953125, 0.37896728515625, 0.39586639404296875, 0.4127655029296875, 0.42966461181640625, 0.446563720703125, 0.46346282958984375, 0.4803619384765625, 0.49726104736328125, 0.51416015625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 7.0, 7.0, 14.0, 97.0, 538.0, 282.0, 45.0, 11.0, 6.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.893657684326172, -27.88878631591797, -26.883914947509766, -25.879043579101562, -24.874170303344727, -23.869298934936523, -22.86442756652832, -21.859556198120117, -20.85468292236328, -19.849811553955078, -18.844940185546875, -17.840068817138672, -16.835195541381836, -15.830324172973633, -14.82545280456543, -13.820581436157227, -12.815710067749023, -11.81083869934082, -10.8059663772583, -9.801095008850098, -8.796222686767578, -7.791351318359375, -6.786479949951172, -5.7816081047058105, -4.776736259460449, -3.771864414215088, -2.7669928073883057, -1.7621212005615234, -0.7572493553161621, 0.24762248992919922, 1.2524938583374023, 2.2573657035827637, 3.262237548828125, 4.267109394073486, 5.271981239318848, 6.276852607727051, 7.281724452972412, 8.286596298217773, 9.291467666625977, 10.29633903503418, 11.3012113571167, 12.306082725524902, 13.310955047607422, 14.315826416015625, 15.320697784423828, 16.32556915283203, 17.330440521240234, 18.33531379699707, 19.340185165405273, 20.345056533813477, 21.34992790222168, 22.354801177978516, 23.35967254638672, 24.364543914794922, 25.369415283203125, 26.374286651611328, 27.37915802001953, 28.384029388427734, 29.388900756835938, 30.39377212524414, 31.398645401000977, 32.40351867675781, 33.40838623046875, 34.41326141357422, 35.41813278198242]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 14.0, 14.0, 15.0, 12.0, 19.0, 33.0, 30.0, 32.0, 55.0, 56.0, 53.0, 67.0, 66.0, 75.0, 57.0, 53.0, 43.0, 65.0, 54.0, 38.0, 38.0, 33.0, 20.0, 22.0, 6.0, 10.0, 12.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.108684539794922, -24.528242111206055, -23.94780158996582, -23.367359161376953, -22.786916732788086, -22.20647621154785, -21.626033782958984, -21.04559326171875, -20.465150833129883, -19.884708404541016, -19.30426788330078, -18.723825454711914, -18.143383026123047, -17.562942504882812, -16.982500076293945, -16.402057647705078, -15.821616172790527, -15.241174697875977, -14.66073226928711, -14.080290794372559, -13.499849319458008, -12.91940689086914, -12.33896541595459, -11.758523941040039, -11.178081512451172, -10.597640037536621, -10.017197608947754, -9.436756134033203, -8.856314659118652, -8.275873184204102, -7.695430755615234, -7.114989280700684, -6.534546852111816, -5.954104900360107, -5.373663425445557, -4.793221473693848, -4.212779998779297, -3.632338047027588, -3.051896095275879, -2.471454620361328, -1.8910126686096191, -1.3105709552764893, -0.7301291227340698, -0.1496872901916504, 0.4307544231414795, 1.0111961364746094, 1.5916380882263184, 2.172079563140869, 2.752521514892578, 3.332963228225708, 3.913404941558838, 4.493846893310547, 5.074288368225098, 5.654730319976807, 6.235172271728516, 6.815613746643066, 7.396055698394775, 7.976497650146484, 8.556939125061035, 9.137380599975586, 9.717823028564453, 10.298264503479004, 10.878705978393555, 11.459148406982422, 12.039589881896973]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 12.0, 16.0, 25.0, 48.0, 55.0, 107.0, 152.0, 259.0, 414.0, 780.0, 1636.0, 3916.0, 11351.0, 49052.0, 527904.0, 3406231.0, 154264.0, 25441.0, 7275.0, 2654.0, 1181.0, 580.0, 355.0, 190.0, 134.0, 87.0, 52.0, 29.0, 23.0, 14.0, 9.0, 8.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.8671875, -3.73046875, -3.59375, -3.45703125, -3.3203125, -3.18359375, -3.046875, -2.91015625, -2.7734375, -2.63671875, -2.5, -2.36328125, -2.2265625, -2.08984375, -1.953125, -1.81640625, -1.6796875, -1.54296875, -1.40625, -1.26953125, -1.1328125, -0.99609375, -0.859375, -0.72265625, -0.5859375, -0.44921875, -0.3125, -0.17578125, -0.0390625, 0.09765625, 0.234375, 0.37109375, 0.5078125, 0.64453125, 0.78125, 0.91796875, 1.0546875, 1.19140625, 1.328125, 1.46484375, 1.6015625, 1.73828125, 1.875, 2.01171875, 2.1484375, 2.28515625, 2.421875, 2.55859375, 2.6953125, 2.83203125, 2.96875, 3.10546875, 3.2421875, 3.37890625, 3.515625, 3.65234375, 3.7890625, 3.92578125, 4.0625, 4.19921875, 4.3359375, 4.47265625, 4.609375, 4.74609375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 7.0, 4.0, 12.0, 13.0, 37.0, 36.0, 43.0, 65.0, 75.0, 102.0, 106.0, 88.0, 97.0, 80.0, 57.0, 49.0, 31.0, 29.0, 15.0, 13.0, 10.0, 12.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.5877685546875, -4.456787109375, -4.3258056640625, -4.19482421875, -4.0638427734375, -3.932861328125, -3.8018798828125, -3.6708984375, -3.5399169921875, -3.408935546875, -3.2779541015625, -3.14697265625, -3.0159912109375, -2.885009765625, -2.7540283203125, -2.623046875, -2.4920654296875, -2.361083984375, -2.2301025390625, -2.09912109375, -1.9681396484375, -1.837158203125, -1.7061767578125, -1.5751953125, -1.4442138671875, -1.313232421875, -1.1822509765625, -1.05126953125, -0.9202880859375, -0.789306640625, -0.6583251953125, -0.52734375, -0.3963623046875, -0.265380859375, -0.1343994140625, -0.00341796875, 0.1275634765625, 0.258544921875, 0.3895263671875, 0.5205078125, 0.6514892578125, 0.782470703125, 0.9134521484375, 1.04443359375, 1.1754150390625, 1.306396484375, 1.4373779296875, 1.568359375, 1.6993408203125, 1.830322265625, 1.9613037109375, 2.09228515625, 2.2232666015625, 2.354248046875, 2.4852294921875, 2.6162109375, 2.7471923828125, 2.878173828125, 3.0091552734375, 3.14013671875, 3.2711181640625, 3.402099609375, 3.5330810546875, 3.6640625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 13.0, 16.0, 37.0, 54.0, 66.0, 96.0, 153.0, 299.0, 567.0, 1217.0, 3369.0, 13185.0, 89821.0, 3569648.0, 472981.0, 32055.0, 6722.0, 2136.0, 842.0, 349.0, 235.0, 119.0, 68.0, 51.0, 35.0, 22.0, 23.0, 15.0, 12.0, 13.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.79437255859375, -4.6434326171875, -4.49249267578125, -4.341552734375, -4.19061279296875, -4.0396728515625, -3.88873291015625, -3.73779296875, -3.58685302734375, -3.4359130859375, -3.28497314453125, -3.134033203125, -2.98309326171875, -2.8321533203125, -2.68121337890625, -2.5302734375, -2.37933349609375, -2.2283935546875, -2.07745361328125, -1.926513671875, -1.77557373046875, -1.6246337890625, -1.47369384765625, -1.32275390625, -1.17181396484375, -1.0208740234375, -0.86993408203125, -0.718994140625, -0.56805419921875, -0.4171142578125, -0.26617431640625, -0.115234375, 0.03570556640625, 0.1866455078125, 0.33758544921875, 0.488525390625, 0.63946533203125, 0.7904052734375, 0.94134521484375, 1.09228515625, 1.24322509765625, 1.3941650390625, 1.54510498046875, 1.696044921875, 1.84698486328125, 1.9979248046875, 2.14886474609375, 2.2998046875, 2.45074462890625, 2.6016845703125, 2.75262451171875, 2.903564453125, 3.05450439453125, 3.2054443359375, 3.35638427734375, 3.50732421875, 3.65826416015625, 3.8092041015625, 3.96014404296875, 4.111083984375, 4.26202392578125, 4.4129638671875, 4.56390380859375, 4.71484375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 7.0, 8.0, 11.0, 13.0, 15.0, 16.0, 20.0, 44.0, 56.0, 63.0, 77.0, 114.0, 154.0, 216.0, 405.0, 710.0, 808.0, 415.0, 239.0, 140.0, 147.0, 89.0, 77.0, 53.0, 40.0, 36.0, 26.0, 11.0, 13.0, 9.0, 9.0, 7.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.73974609375, -0.7159500122070312, -0.6921539306640625, -0.6683578491210938, -0.644561767578125, -0.6207656860351562, -0.5969696044921875, -0.5731735229492188, -0.54937744140625, -0.5255813598632812, -0.5017852783203125, -0.47798919677734375, -0.454193115234375, -0.43039703369140625, -0.4066009521484375, -0.38280487060546875, -0.3590087890625, -0.33521270751953125, -0.3114166259765625, -0.28762054443359375, -0.263824462890625, -0.24002838134765625, -0.2162322998046875, -0.19243621826171875, -0.16864013671875, -0.14484405517578125, -0.1210479736328125, -0.09725189208984375, -0.073455810546875, -0.04965972900390625, -0.0258636474609375, -0.00206756591796875, 0.021728515625, 0.04552459716796875, 0.0693206787109375, 0.09311676025390625, 0.116912841796875, 0.14070892333984375, 0.1645050048828125, 0.18830108642578125, 0.21209716796875, 0.23589324951171875, 0.2596893310546875, 0.28348541259765625, 0.307281494140625, 0.33107757568359375, 0.3548736572265625, 0.37866973876953125, 0.4024658203125, 0.42626190185546875, 0.4500579833984375, 0.47385406494140625, 0.497650146484375, 0.5214462280273438, 0.5452423095703125, 0.5690383911132812, 0.59283447265625, 0.6166305541992188, 0.6404266357421875, 0.6642227172851562, 0.688018798828125, 0.7118148803710938, 0.7356109619140625, 0.7594070434570312, 0.783203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 9.0, 5.0, 13.0, 16.0, 14.0, 50.0, 53.0, 134.0, 145.0, 202.0, 147.0, 82.0, 49.0, 24.0, 11.0, 11.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.659629821777344, -5.472128391265869, -5.2846269607543945, -5.09712553024292, -4.909624099731445, -4.722122669219971, -4.534621238708496, -4.34712028503418, -4.159618377685547, -3.9721169471740723, -3.7846155166625977, -3.597114086151123, -3.4096126556396484, -3.222111225128174, -3.0346100330352783, -2.8471086025238037, -2.659607410430908, -2.4721059799194336, -2.284604549407959, -2.0971031188964844, -1.9096018075942993, -1.7221003770828247, -1.5345990657806396, -1.347097635269165, -1.1595962047576904, -0.9720947742462158, -0.784593403339386, -0.5970920324325562, -0.40959060192108154, -0.22208917140960693, -0.034587860107421875, 0.15291357040405273, 0.34041452407836914, 0.5279159545898438, 0.7154173254966736, 0.9029186964035034, 1.090420126914978, 1.2779215574264526, 1.4654228687286377, 1.6529242992401123, 1.840425729751587, 2.0279271602630615, 2.215428590774536, 2.4029297828674316, 2.5904312133789062, 2.777932643890381, 2.9654340744018555, 3.15293550491333, 3.3404369354248047, 3.5279383659362793, 3.715439796447754, 3.9029412269592285, 4.090442657470703, 4.277944087982178, 4.465445518493652, 4.652946472167969, 4.840448379516602, 5.027949810028076, 5.215451240539551, 5.402952671051025, 5.5904541015625, 5.777955532073975, 5.965456962585449, 6.152957916259766, 6.34045934677124]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 8.0, 8.0, 16.0, 14.0, 29.0, 22.0, 26.0, 49.0, 62.0, 61.0, 71.0, 78.0, 61.0, 62.0, 74.0, 80.0, 45.0, 49.0, 44.0, 26.0, 23.0, 23.0, 14.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03287935256958, -3.9171664714813232, -3.8014535903930664, -3.6857404708862305, -3.5700275897979736, -3.454314708709717, -3.33860182762146, -3.222888946533203, -3.1071760654449463, -2.9914631843566895, -2.8757503032684326, -2.760037422180176, -2.64432430267334, -2.528611421585083, -2.412898540496826, -2.2971856594085693, -2.1814727783203125, -2.0657598972320557, -1.9500468969345093, -1.8343340158462524, -1.7186211347579956, -1.6029081344604492, -1.4871952533721924, -1.3714823722839355, -1.2557692527770996, -1.1400563716888428, -1.0243433713912964, -0.9086304903030396, -0.7929176092147827, -0.6772046685218811, -0.5614917278289795, -0.44577884674072266, -0.3300659656524658, -0.2143530547618866, -0.09864012897014618, 0.01707279682159424, 0.13278570771217346, 0.24849861860275269, 0.3642115592956543, 0.47992444038391113, 0.5956373810768127, 0.7113503217697144, 0.8270632028579712, 0.9427761435508728, 1.0584890842437744, 1.1742019653320312, 1.289914846420288, 1.405627727508545, 1.5213407278060913, 1.6370536088943481, 1.7527666091918945, 1.8684794902801514, 1.9841923713684082, 2.099905252456665, 2.215618133544922, 2.331331253051758, 2.4470441341400146, 2.5627570152282715, 2.6784698963165283, 2.794182777404785, 2.909895896911621, 3.025608777999878, 3.1413216590881348, 3.2570345401763916, 3.3727474212646484]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 1.0, 7.0, 6.0, 14.0, 12.0, 14.0, 31.0, 43.0, 68.0, 131.0, 249.0, 564.0, 1545.0, 5964.0, 38001.0, 672701.0, 302556.0, 20716.0, 3851.0, 1173.0, 425.0, 180.0, 109.0, 63.0, 39.0, 23.0, 19.0, 10.0, 10.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.465087890625, -0.4504890441894531, -0.43589019775390625, -0.4212913513183594, -0.4066925048828125, -0.3920936584472656, -0.37749481201171875, -0.3628959655761719, -0.348297119140625, -0.3336982727050781, -0.31909942626953125, -0.3045005798339844, -0.2899017333984375, -0.2753028869628906, -0.26070404052734375, -0.24610519409179688, -0.23150634765625, -0.21690750122070312, -0.20230865478515625, -0.18770980834960938, -0.1731109619140625, -0.15851211547851562, -0.14391326904296875, -0.12931442260742188, -0.114715576171875, -0.10011672973632812, -0.08551788330078125, -0.07091903686523438, -0.0563201904296875, -0.041721343994140625, -0.02712249755859375, -0.012523651123046875, 0.0020751953125, 0.016674041748046875, 0.03127288818359375, 0.045871734619140625, 0.0604705810546875, 0.07506942749023438, 0.08966827392578125, 0.10426712036132812, 0.118865966796875, 0.13346481323242188, 0.14806365966796875, 0.16266250610351562, 0.1772613525390625, 0.19186019897460938, 0.20645904541015625, 0.22105789184570312, 0.23565673828125, 0.2502555847167969, 0.26485443115234375, 0.2794532775878906, 0.2940521240234375, 0.3086509704589844, 0.32324981689453125, 0.3378486633300781, 0.352447509765625, 0.3670463562011719, 0.38164520263671875, 0.3962440490722656, 0.4108428955078125, 0.4254417419433594, 0.44004058837890625, 0.4546394348144531, 0.46923828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 6.0, 13.0, 10.0, 11.0, 27.0, 19.0, 25.0, 55.0, 40.0, 78.0, 100.0, 82.0, 88.0, 83.0, 67.0, 70.0, 46.0, 42.0, 26.0, 29.0, 20.0, 17.0, 7.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.953125, -2.866912841796875, -2.78070068359375, -2.694488525390625, -2.6082763671875, -2.522064208984375, -2.43585205078125, -2.349639892578125, -2.263427734375, -2.177215576171875, -2.09100341796875, -2.004791259765625, -1.9185791015625, -1.832366943359375, -1.74615478515625, -1.659942626953125, -1.57373046875, -1.487518310546875, -1.40130615234375, -1.315093994140625, -1.2288818359375, -1.142669677734375, -1.05645751953125, -0.970245361328125, -0.884033203125, -0.797821044921875, -0.71160888671875, -0.625396728515625, -0.5391845703125, -0.452972412109375, -0.36676025390625, -0.280548095703125, -0.1943359375, -0.108123779296875, -0.02191162109375, 0.064300537109375, 0.1505126953125, 0.236724853515625, 0.32293701171875, 0.409149169921875, 0.495361328125, 0.581573486328125, 0.66778564453125, 0.753997802734375, 0.8402099609375, 0.926422119140625, 1.01263427734375, 1.098846435546875, 1.18505859375, 1.271270751953125, 1.35748291015625, 1.443695068359375, 1.5299072265625, 1.616119384765625, 1.70233154296875, 1.788543701171875, 1.874755859375, 1.960968017578125, 2.04718017578125, 2.133392333984375, 2.2196044921875, 2.305816650390625, 2.39202880859375, 2.478240966796875, 2.564453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 8.0, 9.0, 12.0, 13.0, 23.0, 38.0, 45.0, 94.0, 87.0, 128.0, 193.0, 303.0, 476.0, 1192.0, 5836.0, 72054.0, 799457.0, 154916.0, 10416.0, 1578.0, 590.0, 327.0, 224.0, 136.0, 93.0, 79.0, 54.0, 45.0, 25.0, 18.0, 15.0, 8.0, 13.0, 10.0, 10.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3585357666015625, -0.347198486328125, -0.3358612060546875, -0.32452392578125, -0.3131866455078125, -0.301849365234375, -0.2905120849609375, -0.2791748046875, -0.2678375244140625, -0.256500244140625, -0.2451629638671875, -0.23382568359375, -0.2224884033203125, -0.211151123046875, -0.1998138427734375, -0.1884765625, -0.1771392822265625, -0.165802001953125, -0.1544647216796875, -0.14312744140625, -0.1317901611328125, -0.120452880859375, -0.1091156005859375, -0.0977783203125, -0.0864410400390625, -0.075103759765625, -0.0637664794921875, -0.05242919921875, -0.0410919189453125, -0.029754638671875, -0.0184173583984375, -0.007080078125, 0.0042572021484375, 0.015594482421875, 0.0269317626953125, 0.03826904296875, 0.0496063232421875, 0.060943603515625, 0.0722808837890625, 0.0836181640625, 0.0949554443359375, 0.106292724609375, 0.1176300048828125, 0.12896728515625, 0.1403045654296875, 0.151641845703125, 0.1629791259765625, 0.17431640625, 0.1856536865234375, 0.196990966796875, 0.2083282470703125, 0.21966552734375, 0.2310028076171875, 0.242340087890625, 0.2536773681640625, 0.2650146484375, 0.2763519287109375, 0.287689208984375, 0.2990264892578125, 0.31036376953125, 0.3217010498046875, 0.333038330078125, 0.3443756103515625, 0.355712890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 3.0, 11.0, 7.0, 13.0, 18.0, 27.0, 28.0, 33.0, 40.0, 57.0, 42.0, 50.0, 46.0, 67.0, 61.0, 51.0, 67.0, 57.0, 51.0, 33.0, 29.0, 32.0, 29.0, 30.0, 20.0, 17.0, 13.0, 12.0, 8.0, 6.0, 13.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74017333984375, -3.6053466796875, -3.47052001953125, -3.335693359375, -3.20086669921875, -3.0660400390625, -2.93121337890625, -2.79638671875, -2.66156005859375, -2.5267333984375, -2.39190673828125, -2.257080078125, -2.12225341796875, -1.9874267578125, -1.85260009765625, -1.7177734375, -1.58294677734375, -1.4481201171875, -1.31329345703125, -1.178466796875, -1.04364013671875, -0.9088134765625, -0.77398681640625, -0.63916015625, -0.50433349609375, -0.3695068359375, -0.23468017578125, -0.099853515625, 0.03497314453125, 0.1697998046875, 0.30462646484375, 0.439453125, 0.57427978515625, 0.7091064453125, 0.84393310546875, 0.978759765625, 1.11358642578125, 1.2484130859375, 1.38323974609375, 1.51806640625, 1.65289306640625, 1.7877197265625, 1.92254638671875, 2.057373046875, 2.19219970703125, 2.3270263671875, 2.46185302734375, 2.5966796875, 2.73150634765625, 2.8663330078125, 3.00115966796875, 3.135986328125, 3.27081298828125, 3.4056396484375, 3.54046630859375, 3.67529296875, 3.81011962890625, 3.9449462890625, 4.07977294921875, 4.214599609375, 4.34942626953125, 4.4842529296875, 4.61907958984375, 4.75390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 5.0, 7.0, 15.0, 13.0, 11.0, 22.0, 30.0, 37.0, 54.0, 49.0, 80.0, 105.0, 108.0, 173.0, 232.0, 317.0, 544.0, 1263.0, 6010.0, 87056.0, 913626.0, 32732.0, 3480.0, 933.0, 466.0, 314.0, 213.0, 159.0, 104.0, 81.0, 64.0, 40.0, 45.0, 29.0, 25.0, 31.0, 14.0, 15.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.06903076171875, -0.06702136993408203, -0.06501197814941406, -0.0630025863647461, -0.060993194580078125, -0.058983802795410156, -0.05697441101074219, -0.05496501922607422, -0.05295562744140625, -0.05094623565673828, -0.04893684387207031, -0.046927452087402344, -0.044918060302734375, -0.042908668518066406, -0.04089927673339844, -0.03888988494873047, -0.0368804931640625, -0.03487110137939453, -0.03286170959472656, -0.030852317810058594, -0.028842926025390625, -0.026833534240722656, -0.024824142456054688, -0.02281475067138672, -0.02080535888671875, -0.01879596710205078, -0.016786575317382812, -0.014777183532714844, -0.012767791748046875, -0.010758399963378906, -0.008749008178710938, -0.006739616394042969, -0.004730224609375, -0.0027208328247070312, -0.0007114410400390625, 0.0012979507446289062, 0.003307342529296875, 0.005316734313964844, 0.0073261260986328125, 0.009335517883300781, 0.01134490966796875, 0.013354301452636719, 0.015363693237304688, 0.017373085021972656, 0.019382476806640625, 0.021391868591308594, 0.023401260375976562, 0.02541065216064453, 0.0274200439453125, 0.02942943572998047, 0.03143882751464844, 0.033448219299316406, 0.035457611083984375, 0.037467002868652344, 0.03947639465332031, 0.04148578643798828, 0.04349517822265625, 0.04550457000732422, 0.04751396179199219, 0.049523353576660156, 0.051532745361328125, 0.053542137145996094, 0.05555152893066406, 0.05756092071533203, 0.0595703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 16.0, 14.0, 18.0, 28.0, 49.0, 59.0, 113.0, 115.0, 114.0, 126.0, 88.0, 68.0, 40.0, 26.0, 28.0, 15.0, 12.0, 17.0, 9.0, 9.0, 8.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0159950256347656e-05, -2.9262155294418335e-05, -2.8364360332489014e-05, -2.7466565370559692e-05, -2.656877040863037e-05, -2.567097544670105e-05, -2.477318048477173e-05, -2.3875385522842407e-05, -2.2977590560913086e-05, -2.2079795598983765e-05, -2.1182000637054443e-05, -2.0284205675125122e-05, -1.93864107131958e-05, -1.848861575126648e-05, -1.7590820789337158e-05, -1.6693025827407837e-05, -1.5795230865478516e-05, -1.4897435903549194e-05, -1.3999640941619873e-05, -1.3101845979690552e-05, -1.220405101776123e-05, -1.130625605583191e-05, -1.0408461093902588e-05, -9.510666131973267e-06, -8.612871170043945e-06, -7.715076208114624e-06, -6.817281246185303e-06, -5.9194862842559814e-06, -5.02169132232666e-06, -4.123896360397339e-06, -3.2261013984680176e-06, -2.3283064365386963e-06, -1.430511474609375e-06, -5.327165126800537e-07, 3.650784492492676e-07, 1.2628734111785889e-06, 2.16066837310791e-06, 3.0584633350372314e-06, 3.956258296966553e-06, 4.854053258895874e-06, 5.751848220825195e-06, 6.649643182754517e-06, 7.547438144683838e-06, 8.44523310661316e-06, 9.34302806854248e-06, 1.0240823030471802e-05, 1.1138617992401123e-05, 1.2036412954330444e-05, 1.2934207916259766e-05, 1.3832002878189087e-05, 1.4729797840118408e-05, 1.562759280204773e-05, 1.652538776397705e-05, 1.7423182725906372e-05, 1.8320977687835693e-05, 1.9218772649765015e-05, 2.0116567611694336e-05, 2.1014362573623657e-05, 2.191215753555298e-05, 2.28099524974823e-05, 2.370774745941162e-05, 2.4605542421340942e-05, 2.5503337383270264e-05, 2.6401132345199585e-05, 2.7298927307128906e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 18.0, 10.0, 18.0, 44.0, 46.0, 70.0, 105.0, 202.0, 299.0, 593.0, 1243.0, 2918.0, 9477.0, 52007.0, 842430.0, 116637.0, 14824.0, 4207.0, 1668.0, 711.0, 400.0, 227.0, 122.0, 68.0, 49.0, 33.0, 18.0, 16.0, 16.0, 12.0, 2.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10235595703125, -0.09931468963623047, -0.09627342224121094, -0.0932321548461914, -0.09019088745117188, -0.08714962005615234, -0.08410835266113281, -0.08106708526611328, -0.07802581787109375, -0.07498455047607422, -0.07194328308105469, -0.06890201568603516, -0.06586074829101562, -0.0628194808959961, -0.05977821350097656, -0.05673694610595703, -0.0536956787109375, -0.05065441131591797, -0.04761314392089844, -0.044571876525878906, -0.041530609130859375, -0.038489341735839844, -0.03544807434082031, -0.03240680694580078, -0.02936553955078125, -0.02632427215576172, -0.023283004760742188, -0.020241737365722656, -0.017200469970703125, -0.014159202575683594, -0.011117935180664062, -0.008076667785644531, -0.005035400390625, -0.0019941329956054688, 0.0010471343994140625, 0.004088401794433594, 0.007129669189453125, 0.010170936584472656, 0.013212203979492188, 0.01625347137451172, 0.01929473876953125, 0.02233600616455078, 0.025377273559570312, 0.028418540954589844, 0.031459808349609375, 0.034501075744628906, 0.03754234313964844, 0.04058361053466797, 0.0436248779296875, 0.04666614532470703, 0.04970741271972656, 0.052748680114746094, 0.055789947509765625, 0.058831214904785156, 0.06187248229980469, 0.06491374969482422, 0.06795501708984375, 0.07099628448486328, 0.07403755187988281, 0.07707881927490234, 0.08012008666992188, 0.0831613540649414, 0.08620262145996094, 0.08924388885498047, 0.09228515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 7.0, 2.0, 5.0, 6.0, 15.0, 16.0, 30.0, 40.0, 63.0, 102.0, 197.0, 190.0, 83.0, 68.0, 35.0, 28.0, 21.0, 14.0, 8.0, 6.0, 11.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019195556640625, -0.018575668334960938, -0.017955780029296875, -0.017335891723632812, -0.01671600341796875, -0.016096115112304688, -0.015476226806640625, -0.014856338500976562, -0.0142364501953125, -0.013616561889648438, -0.012996673583984375, -0.012376785278320312, -0.01175689697265625, -0.011137008666992188, -0.010517120361328125, -0.009897232055664062, -0.00927734375, -0.008657455444335938, -0.008037567138671875, -0.0074176788330078125, -0.00679779052734375, -0.0061779022216796875, -0.005558013916015625, -0.0049381256103515625, -0.0043182373046875, -0.0036983489990234375, -0.003078460693359375, -0.0024585723876953125, -0.00183868408203125, -0.0012187957763671875, -0.000598907470703125, 2.09808349609375e-05, 0.000640869140625, 0.0012607574462890625, 0.001880645751953125, 0.0025005340576171875, 0.00312042236328125, 0.0037403106689453125, 0.004360198974609375, 0.0049800872802734375, 0.0055999755859375, 0.0062198638916015625, 0.006839752197265625, 0.0074596405029296875, 0.00807952880859375, 0.008699417114257812, 0.009319305419921875, 0.009939193725585938, 0.01055908203125, 0.011178970336914062, 0.011798858642578125, 0.012418746948242188, 0.01303863525390625, 0.013658523559570312, 0.014278411865234375, 0.014898300170898438, 0.0155181884765625, 0.016138076782226562, 0.016757965087890625, 0.017377853393554688, 0.01799774169921875, 0.018617630004882812, 0.019237518310546875, 0.019857406616210938, 0.020477294921875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 12.0, 21.0, 32.0, 84.0, 188.0, 278.0, 196.0, 84.0, 30.0, 21.0, 15.0, 4.0, 9.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39328145980835, -5.222194671630859, -5.051107406616211, -4.880020618438721, -4.7089338302612305, -4.537846565246582, -4.366759777069092, -4.195672988891602, -4.024585723876953, -3.853498697280884, -3.6824119091033936, -3.511324882507324, -3.340238094329834, -3.1691510677337646, -2.9980640411376953, -2.826977252960205, -2.655890464782715, -2.4848034381866455, -2.3137166500091553, -2.142629623413086, -1.9715427160263062, -1.8004558086395264, -1.629368782043457, -1.4582818746566772, -1.2871949672698975, -1.1161080598831177, -0.9450210928916931, -0.7739341259002686, -0.6028472185134888, -0.431760311126709, -0.26067328453063965, -0.08958637714385986, 0.08150053024291992, 0.2525874674320221, 0.42367440462112427, 0.5947613716125488, 0.7658482789993286, 0.9369351863861084, 1.1080222129821777, 1.2791091203689575, 1.4501960277557373, 1.621282935142517, 1.7923698425292969, 1.9634568691253662, 2.1345438957214355, 2.305630683898926, 2.476717710494995, 2.6478047370910645, 2.8188915252685547, 2.989978551864624, 3.1610653400421143, 3.3321523666381836, 3.503239154815674, 3.674326181411743, 3.8454132080078125, 4.016499996185303, 4.187586784362793, 4.358673572540283, 4.529760837554932, 4.700847625732422, 4.871934413909912, 5.043021202087402, 5.214108467102051, 5.385195255279541, 5.5562825202941895]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 8.0, 8.0, 6.0, 10.0, 12.0, 16.0, 19.0, 29.0, 37.0, 61.0, 69.0, 82.0, 75.0, 85.0, 86.0, 81.0, 65.0, 53.0, 49.0, 41.0, 29.0, 20.0, 17.0, 13.0, 1.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0085010528564453, -2.9245901107788086, -2.840679168701172, -2.756768226623535, -2.6728570461273193, -2.5889461040496826, -2.505035161972046, -2.421124219894409, -2.3372130393981934, -2.2533020973205566, -2.16939115524292, -2.085480213165283, -2.0015690326690674, -1.9176580905914307, -1.833747148513794, -1.7498362064361572, -1.6659252643585205, -1.5820143222808838, -1.4981032609939575, -1.4141923189163208, -1.3302812576293945, -1.2463703155517578, -1.162459373474121, -1.0785484313964844, -0.9946373701095581, -0.9107263684272766, -0.8268153667449951, -0.7429044246673584, -0.6589934229850769, -0.5750824213027954, -0.4911714792251587, -0.4072604775428772, -0.3233497142791748, -0.2394387274980545, -0.1555277407169342, -0.0716167688369751, 0.012294232845306396, 0.09620523452758789, 0.1801161766052246, 0.2640271782875061, 0.3479381799697876, 0.4318491816520691, 0.5157601833343506, 0.5996711254119873, 0.6835821270942688, 0.7674931287765503, 0.851404070854187, 0.9353150725364685, 1.01922607421875, 1.1031370162963867, 1.187048077583313, 1.2709590196609497, 1.354870080947876, 1.4387810230255127, 1.5226919651031494, 1.6066029071807861, 1.6905139684677124, 1.7744249105453491, 1.8583359718322754, 1.942246913909912, 2.026157855987549, 2.1100687980651855, 2.1939797401428223, 2.277890920639038, 2.361801862716675]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 23.0, 30.0, 36.0, 60.0, 98.0, 186.0, 322.0, 634.0, 1214.0, 2691.0, 6309.0, 17786.0, 62386.0, 297788.0, 501380.0, 112246.0, 28527.0, 9716.0, 3689.0, 1611.0, 813.0, 417.0, 245.0, 121.0, 80.0, 41.0, 37.0, 17.0, 9.0, 6.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.6116485595703125, -1.552398681640625, -1.4931488037109375, -1.43389892578125, -1.3746490478515625, -1.315399169921875, -1.2561492919921875, -1.1968994140625, -1.1376495361328125, -1.078399658203125, -1.0191497802734375, -0.95989990234375, -0.9006500244140625, -0.841400146484375, -0.7821502685546875, -0.722900390625, -0.6636505126953125, -0.604400634765625, -0.5451507568359375, -0.48590087890625, -0.4266510009765625, -0.367401123046875, -0.3081512451171875, -0.2489013671875, -0.1896514892578125, -0.130401611328125, -0.0711517333984375, -0.01190185546875, 0.0473480224609375, 0.106597900390625, 0.1658477783203125, 0.22509765625, 0.2843475341796875, 0.343597412109375, 0.4028472900390625, 0.46209716796875, 0.5213470458984375, 0.580596923828125, 0.6398468017578125, 0.6990966796875, 0.7583465576171875, 0.817596435546875, 0.8768463134765625, 0.93609619140625, 0.9953460693359375, 1.054595947265625, 1.1138458251953125, 1.173095703125, 1.2323455810546875, 1.291595458984375, 1.3508453369140625, 1.41009521484375, 1.4693450927734375, 1.528594970703125, 1.5878448486328125, 1.6470947265625, 1.7063446044921875, 1.765594482421875, 1.8248443603515625, 1.88409423828125, 1.9433441162109375, 2.002593994140625, 2.0618438720703125, 2.12109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 6.0, 7.0, 19.0, 21.0, 20.0, 28.0, 57.0, 61.0, 64.0, 81.0, 88.0, 95.0, 86.0, 58.0, 68.0, 48.0, 42.0, 32.0, 22.0, 24.0, 16.0, 7.0, 1.0, 6.0, 9.0, 1.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.29296875, -7.08709716796875, -6.8812255859375, -6.67535400390625, -6.469482421875, -6.26361083984375, -6.0577392578125, -5.85186767578125, -5.64599609375, -5.44012451171875, -5.2342529296875, -5.02838134765625, -4.822509765625, -4.61663818359375, -4.4107666015625, -4.20489501953125, -3.9990234375, -3.79315185546875, -3.5872802734375, -3.38140869140625, -3.175537109375, -2.96966552734375, -2.7637939453125, -2.55792236328125, -2.35205078125, -2.14617919921875, -1.9403076171875, -1.73443603515625, -1.528564453125, -1.32269287109375, -1.1168212890625, -0.91094970703125, -0.705078125, -0.49920654296875, -0.2933349609375, -0.08746337890625, 0.118408203125, 0.32427978515625, 0.5301513671875, 0.73602294921875, 0.94189453125, 1.14776611328125, 1.3536376953125, 1.55950927734375, 1.765380859375, 1.97125244140625, 2.1771240234375, 2.38299560546875, 2.5888671875, 2.79473876953125, 3.0006103515625, 3.20648193359375, 3.412353515625, 3.61822509765625, 3.8240966796875, 4.02996826171875, 4.23583984375, 4.44171142578125, 4.6475830078125, 4.85345458984375, 5.059326171875, 5.26519775390625, 5.4710693359375, 5.67694091796875, 5.8828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 10.0, 6.0, 16.0, 12.0, 20.0, 28.0, 47.0, 56.0, 70.0, 84.0, 135.0, 230.0, 437.0, 867.0, 2140.0, 6702.0, 31504.0, 256544.0, 641354.0, 87403.0, 14278.0, 3832.0, 1368.0, 574.0, 310.0, 168.0, 110.0, 79.0, 41.0, 34.0, 22.0, 20.0, 16.0, 7.0, 13.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.9011077880859375, -1.840301513671875, -1.7794952392578125, -1.71868896484375, -1.6578826904296875, -1.597076416015625, -1.5362701416015625, -1.4754638671875, -1.4146575927734375, -1.353851318359375, -1.2930450439453125, -1.23223876953125, -1.1714324951171875, -1.110626220703125, -1.0498199462890625, -0.989013671875, -0.9282073974609375, -0.867401123046875, -0.8065948486328125, -0.74578857421875, -0.6849822998046875, -0.624176025390625, -0.5633697509765625, -0.5025634765625, -0.4417572021484375, -0.380950927734375, -0.3201446533203125, -0.25933837890625, -0.1985321044921875, -0.137725830078125, -0.0769195556640625, -0.01611328125, 0.0446929931640625, 0.105499267578125, 0.1663055419921875, 0.22711181640625, 0.2879180908203125, 0.348724365234375, 0.4095306396484375, 0.4703369140625, 0.5311431884765625, 0.591949462890625, 0.6527557373046875, 0.71356201171875, 0.7743682861328125, 0.835174560546875, 0.8959808349609375, 0.956787109375, 1.0175933837890625, 1.078399658203125, 1.1392059326171875, 1.20001220703125, 1.2608184814453125, 1.321624755859375, 1.3824310302734375, 1.4432373046875, 1.5040435791015625, 1.564849853515625, 1.6256561279296875, 1.68646240234375, 1.7472686767578125, 1.808074951171875, 1.8688812255859375, 1.9296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 13.0, 10.0, 15.0, 12.0, 19.0, 31.0, 33.0, 41.0, 40.0, 45.0, 50.0, 44.0, 48.0, 46.0, 57.0, 56.0, 56.0, 61.0, 34.0, 44.0, 40.0, 45.0, 22.0, 27.0, 15.0, 20.0, 13.0, 9.0, 5.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.05950927734375, -6.8416748046875, -6.62384033203125, -6.406005859375, -6.18817138671875, -5.9703369140625, -5.75250244140625, -5.53466796875, -5.31683349609375, -5.0989990234375, -4.88116455078125, -4.663330078125, -4.44549560546875, -4.2276611328125, -4.00982666015625, -3.7919921875, -3.57415771484375, -3.3563232421875, -3.13848876953125, -2.920654296875, -2.70281982421875, -2.4849853515625, -2.26715087890625, -2.04931640625, -1.83148193359375, -1.6136474609375, -1.39581298828125, -1.177978515625, -0.96014404296875, -0.7423095703125, -0.52447509765625, -0.306640625, -0.08880615234375, 0.1290283203125, 0.34686279296875, 0.564697265625, 0.78253173828125, 1.0003662109375, 1.21820068359375, 1.43603515625, 1.65386962890625, 1.8717041015625, 2.08953857421875, 2.307373046875, 2.52520751953125, 2.7430419921875, 2.96087646484375, 3.1787109375, 3.39654541015625, 3.6143798828125, 3.83221435546875, 4.050048828125, 4.26788330078125, 4.4857177734375, 4.70355224609375, 4.92138671875, 5.13922119140625, 5.3570556640625, 5.57489013671875, 5.792724609375, 6.01055908203125, 6.2283935546875, 6.44622802734375, 6.6640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 10.0, 14.0, 32.0, 46.0, 70.0, 139.0, 235.0, 429.0, 841.0, 2234.0, 7367.0, 45931.0, 708200.0, 255953.0, 19857.0, 4226.0, 1451.0, 654.0, 336.0, 184.0, 99.0, 80.0, 36.0, 21.0, 20.0, 9.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9049224853515625, -0.868438720703125, -0.8319549560546875, -0.79547119140625, -0.7589874267578125, -0.722503662109375, -0.6860198974609375, -0.6495361328125, -0.6130523681640625, -0.576568603515625, -0.5400848388671875, -0.50360107421875, -0.4671173095703125, -0.430633544921875, -0.3941497802734375, -0.357666015625, -0.3211822509765625, -0.284698486328125, -0.2482147216796875, -0.21173095703125, -0.1752471923828125, -0.138763427734375, -0.1022796630859375, -0.0657958984375, -0.0293121337890625, 0.007171630859375, 0.0436553955078125, 0.08013916015625, 0.1166229248046875, 0.153106689453125, 0.1895904541015625, 0.22607421875, 0.2625579833984375, 0.299041748046875, 0.3355255126953125, 0.37200927734375, 0.4084930419921875, 0.444976806640625, 0.4814605712890625, 0.5179443359375, 0.5544281005859375, 0.590911865234375, 0.6273956298828125, 0.66387939453125, 0.7003631591796875, 0.736846923828125, 0.7733306884765625, 0.809814453125, 0.8462982177734375, 0.882781982421875, 0.9192657470703125, 0.95574951171875, 0.9922332763671875, 1.028717041015625, 1.0652008056640625, 1.1016845703125, 1.1381683349609375, 1.174652099609375, 1.2111358642578125, 1.24761962890625, 1.2841033935546875, 1.320587158203125, 1.3570709228515625, 1.3935546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 5.0, 7.0, 10.0, 16.0, 17.0, 27.0, 36.0, 53.0, 90.0, 84.0, 129.0, 118.0, 112.0, 90.0, 47.0, 43.0, 37.0, 17.0, 15.0, 12.0, 10.0, 5.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001647472381591797, -0.00015980564057826996, -0.00015486404299736023, -0.0001499224454164505, -0.00014498084783554077, -0.00014003925025463104, -0.0001350976526737213, -0.00013015605509281158, -0.00012521445751190186, -0.00012027285993099213, -0.0001153312623500824, -0.00011038966476917267, -0.00010544806718826294, -0.00010050646960735321, -9.556487202644348e-05, -9.062327444553375e-05, -8.568167686462402e-05, -8.07400792837143e-05, -7.579848170280457e-05, -7.085688412189484e-05, -6.591528654098511e-05, -6.097368896007538e-05, -5.603209137916565e-05, -5.109049379825592e-05, -4.614889621734619e-05, -4.120729863643646e-05, -3.6265701055526733e-05, -3.1324103474617004e-05, -2.6382505893707275e-05, -2.1440908312797546e-05, -1.6499310731887817e-05, -1.1557713150978088e-05, -6.616115570068359e-06, -1.6745179891586304e-06, 3.2670795917510986e-06, 8.208677172660828e-06, 1.3150274753570557e-05, 1.8091872334480286e-05, 2.3033469915390015e-05, 2.7975067496299744e-05, 3.291666507720947e-05, 3.78582626581192e-05, 4.279986023902893e-05, 4.774145781993866e-05, 5.268305540084839e-05, 5.762465298175812e-05, 6.256625056266785e-05, 6.750784814357758e-05, 7.24494457244873e-05, 7.739104330539703e-05, 8.233264088630676e-05, 8.727423846721649e-05, 9.221583604812622e-05, 9.715743362903595e-05, 0.00010209903120994568, 0.00010704062879085541, 0.00011198222637176514, 0.00011692382395267487, 0.0001218654215335846, 0.00012680701911449432, 0.00013174861669540405, 0.00013669021427631378, 0.0001416318118572235, 0.00014657340943813324, 0.00015151500701904297]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 11.0, 14.0, 21.0, 20.0, 25.0, 34.0, 43.0, 72.0, 99.0, 144.0, 232.0, 428.0, 852.0, 1767.0, 4257.0, 12957.0, 63857.0, 557715.0, 347635.0, 41573.0, 9938.0, 3432.0, 1520.0, 767.0, 421.0, 226.0, 159.0, 95.0, 65.0, 48.0, 28.0, 15.0, 10.0, 18.0, 14.0, 9.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6748046875, -0.6487350463867188, -0.6226654052734375, -0.5965957641601562, -0.570526123046875, -0.5444564819335938, -0.5183868408203125, -0.49231719970703125, -0.46624755859375, -0.44017791748046875, -0.4141082763671875, -0.38803863525390625, -0.361968994140625, -0.33589935302734375, -0.3098297119140625, -0.28376007080078125, -0.2576904296875, -0.23162078857421875, -0.2055511474609375, -0.17948150634765625, -0.153411865234375, -0.12734222412109375, -0.1012725830078125, -0.07520294189453125, -0.04913330078125, -0.02306365966796875, 0.0030059814453125, 0.02907562255859375, 0.055145263671875, 0.08121490478515625, 0.1072845458984375, 0.13335418701171875, 0.159423828125, 0.18549346923828125, 0.2115631103515625, 0.23763275146484375, 0.263702392578125, 0.28977203369140625, 0.3158416748046875, 0.34191131591796875, 0.36798095703125, 0.39405059814453125, 0.4201202392578125, 0.44618988037109375, 0.472259521484375, 0.49832916259765625, 0.5243988037109375, 0.5504684448242188, 0.5765380859375, 0.6026077270507812, 0.6286773681640625, 0.6547470092773438, 0.680816650390625, 0.7068862915039062, 0.7329559326171875, 0.7590255737304688, 0.78509521484375, 0.8111648559570312, 0.8372344970703125, 0.8633041381835938, 0.889373779296875, 0.9154434204101562, 0.9415130615234375, 0.9675827026367188, 0.99365234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 10.0, 9.0, 7.0, 18.0, 21.0, 17.0, 29.0, 35.0, 52.0, 58.0, 82.0, 78.0, 95.0, 96.0, 68.0, 73.0, 58.0, 40.0, 35.0, 35.0, 10.0, 19.0, 11.0, 3.0, 3.0, 8.0, 8.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3925323486328125, -0.381011962890625, -0.3694915771484375, -0.35797119140625, -0.3464508056640625, -0.334930419921875, -0.3234100341796875, -0.3118896484375, -0.3003692626953125, -0.288848876953125, -0.2773284912109375, -0.26580810546875, -0.2542877197265625, -0.242767333984375, -0.2312469482421875, -0.2197265625, -0.2082061767578125, -0.196685791015625, -0.1851654052734375, -0.17364501953125, -0.1621246337890625, -0.150604248046875, -0.1390838623046875, -0.1275634765625, -0.1160430908203125, -0.104522705078125, -0.0930023193359375, -0.08148193359375, -0.0699615478515625, -0.058441162109375, -0.0469207763671875, -0.035400390625, -0.0238800048828125, -0.012359619140625, -0.0008392333984375, 0.01068115234375, 0.0222015380859375, 0.033721923828125, 0.0452423095703125, 0.0567626953125, 0.0682830810546875, 0.079803466796875, 0.0913238525390625, 0.10284423828125, 0.1143646240234375, 0.125885009765625, 0.1374053955078125, 0.14892578125, 0.1604461669921875, 0.171966552734375, 0.1834869384765625, 0.19500732421875, 0.2065277099609375, 0.218048095703125, 0.2295684814453125, 0.2410888671875, 0.2526092529296875, 0.264129638671875, 0.2756500244140625, 0.28717041015625, 0.2986907958984375, 0.310211181640625, 0.3217315673828125, 0.333251953125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 10.0, 61.0, 160.0, 378.0, 248.0, 78.0, 28.0, 11.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.317737579345703, -20.76665496826172, -20.215572357177734, -19.66448974609375, -19.113407135009766, -18.56232452392578, -18.011241912841797, -17.460159301757812, -16.909076690673828, -16.357994079589844, -15.80691146850586, -15.255828857421875, -14.70474624633789, -14.153663635253906, -13.602581977844238, -13.051499366760254, -12.500417709350586, -11.949335098266602, -11.398252487182617, -10.847169876098633, -10.296087265014648, -9.745004653930664, -9.193922996520996, -8.642840385437012, -8.091757774353027, -7.540675163269043, -6.989592552185059, -6.438510417938232, -5.887427806854248, -5.336345195770264, -4.7852630615234375, -4.234180450439453, -3.6830968856811523, -3.132014274597168, -2.5809319019317627, -2.0298495292663574, -1.478766918182373, -0.9276843070983887, -0.3766019344329834, 0.17448043823242188, 0.7255630493164062, 1.276645541191101, 1.827728033065796, 2.378810405731201, 2.9298930168151855, 3.48097562789917, 4.032057762145996, 4.5831403732299805, 5.134222984313965, 5.685305595397949, 6.236388206481934, 6.78747034072876, 7.338552951812744, 7.8896355628967285, 8.440717697143555, 8.991800308227539, 9.542882919311523, 10.093965530395508, 10.645048141479492, 11.196130752563477, 11.747213363647461, 12.298295974731445, 12.849377632141113, 13.400460243225098, 13.951542854309082]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 10.0, 7.0, 10.0, 14.0, 13.0, 17.0, 26.0, 30.0, 33.0, 26.0, 42.0, 43.0, 42.0, 41.0, 54.0, 56.0, 52.0, 65.0, 44.0, 49.0, 47.0, 37.0, 42.0, 28.0, 22.0, 33.0, 24.0, 16.0, 11.0, 7.0, 11.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.751856803894043, -15.308099746704102, -14.864343643188477, -14.420587539672852, -13.97683048248291, -13.533073425292969, -13.089317321777344, -12.645561218261719, -12.201804161071777, -11.758047103881836, -11.314291000366211, -10.870534896850586, -10.426777839660645, -9.983020782470703, -9.539264678955078, -9.095508575439453, -8.651751518249512, -8.20799446105957, -7.764238357543945, -7.320481777191162, -6.876725196838379, -6.432968616485596, -5.9892120361328125, -5.545455455780029, -5.101698875427246, -4.657942295074463, -4.21418571472168, -3.7704291343688965, -3.3266725540161133, -2.88291597366333, -2.439159393310547, -1.9954028129577637, -1.5516462326049805, -1.1078896522521973, -0.6641330718994141, -0.22037649154663086, 0.22338008880615234, 0.6671366691589355, 1.1108932495117188, 1.554649829864502, 1.9984064102172852, 2.4421629905700684, 2.8859195709228516, 3.3296761512756348, 3.773432731628418, 4.217189311981201, 4.660945892333984, 5.104702472686768, 5.548459053039551, 5.992215633392334, 6.435972213745117, 6.8797287940979, 7.323485374450684, 7.767241954803467, 8.21099853515625, 8.654754638671875, 9.098511695861816, 9.542268753051758, 9.986024856567383, 10.429780960083008, 10.87353801727295, 11.31729507446289, 11.761051177978516, 12.20480728149414, 12.648564338684082]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 8.0, 11.0, 13.0, 16.0, 29.0, 30.0, 50.0, 58.0, 78.0, 142.0, 187.0, 315.0, 499.0, 899.0, 1683.0, 3504.0, 9112.0, 31250.0, 180986.0, 3351689.0, 531582.0, 56456.0, 14892.0, 5512.0, 2422.0, 1142.0, 630.0, 363.0, 235.0, 136.0, 101.0, 66.0, 44.0, 29.0, 27.0, 14.0, 25.0, 5.0, 7.0, 10.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-3.947265625, -3.836700439453125, -3.72613525390625, -3.615570068359375, -3.5050048828125, -3.394439697265625, -3.28387451171875, -3.173309326171875, -3.062744140625, -2.952178955078125, -2.84161376953125, -2.731048583984375, -2.6204833984375, -2.509918212890625, -2.39935302734375, -2.288787841796875, -2.17822265625, -2.067657470703125, -1.95709228515625, -1.846527099609375, -1.7359619140625, -1.625396728515625, -1.51483154296875, -1.404266357421875, -1.293701171875, -1.183135986328125, -1.07257080078125, -0.962005615234375, -0.8514404296875, -0.740875244140625, -0.63031005859375, -0.519744873046875, -0.4091796875, -0.298614501953125, -0.18804931640625, -0.077484130859375, 0.0330810546875, 0.143646240234375, 0.25421142578125, 0.364776611328125, 0.475341796875, 0.585906982421875, 0.69647216796875, 0.807037353515625, 0.9176025390625, 1.028167724609375, 1.13873291015625, 1.249298095703125, 1.35986328125, 1.470428466796875, 1.58099365234375, 1.691558837890625, 1.8021240234375, 1.912689208984375, 2.02325439453125, 2.133819580078125, 2.244384765625, 2.354949951171875, 2.46551513671875, 2.576080322265625, 2.6866455078125, 2.797210693359375, 2.90777587890625, 3.018341064453125, 3.12890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 1.0, 9.0, 13.0, 14.0, 14.0, 27.0, 34.0, 43.0, 54.0, 75.0, 81.0, 83.0, 116.0, 101.0, 95.0, 62.0, 41.0, 29.0, 24.0, 23.0, 10.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.797210693359375, -3.68621826171875, -3.575225830078125, -3.4642333984375, -3.353240966796875, -3.24224853515625, -3.131256103515625, -3.020263671875, -2.909271240234375, -2.79827880859375, -2.687286376953125, -2.5762939453125, -2.465301513671875, -2.35430908203125, -2.243316650390625, -2.13232421875, -2.021331787109375, -1.91033935546875, -1.799346923828125, -1.6883544921875, -1.577362060546875, -1.46636962890625, -1.355377197265625, -1.244384765625, -1.133392333984375, -1.02239990234375, -0.911407470703125, -0.8004150390625, -0.689422607421875, -0.57843017578125, -0.467437744140625, -0.3564453125, -0.245452880859375, -0.13446044921875, -0.023468017578125, 0.0875244140625, 0.198516845703125, 0.30950927734375, 0.420501708984375, 0.531494140625, 0.642486572265625, 0.75347900390625, 0.864471435546875, 0.9754638671875, 1.086456298828125, 1.19744873046875, 1.308441162109375, 1.41943359375, 1.530426025390625, 1.64141845703125, 1.752410888671875, 1.8634033203125, 1.974395751953125, 2.08538818359375, 2.196380615234375, 2.307373046875, 2.418365478515625, 2.52935791015625, 2.640350341796875, 2.7513427734375, 2.862335205078125, 2.97332763671875, 3.084320068359375, 3.1953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 5.0, 6.0, 5.0, 17.0, 24.0, 53.0, 62.0, 133.0, 299.0, 940.0, 4331.0, 52093.0, 4009552.0, 118281.0, 6576.0, 1184.0, 381.0, 152.0, 65.0, 47.0, 30.0, 20.0, 12.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.02728271484375, -7.7733154296875, -7.51934814453125, -7.265380859375, -7.01141357421875, -6.7574462890625, -6.50347900390625, -6.24951171875, -5.99554443359375, -5.7415771484375, -5.48760986328125, -5.233642578125, -4.97967529296875, -4.7257080078125, -4.47174072265625, -4.2177734375, -3.96380615234375, -3.7098388671875, -3.45587158203125, -3.201904296875, -2.94793701171875, -2.6939697265625, -2.44000244140625, -2.18603515625, -1.93206787109375, -1.6781005859375, -1.42413330078125, -1.170166015625, -0.91619873046875, -0.6622314453125, -0.40826416015625, -0.154296875, 0.09967041015625, 0.3536376953125, 0.60760498046875, 0.861572265625, 1.11553955078125, 1.3695068359375, 1.62347412109375, 1.87744140625, 2.13140869140625, 2.3853759765625, 2.63934326171875, 2.893310546875, 3.14727783203125, 3.4012451171875, 3.65521240234375, 3.9091796875, 4.16314697265625, 4.4171142578125, 4.67108154296875, 4.925048828125, 5.17901611328125, 5.4329833984375, 5.68695068359375, 5.94091796875, 6.19488525390625, 6.4488525390625, 6.70281982421875, 6.956787109375, 7.21075439453125, 7.4647216796875, 7.71868896484375, 7.97265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 8.0, 9.0, 11.0, 22.0, 20.0, 39.0, 36.0, 84.0, 122.0, 208.0, 421.0, 1195.0, 960.0, 395.0, 188.0, 103.0, 56.0, 60.0, 48.0, 33.0, 18.0, 10.0, 6.0, 10.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0266876220703125, -0.989898681640625, -0.9531097412109375, -0.91632080078125, -0.8795318603515625, -0.842742919921875, -0.8059539794921875, -0.7691650390625, -0.7323760986328125, -0.695587158203125, -0.6587982177734375, -0.62200927734375, -0.5852203369140625, -0.548431396484375, -0.5116424560546875, -0.474853515625, -0.4380645751953125, -0.401275634765625, -0.3644866943359375, -0.32769775390625, -0.2909088134765625, -0.254119873046875, -0.2173309326171875, -0.1805419921875, -0.1437530517578125, -0.106964111328125, -0.0701751708984375, -0.03338623046875, 0.0034027099609375, 0.040191650390625, 0.0769805908203125, 0.11376953125, 0.1505584716796875, 0.187347412109375, 0.2241363525390625, 0.26092529296875, 0.2977142333984375, 0.334503173828125, 0.3712921142578125, 0.4080810546875, 0.4448699951171875, 0.481658935546875, 0.5184478759765625, 0.55523681640625, 0.5920257568359375, 0.628814697265625, 0.6656036376953125, 0.702392578125, 0.7391815185546875, 0.775970458984375, 0.8127593994140625, 0.84954833984375, 0.8863372802734375, 0.923126220703125, 0.9599151611328125, 0.9967041015625, 1.0334930419921875, 1.070281982421875, 1.1070709228515625, 1.14385986328125, 1.1806488037109375, 1.217437744140625, 1.2542266845703125, 1.291015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 7.0, 18.0, 21.0, 16.0, 28.0, 40.0, 94.0, 193.0, 196.0, 146.0, 99.0, 54.0, 26.0, 18.0, 12.0, 7.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.628277778625488, -5.443141937255859, -5.258006572723389, -5.07287073135376, -4.887734889984131, -4.702599048614502, -4.517463684082031, -4.332327842712402, -4.147192001342773, -3.9620563983917236, -3.7769205570220947, -3.591784954071045, -3.406649112701416, -3.221513509750366, -3.0363779067993164, -2.8512420654296875, -2.6661064624786377, -2.480970859527588, -2.295835018157959, -2.110699415206909, -1.9255635738372803, -1.7404279708862305, -1.5552922487258911, -1.3701565265655518, -1.1850208044052124, -0.999885082244873, -0.8147493600845337, -0.6296136975288391, -0.44447797536849976, -0.2593422532081604, -0.07420659065246582, 0.11092913150787354, 0.2960648536682129, 0.48120057582855225, 0.6663362979888916, 0.8514719605445862, 1.0366077423095703, 1.2217433452606201, 1.4068790674209595, 1.5920147895812988, 1.7771505117416382, 1.9622862339019775, 2.1474218368530273, 2.3325576782226562, 2.517693281173706, 2.702829122543335, 2.8879647254943848, 3.0731005668640137, 3.2582361698150635, 3.4433717727661133, 3.628507614135742, 3.813643217086792, 3.998779058456421, 4.183914661407471, 4.3690505027771, 4.55418586730957, 4.739321708679199, 4.924457550048828, 5.109592914581299, 5.294728755950928, 5.479864597320557, 5.6650004386901855, 5.850135803222656, 6.035271644592285, 6.220407485961914]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 7.0, 9.0, 5.0, 22.0, 20.0, 18.0, 30.0, 33.0, 46.0, 51.0, 61.0, 67.0, 67.0, 62.0, 72.0, 64.0, 57.0, 65.0, 43.0, 41.0, 35.0, 28.0, 14.0, 16.0, 19.0, 9.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.736663818359375, -3.6356585025787354, -3.5346531867980957, -3.433647871017456, -3.3326425552368164, -3.2316370010375977, -3.130631685256958, -3.0296263694763184, -2.9286210536956787, -2.827615737915039, -2.7266104221343994, -2.6256051063537598, -2.524599552154541, -2.4235944747924805, -2.3225889205932617, -2.221583604812622, -2.1205782890319824, -2.0195729732513428, -1.9185676574707031, -1.817562222480774, -1.7165569067001343, -1.6155515909194946, -1.5145461559295654, -1.4135408401489258, -1.3125355243682861, -1.2115302085876465, -1.1105248928070068, -1.0095194578170776, -0.908514142036438, -0.8075088262557983, -0.7065034508705139, -0.6054980754852295, -0.5044925212860107, -0.4034871757030487, -0.30248183012008667, -0.20147648453712463, -0.1004711389541626, 0.0005341768264770508, 0.10153955221176147, 0.2025449275970459, 0.30355024337768555, 0.4045555889606476, 0.5055609345436096, 0.606566309928894, 0.7075716257095337, 0.8085769414901733, 0.9095823168754578, 1.0105876922607422, 1.1115930080413818, 1.2125983238220215, 1.3136036396026611, 1.4146090745925903, 1.51561439037323, 1.6166197061538696, 1.7176251411437988, 1.8186304569244385, 1.9196357727050781, 2.0206410884857178, 2.1216464042663574, 2.222651720046997, 2.3236570358276367, 2.4246625900268555, 2.525667905807495, 2.6266732215881348, 2.7276785373687744]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 11.0, 17.0, 27.0, 38.0, 45.0, 81.0, 142.0, 299.0, 806.0, 3433.0, 33512.0, 869750.0, 131080.0, 7042.0, 1370.0, 392.0, 197.0, 92.0, 59.0, 27.0, 28.0, 22.0, 17.0, 13.0, 11.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6513671875, -0.6320343017578125, -0.612701416015625, -0.5933685302734375, -0.57403564453125, -0.5547027587890625, -0.535369873046875, -0.5160369873046875, -0.4967041015625, -0.4773712158203125, -0.458038330078125, -0.4387054443359375, -0.41937255859375, -0.4000396728515625, -0.380706787109375, -0.3613739013671875, -0.342041015625, -0.3227081298828125, -0.303375244140625, -0.2840423583984375, -0.26470947265625, -0.2453765869140625, -0.226043701171875, -0.2067108154296875, -0.1873779296875, -0.1680450439453125, -0.148712158203125, -0.1293792724609375, -0.11004638671875, -0.0907135009765625, -0.071380615234375, -0.0520477294921875, -0.03271484375, -0.0133819580078125, 0.005950927734375, 0.0252838134765625, 0.04461669921875, 0.0639495849609375, 0.083282470703125, 0.1026153564453125, 0.1219482421875, 0.1412811279296875, 0.160614013671875, 0.1799468994140625, 0.19927978515625, 0.2186126708984375, 0.237945556640625, 0.2572784423828125, 0.276611328125, 0.2959442138671875, 0.315277099609375, 0.3346099853515625, 0.35394287109375, 0.3732757568359375, 0.392608642578125, 0.4119415283203125, 0.4312744140625, 0.4506072998046875, 0.469940185546875, 0.4892730712890625, 0.50860595703125, 0.5279388427734375, 0.547271728515625, 0.5666046142578125, 0.5859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 2.0, 13.0, 14.0, 17.0, 23.0, 28.0, 31.0, 53.0, 54.0, 63.0, 72.0, 70.0, 92.0, 66.0, 73.0, 67.0, 56.0, 45.0, 42.0, 28.0, 14.0, 15.0, 14.0, 12.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.84375, -2.7613525390625, -2.678955078125, -2.5965576171875, -2.51416015625, -2.4317626953125, -2.349365234375, -2.2669677734375, -2.1845703125, -2.1021728515625, -2.019775390625, -1.9373779296875, -1.85498046875, -1.7725830078125, -1.690185546875, -1.6077880859375, -1.525390625, -1.4429931640625, -1.360595703125, -1.2781982421875, -1.19580078125, -1.1134033203125, -1.031005859375, -0.9486083984375, -0.8662109375, -0.7838134765625, -0.701416015625, -0.6190185546875, -0.53662109375, -0.4542236328125, -0.371826171875, -0.2894287109375, -0.20703125, -0.1246337890625, -0.042236328125, 0.0401611328125, 0.12255859375, 0.2049560546875, 0.287353515625, 0.3697509765625, 0.4521484375, 0.5345458984375, 0.616943359375, 0.6993408203125, 0.78173828125, 0.8641357421875, 0.946533203125, 1.0289306640625, 1.111328125, 1.1937255859375, 1.276123046875, 1.3585205078125, 1.44091796875, 1.5233154296875, 1.605712890625, 1.6881103515625, 1.7705078125, 1.8529052734375, 1.935302734375, 2.0177001953125, 2.10009765625, 2.1824951171875, 2.264892578125, 2.3472900390625, 2.4296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 5.0, 15.0, 15.0, 15.0, 25.0, 22.0, 30.0, 51.0, 47.0, 81.0, 118.0, 204.0, 317.0, 567.0, 1649.0, 10846.0, 121724.0, 730974.0, 163580.0, 14334.0, 2233.0, 653.0, 314.0, 177.0, 126.0, 107.0, 79.0, 50.0, 33.0, 35.0, 19.0, 21.0, 12.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2600440979003906, -0.25153350830078125, -0.24302291870117188, -0.2345123291015625, -0.22600173950195312, -0.21749114990234375, -0.20898056030273438, -0.200469970703125, -0.19195938110351562, -0.18344879150390625, -0.17493820190429688, -0.1664276123046875, -0.15791702270507812, -0.14940643310546875, -0.14089584350585938, -0.13238525390625, -0.12387466430664062, -0.11536407470703125, -0.10685348510742188, -0.0983428955078125, -0.08983230590820312, -0.08132171630859375, -0.07281112670898438, -0.064300537109375, -0.055789947509765625, -0.04727935791015625, -0.038768768310546875, -0.0302581787109375, -0.021747589111328125, -0.01323699951171875, -0.004726409912109375, 0.0037841796875, 0.012294769287109375, 0.02080535888671875, 0.029315948486328125, 0.0378265380859375, 0.046337127685546875, 0.05484771728515625, 0.06335830688476562, 0.071868896484375, 0.08037948608398438, 0.08889007568359375, 0.09740066528320312, 0.1059112548828125, 0.11442184448242188, 0.12293243408203125, 0.13144302368164062, 0.13995361328125, 0.14846420288085938, 0.15697479248046875, 0.16548538208007812, 0.1739959716796875, 0.18250656127929688, 0.19101715087890625, 0.19952774047851562, 0.208038330078125, 0.21654891967773438, 0.22505950927734375, 0.23357009887695312, 0.2420806884765625, 0.2505912780761719, 0.25910186767578125, 0.2676124572753906, 0.276123046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 9.0, 13.0, 15.0, 15.0, 15.0, 18.0, 29.0, 32.0, 35.0, 33.0, 41.0, 44.0, 33.0, 47.0, 45.0, 45.0, 46.0, 50.0, 45.0, 34.0, 33.0, 30.0, 32.0, 34.0, 30.0, 35.0, 26.0, 23.0, 19.0, 13.0, 10.0, 9.0, 14.0, 8.0, 10.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5703125, -3.466033935546875, -3.36175537109375, -3.257476806640625, -3.1531982421875, -3.048919677734375, -2.94464111328125, -2.840362548828125, -2.736083984375, -2.631805419921875, -2.52752685546875, -2.423248291015625, -2.3189697265625, -2.214691162109375, -2.11041259765625, -2.006134033203125, -1.90185546875, -1.797576904296875, -1.69329833984375, -1.589019775390625, -1.4847412109375, -1.380462646484375, -1.27618408203125, -1.171905517578125, -1.067626953125, -0.963348388671875, -0.85906982421875, -0.754791259765625, -0.6505126953125, -0.546234130859375, -0.44195556640625, -0.337677001953125, -0.2333984375, -0.129119873046875, -0.02484130859375, 0.079437255859375, 0.1837158203125, 0.287994384765625, 0.39227294921875, 0.496551513671875, 0.600830078125, 0.705108642578125, 0.80938720703125, 0.913665771484375, 1.0179443359375, 1.122222900390625, 1.22650146484375, 1.330780029296875, 1.43505859375, 1.539337158203125, 1.64361572265625, 1.747894287109375, 1.8521728515625, 1.956451416015625, 2.06072998046875, 2.165008544921875, 2.269287109375, 2.373565673828125, 2.47784423828125, 2.582122802734375, 2.6864013671875, 2.790679931640625, 2.89495849609375, 2.999237060546875, 3.103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 7.0, 5.0, 14.0, 17.0, 15.0, 26.0, 31.0, 35.0, 50.0, 85.0, 152.0, 418.0, 1526.0, 12634.0, 1009071.0, 21338.0, 2097.0, 474.0, 213.0, 99.0, 54.0, 36.0, 33.0, 19.0, 15.0, 14.0, 14.0, 11.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1253662109375, -0.12139701843261719, -0.11742782592773438, -0.11345863342285156, -0.10948944091796875, -0.10552024841308594, -0.10155105590820312, -0.09758186340332031, -0.0936126708984375, -0.08964347839355469, -0.08567428588867188, -0.08170509338378906, -0.07773590087890625, -0.07376670837402344, -0.06979751586914062, -0.06582832336425781, -0.061859130859375, -0.05788993835449219, -0.053920745849609375, -0.04995155334472656, -0.04598236083984375, -0.04201316833496094, -0.038043975830078125, -0.03407478332519531, -0.0301055908203125, -0.026136398315429688, -0.022167205810546875, -0.018198013305664062, -0.01422882080078125, -0.010259628295898438, -0.006290435791015625, -0.0023212432861328125, 0.00164794921875, 0.0056171417236328125, 0.009586334228515625, 0.013555526733398438, 0.01752471923828125, 0.021493911743164062, 0.025463104248046875, 0.029432296752929688, 0.0334014892578125, 0.03737068176269531, 0.041339874267578125, 0.04530906677246094, 0.04927825927734375, 0.05324745178222656, 0.057216644287109375, 0.06118583679199219, 0.065155029296875, 0.06912422180175781, 0.07309341430664062, 0.07706260681152344, 0.08103179931640625, 0.08500099182128906, 0.08897018432617188, 0.09293937683105469, 0.0969085693359375, 0.10087776184082031, 0.10484695434570312, 0.10881614685058594, 0.11278533935546875, 0.11675453186035156, 0.12072372436523438, 0.12469291687011719, 0.128662109375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 2.0, 6.0, 12.0, 21.0, 55.0, 154.0, 304.0, 265.0, 104.0, 39.0, 20.0, 6.0, 4.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.273653030395508e-05, -4.0685757994651794e-05, -3.863498568534851e-05, -3.658421337604523e-05, -3.453344106674194e-05, -3.248266875743866e-05, -3.0431896448135376e-05, -2.8381124138832092e-05, -2.633035182952881e-05, -2.4279579520225525e-05, -2.222880721092224e-05, -2.0178034901618958e-05, -1.8127262592315674e-05, -1.607649028301239e-05, -1.4025717973709106e-05, -1.1974945664405823e-05, -9.924173355102539e-06, -7.873401045799255e-06, -5.822628736495972e-06, -3.771856427192688e-06, -1.7210841178894043e-06, 3.296881914138794e-07, 2.380460500717163e-06, 4.431232810020447e-06, 6.4820051193237305e-06, 8.532777428627014e-06, 1.0583549737930298e-05, 1.2634322047233582e-05, 1.4685094356536865e-05, 1.673586666584015e-05, 1.8786638975143433e-05, 2.0837411284446716e-05, 2.288818359375e-05, 2.4938955903053284e-05, 2.6989728212356567e-05, 2.904050052165985e-05, 3.1091272830963135e-05, 3.314204514026642e-05, 3.51928174495697e-05, 3.7243589758872986e-05, 3.929436206817627e-05, 4.134513437747955e-05, 4.339590668678284e-05, 4.544667899608612e-05, 4.7497451305389404e-05, 4.954822361469269e-05, 5.159899592399597e-05, 5.3649768233299255e-05, 5.570054054260254e-05, 5.775131285190582e-05, 5.9802085161209106e-05, 6.185285747051239e-05, 6.390362977981567e-05, 6.595440208911896e-05, 6.800517439842224e-05, 7.005594670772552e-05, 7.210671901702881e-05, 7.415749132633209e-05, 7.620826363563538e-05, 7.825903594493866e-05, 8.030980825424194e-05, 8.236058056354523e-05, 8.441135287284851e-05, 8.64621251821518e-05, 8.851289749145508e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 8.0, 6.0, 14.0, 18.0, 33.0, 33.0, 59.0, 83.0, 126.0, 224.0, 488.0, 1280.0, 4300.0, 37176.0, 980220.0, 19190.0, 3230.0, 1020.0, 430.0, 209.0, 131.0, 80.0, 54.0, 41.0, 22.0, 27.0, 11.0, 6.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.1349029541015625, -0.129791259765625, -0.1246795654296875, -0.11956787109375, -0.1144561767578125, -0.109344482421875, -0.1042327880859375, -0.09912109375, -0.0940093994140625, -0.088897705078125, -0.0837860107421875, -0.07867431640625, -0.0735626220703125, -0.068450927734375, -0.0633392333984375, -0.0582275390625, -0.0531158447265625, -0.048004150390625, -0.0428924560546875, -0.03778076171875, -0.0326690673828125, -0.027557373046875, -0.0224456787109375, -0.017333984375, -0.0122222900390625, -0.007110595703125, -0.0019989013671875, 0.00311279296875, 0.0082244873046875, 0.013336181640625, 0.0184478759765625, 0.0235595703125, 0.0286712646484375, 0.033782958984375, 0.0388946533203125, 0.04400634765625, 0.0491180419921875, 0.054229736328125, 0.0593414306640625, 0.064453125, 0.0695648193359375, 0.074676513671875, 0.0797882080078125, 0.08489990234375, 0.0900115966796875, 0.095123291015625, 0.1002349853515625, 0.1053466796875, 0.1104583740234375, 0.115570068359375, 0.1206817626953125, 0.12579345703125, 0.1309051513671875, 0.136016845703125, 0.1411285400390625, 0.146240234375, 0.1513519287109375, 0.156463623046875, 0.1615753173828125, 0.16668701171875, 0.1717987060546875, 0.176910400390625, 0.1820220947265625, 0.1871337890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 21.0, 27.0, 37.0, 68.0, 149.0, 344.0, 160.0, 80.0, 40.0, 24.0, 17.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035858154296875, -0.03482174873352051, -0.033785343170166016, -0.03274893760681152, -0.03171253204345703, -0.03067612648010254, -0.029639720916748047, -0.028603315353393555, -0.027566909790039062, -0.02653050422668457, -0.025494098663330078, -0.024457693099975586, -0.023421287536621094, -0.0223848819732666, -0.02134847640991211, -0.020312070846557617, -0.019275665283203125, -0.018239259719848633, -0.01720285415649414, -0.01616644859313965, -0.015130043029785156, -0.014093637466430664, -0.013057231903076172, -0.01202082633972168, -0.010984420776367188, -0.009948015213012695, -0.008911609649658203, -0.007875204086303711, -0.006838798522949219, -0.0058023929595947266, -0.004765987396240234, -0.003729581832885742, -0.00269317626953125, -0.0016567707061767578, -0.0006203651428222656, 0.00041604042053222656, 0.0014524459838867188, 0.002488851547241211, 0.003525257110595703, 0.004561662673950195, 0.0055980682373046875, 0.00663447380065918, 0.007670879364013672, 0.008707284927368164, 0.009743690490722656, 0.010780096054077148, 0.01181650161743164, 0.012852907180786133, 0.013889312744140625, 0.014925718307495117, 0.01596212387084961, 0.0169985294342041, 0.018034934997558594, 0.019071340560913086, 0.020107746124267578, 0.02114415168762207, 0.022180557250976562, 0.023216962814331055, 0.024253368377685547, 0.02528977394104004, 0.02632617950439453, 0.027362585067749023, 0.028398990631103516, 0.029435396194458008, 0.0304718017578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 11.0, 16.0, 26.0, 39.0, 86.0, 240.0, 285.0, 145.0, 73.0, 30.0, 14.0, 7.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.954397201538086, -5.775512218475342, -5.596627235412598, -5.4177422523498535, -5.238857269287109, -5.059972286224365, -4.881087303161621, -4.702201843261719, -4.523317337036133, -4.344432353973389, -4.1655473709106445, -3.9866623878479004, -3.8077774047851562, -3.628892421722412, -3.450007200241089, -3.2711222171783447, -3.0922369956970215, -2.9133520126342773, -2.734467029571533, -2.555582046508789, -2.376697063446045, -2.197812080383301, -2.0189268589019775, -1.8400418758392334, -1.6611568927764893, -1.4822719097137451, -1.303386926651001, -1.1245018243789673, -0.9456168413162231, -0.766731858253479, -0.5878467559814453, -0.40896177291870117, -0.23007726669311523, -0.051192253828048706, 0.12769275903701782, 0.30657780170440674, 0.4854627847671509, 0.664347767829895, 0.8432328701019287, 1.0221178531646729, 1.201002836227417, 1.3798878192901611, 1.5587728023529053, 1.737657904624939, 1.916542887687683, 2.095427989959717, 2.274312973022461, 2.453197956085205, 2.632082939147949, 2.8109679222106934, 2.9898529052734375, 3.1687378883361816, 3.347622871398926, 3.52650785446167, 3.705393075942993, 3.8842780590057373, 4.063162803649902, 4.2420477867126465, 4.420932769775391, 4.599817752838135, 4.778702735900879, 4.957587718963623, 5.136472702026367, 5.3153581619262695, 5.494243144989014]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 13.0, 10.0, 23.0, 19.0, 25.0, 35.0, 53.0, 56.0, 67.0, 70.0, 78.0, 78.0, 79.0, 66.0, 63.0, 55.0, 39.0, 40.0, 19.0, 16.0, 24.0, 11.0, 8.0, 6.0, 10.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.8812129497528076, -2.804255485534668, -2.727297782897949, -2.6503403186798096, -2.57338285446167, -2.496425151824951, -2.4194676876068115, -2.342510223388672, -2.265552520751953, -2.1885950565338135, -2.1116373538970947, -2.034679889678955, -1.9577223062515259, -1.8807647228240967, -1.803807258605957, -1.7268496751785278, -1.6498920917510986, -1.5729345083236694, -1.4959769248962402, -1.4190194606781006, -1.3420618772506714, -1.2651042938232422, -1.1881468296051025, -1.1111892461776733, -1.0342316627502441, -0.9572740793228149, -0.8803165555000305, -0.8033590316772461, -0.7264014482498169, -0.6494438648223877, -0.5724863409996033, -0.49552881717681885, -0.41857123374938965, -0.34161368012428284, -0.264656126499176, -0.1876985728740692, -0.1107410192489624, -0.03378346562385559, 0.04317408800125122, 0.12013161182403564, 0.19708919525146484, 0.27404674887657166, 0.35100430250167847, 0.4279618561267853, 0.5049194097518921, 0.5818769931793213, 0.6588345170021057, 0.7357920408248901, 0.8127496242523193, 0.8897072076797485, 0.966664731502533, 1.0436222553253174, 1.1205798387527466, 1.1975374221801758, 1.2744948863983154, 1.3514524698257446, 1.4284100532531738, 1.505367636680603, 1.5823252201080322, 1.6592826843261719, 1.736240267753601, 1.8131978511810303, 1.89015531539917, 1.9671128988265991, 2.0440704822540283]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 4.0, 9.0, 8.0, 14.0, 16.0, 24.0, 29.0, 40.0, 60.0, 87.0, 150.0, 184.0, 284.0, 422.0, 716.0, 1164.0, 2057.0, 4036.0, 8324.0, 20756.0, 69091.0, 473409.0, 372817.0, 59832.0, 18646.0, 7658.0, 3637.0, 1979.0, 1164.0, 683.0, 407.0, 273.0, 168.0, 128.0, 80.0, 51.0, 49.0, 22.0, 22.0, 14.0, 8.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2890625, -1.2460174560546875, -1.202972412109375, -1.1599273681640625, -1.11688232421875, -1.0738372802734375, -1.030792236328125, -0.9877471923828125, -0.9447021484375, -0.9016571044921875, -0.858612060546875, -0.8155670166015625, -0.77252197265625, -0.7294769287109375, -0.686431884765625, -0.6433868408203125, -0.600341796875, -0.5572967529296875, -0.514251708984375, -0.4712066650390625, -0.42816162109375, -0.3851165771484375, -0.342071533203125, -0.2990264892578125, -0.2559814453125, -0.2129364013671875, -0.169891357421875, -0.1268463134765625, -0.08380126953125, -0.0407562255859375, 0.002288818359375, 0.0453338623046875, 0.08837890625, 0.1314239501953125, 0.174468994140625, 0.2175140380859375, 0.26055908203125, 0.3036041259765625, 0.346649169921875, 0.3896942138671875, 0.4327392578125, 0.4757843017578125, 0.518829345703125, 0.5618743896484375, 0.60491943359375, 0.6479644775390625, 0.691009521484375, 0.7340545654296875, 0.777099609375, 0.8201446533203125, 0.863189697265625, 0.9062347412109375, 0.94927978515625, 0.9923248291015625, 1.035369873046875, 1.0784149169921875, 1.1214599609375, 1.1645050048828125, 1.207550048828125, 1.2505950927734375, 1.29364013671875, 1.3366851806640625, 1.379730224609375, 1.4227752685546875, 1.4658203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 3.0, 7.0, 6.0, 10.0, 15.0, 11.0, 24.0, 24.0, 51.0, 39.0, 59.0, 74.0, 94.0, 74.0, 82.0, 80.0, 65.0, 60.0, 44.0, 44.0, 32.0, 20.0, 18.0, 14.0, 10.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.625, -6.44647216796875, -6.2679443359375, -6.08941650390625, -5.910888671875, -5.73236083984375, -5.5538330078125, -5.37530517578125, -5.19677734375, -5.01824951171875, -4.8397216796875, -4.66119384765625, -4.482666015625, -4.30413818359375, -4.1256103515625, -3.94708251953125, -3.7685546875, -3.59002685546875, -3.4114990234375, -3.23297119140625, -3.054443359375, -2.87591552734375, -2.6973876953125, -2.51885986328125, -2.34033203125, -2.16180419921875, -1.9832763671875, -1.80474853515625, -1.626220703125, -1.44769287109375, -1.2691650390625, -1.09063720703125, -0.912109375, -0.73358154296875, -0.5550537109375, -0.37652587890625, -0.197998046875, -0.01947021484375, 0.1590576171875, 0.33758544921875, 0.51611328125, 0.69464111328125, 0.8731689453125, 1.05169677734375, 1.230224609375, 1.40875244140625, 1.5872802734375, 1.76580810546875, 1.9443359375, 2.12286376953125, 2.3013916015625, 2.47991943359375, 2.658447265625, 2.83697509765625, 3.0155029296875, 3.19403076171875, 3.37255859375, 3.55108642578125, 3.7296142578125, 3.90814208984375, 4.086669921875, 4.26519775390625, 4.4437255859375, 4.62225341796875, 4.80078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 15.0, 31.0, 18.0, 38.0, 80.0, 155.0, 317.0, 1013.0, 4156.0, 46041.0, 957639.0, 33833.0, 3596.0, 929.0, 327.0, 148.0, 81.0, 50.0, 21.0, 20.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2840576171875, -4.169677734375, -4.0552978515625, -3.94091796875, -3.8265380859375, -3.712158203125, -3.5977783203125, -3.4833984375, -3.3690185546875, -3.254638671875, -3.1402587890625, -3.02587890625, -2.9114990234375, -2.797119140625, -2.6827392578125, -2.568359375, -2.4539794921875, -2.339599609375, -2.2252197265625, -2.11083984375, -1.9964599609375, -1.882080078125, -1.7677001953125, -1.6533203125, -1.5389404296875, -1.424560546875, -1.3101806640625, -1.19580078125, -1.0814208984375, -0.967041015625, -0.8526611328125, -0.73828125, -0.6239013671875, -0.509521484375, -0.3951416015625, -0.28076171875, -0.1663818359375, -0.052001953125, 0.0623779296875, 0.1767578125, 0.2911376953125, 0.405517578125, 0.5198974609375, 0.63427734375, 0.7486572265625, 0.863037109375, 0.9774169921875, 1.091796875, 1.2061767578125, 1.320556640625, 1.4349365234375, 1.54931640625, 1.6636962890625, 1.778076171875, 1.8924560546875, 2.0068359375, 2.1212158203125, 2.235595703125, 2.3499755859375, 2.46435546875, 2.5787353515625, 2.693115234375, 2.8074951171875, 2.921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 10.0, 5.0, 11.0, 7.0, 15.0, 21.0, 15.0, 34.0, 30.0, 38.0, 44.0, 50.0, 45.0, 51.0, 60.0, 59.0, 61.0, 55.0, 59.0, 57.0, 39.0, 43.0, 30.0, 31.0, 31.0, 29.0, 14.0, 13.0, 15.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-8.5625, -8.357177734375, -8.15185546875, -7.946533203125, -7.7412109375, -7.535888671875, -7.33056640625, -7.125244140625, -6.919921875, -6.714599609375, -6.50927734375, -6.303955078125, -6.0986328125, -5.893310546875, -5.68798828125, -5.482666015625, -5.27734375, -5.072021484375, -4.86669921875, -4.661376953125, -4.4560546875, -4.250732421875, -4.04541015625, -3.840087890625, -3.634765625, -3.429443359375, -3.22412109375, -3.018798828125, -2.8134765625, -2.608154296875, -2.40283203125, -2.197509765625, -1.9921875, -1.786865234375, -1.58154296875, -1.376220703125, -1.1708984375, -0.965576171875, -0.76025390625, -0.554931640625, -0.349609375, -0.144287109375, 0.06103515625, 0.266357421875, 0.4716796875, 0.677001953125, 0.88232421875, 1.087646484375, 1.29296875, 1.498291015625, 1.70361328125, 1.908935546875, 2.1142578125, 2.319580078125, 2.52490234375, 2.730224609375, 2.935546875, 3.140869140625, 3.34619140625, 3.551513671875, 3.7568359375, 3.962158203125, 4.16748046875, 4.372802734375, 4.578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 8.0, 7.0, 16.0, 16.0, 34.0, 63.0, 88.0, 218.0, 497.0, 1613.0, 7467.0, 102176.0, 897916.0, 32676.0, 3981.0, 1044.0, 378.0, 153.0, 86.0, 31.0, 26.0, 18.0, 7.0, 8.0, 2.0, 7.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.5665435791015625, -1.525665283203125, -1.4847869873046875, -1.44390869140625, -1.4030303955078125, -1.362152099609375, -1.3212738037109375, -1.2803955078125, -1.2395172119140625, -1.198638916015625, -1.1577606201171875, -1.11688232421875, -1.0760040283203125, -1.035125732421875, -0.9942474365234375, -0.953369140625, -0.9124908447265625, -0.871612548828125, -0.8307342529296875, -0.78985595703125, -0.7489776611328125, -0.708099365234375, -0.6672210693359375, -0.6263427734375, -0.5854644775390625, -0.544586181640625, -0.5037078857421875, -0.46282958984375, -0.4219512939453125, -0.381072998046875, -0.3401947021484375, -0.29931640625, -0.2584381103515625, -0.217559814453125, -0.1766815185546875, -0.13580322265625, -0.0949249267578125, -0.054046630859375, -0.0131683349609375, 0.0277099609375, 0.0685882568359375, 0.109466552734375, 0.1503448486328125, 0.19122314453125, 0.2321014404296875, 0.272979736328125, 0.3138580322265625, 0.354736328125, 0.3956146240234375, 0.436492919921875, 0.4773712158203125, 0.51824951171875, 0.5591278076171875, 0.600006103515625, 0.6408843994140625, 0.6817626953125, 0.7226409912109375, 0.763519287109375, 0.8043975830078125, 0.84527587890625, 0.8861541748046875, 0.927032470703125, 0.9679107666015625, 1.0087890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 9.0, 15.0, 19.0, 21.0, 35.0, 49.0, 88.0, 151.0, 285.0, 95.0, 67.0, 49.0, 36.0, 26.0, 8.0, 6.0, 8.0, 11.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.801650255918503e-05, -8.370541036128998e-05, -7.939431816339493e-05, -7.508322596549988e-05, -7.077213376760483e-05, -6.646104156970978e-05, -6.214994937181473e-05, -5.783885717391968e-05, -5.352776497602463e-05, -4.921667277812958e-05, -4.490558058023453e-05, -4.059448838233948e-05, -3.628339618444443e-05, -3.197230398654938e-05, -2.7661211788654327e-05, -2.3350119590759277e-05, -1.9039027392864227e-05, -1.4727935194969177e-05, -1.0416842997074127e-05, -6.105750799179077e-06, -1.794658601284027e-06, 2.516433596611023e-06, 6.827525794506073e-06, 1.1138617992401123e-05, 1.5449710190296173e-05, 1.9760802388191223e-05, 2.4071894586086273e-05, 2.8382986783981323e-05, 3.269407898187637e-05, 3.700517117977142e-05, 4.1316263377666473e-05, 4.5627355575561523e-05, 4.9938447773456573e-05, 5.4249539971351624e-05, 5.8560632169246674e-05, 6.287172436714172e-05, 6.718281656503677e-05, 7.149390876293182e-05, 7.580500096082687e-05, 8.011609315872192e-05, 8.442718535661697e-05, 8.873827755451202e-05, 9.304936975240707e-05, 9.736046195030212e-05, 0.00010167155414819717, 0.00010598264634609222, 0.00011029373854398727, 0.00011460483074188232, 0.00011891592293977737, 0.00012322701513767242, 0.00012753810733556747, 0.00013184919953346252, 0.00013616029173135757, 0.00014047138392925262, 0.00014478247612714767, 0.00014909356832504272, 0.00015340466052293777, 0.00015771575272083282, 0.00016202684491872787, 0.00016633793711662292, 0.00017064902931451797, 0.00017496012151241302, 0.00017927121371030807, 0.00018358230590820312]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 10.0, 13.0, 15.0, 19.0, 28.0, 35.0, 89.0, 132.0, 263.0, 530.0, 1250.0, 3825.0, 15934.0, 136778.0, 819117.0, 57081.0, 9086.0, 2514.0, 885.0, 397.0, 192.0, 122.0, 64.0, 41.0, 35.0, 12.0, 19.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.9699935913085938, -0.9399871826171875, -0.9099807739257812, -0.879974365234375, -0.8499679565429688, -0.8199615478515625, -0.7899551391601562, -0.75994873046875, -0.7299423217773438, -0.6999359130859375, -0.6699295043945312, -0.639923095703125, -0.6099166870117188, -0.5799102783203125, -0.5499038696289062, -0.5198974609375, -0.48989105224609375, -0.4598846435546875, -0.42987823486328125, -0.399871826171875, -0.36986541748046875, -0.3398590087890625, -0.30985260009765625, -0.27984619140625, -0.24983978271484375, -0.2198333740234375, -0.18982696533203125, -0.159820556640625, -0.12981414794921875, -0.0998077392578125, -0.06980133056640625, -0.039794921875, -0.00978851318359375, 0.0202178955078125, 0.05022430419921875, 0.080230712890625, 0.11023712158203125, 0.1402435302734375, 0.17024993896484375, 0.20025634765625, 0.23026275634765625, 0.2602691650390625, 0.29027557373046875, 0.320281982421875, 0.35028839111328125, 0.3802947998046875, 0.41030120849609375, 0.4403076171875, 0.47031402587890625, 0.5003204345703125, 0.5303268432617188, 0.560333251953125, 0.5903396606445312, 0.6203460693359375, 0.6503524780273438, 0.68035888671875, 0.7103652954101562, 0.7403717041015625, 0.7703781127929688, 0.800384521484375, 0.8303909301757812, 0.8603973388671875, 0.8904037475585938, 0.92041015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 12.0, 7.0, 9.0, 14.0, 21.0, 27.0, 42.0, 55.0, 75.0, 156.0, 249.0, 90.0, 64.0, 28.0, 38.0, 22.0, 17.0, 15.0, 14.0, 13.0, 6.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.467041015625, -0.45481109619140625, -0.4425811767578125, -0.43035125732421875, -0.418121337890625, -0.40589141845703125, -0.3936614990234375, -0.38143157958984375, -0.36920166015625, -0.35697174072265625, -0.3447418212890625, -0.33251190185546875, -0.320281982421875, -0.30805206298828125, -0.2958221435546875, -0.28359222412109375, -0.2713623046875, -0.25913238525390625, -0.2469024658203125, -0.23467254638671875, -0.222442626953125, -0.21021270751953125, -0.1979827880859375, -0.18575286865234375, -0.17352294921875, -0.16129302978515625, -0.1490631103515625, -0.13683319091796875, -0.124603271484375, -0.11237335205078125, -0.1001434326171875, -0.08791351318359375, -0.07568359375, -0.06345367431640625, -0.0512237548828125, -0.03899383544921875, -0.026763916015625, -0.01453399658203125, -0.0023040771484375, 0.00992584228515625, 0.02215576171875, 0.03438568115234375, 0.0466156005859375, 0.05884552001953125, 0.071075439453125, 0.08330535888671875, 0.0955352783203125, 0.10776519775390625, 0.1199951171875, 0.13222503662109375, 0.1444549560546875, 0.15668487548828125, 0.168914794921875, 0.18114471435546875, 0.1933746337890625, 0.20560455322265625, 0.21783447265625, 0.23006439208984375, 0.2422943115234375, 0.25452423095703125, 0.266754150390625, 0.27898406982421875, 0.2912139892578125, 0.30344390869140625, 0.315673828125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 1.0, 8.0, 18.0, 27.0, 77.0, 273.0, 363.0, 138.0, 58.0, 20.0, 9.0, 0.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.589208126068115, -7.057093143463135, -6.5249786376953125, -5.992863655090332, -5.460748672485352, -4.928633689880371, -4.396518707275391, -3.8644042015075684, -3.332289218902588, -2.8001742362976074, -2.268059492111206, -1.7359446287155151, -1.2038297653198242, -0.6717147827148438, -0.13960003852844238, 0.392514705657959, 0.9246296882629395, 1.4567445516586304, 1.9888594150543213, 2.5209741592407227, 3.053089141845703, 3.5852041244506836, 4.117319107055664, 4.649433612823486, 5.181548595428467, 5.713663578033447, 6.2457780838012695, 6.77789306640625, 7.3100080490112305, 7.842123031616211, 8.374238014221191, 8.906352996826172, 9.438467025756836, 9.970582008361816, 10.502696990966797, 11.034811973571777, 11.566926956176758, 12.099040985107422, 12.631155967712402, 13.163270950317383, 13.695385932922363, 14.227500915527344, 14.759615898132324, 15.291730880737305, 15.823844909667969, 16.355960845947266, 16.88807487487793, 17.420188903808594, 17.95230484008789, 18.484418869018555, 19.01653480529785, 19.548648834228516, 20.080764770507812, 20.612878799438477, 21.144994735717773, 21.677108764648438, 22.209224700927734, 22.7413387298584, 23.273454666137695, 23.80556869506836, 24.337684631347656, 24.86979866027832, 25.401914596557617, 25.93402862548828, 26.466142654418945]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 16.0, 16.0, 23.0, 25.0, 39.0, 48.0, 54.0, 76.0, 70.0, 63.0, 66.0, 72.0, 60.0, 65.0, 64.0, 45.0, 40.0, 32.0, 26.0, 19.0, 22.0, 18.0, 10.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.230571746826172, -16.753639221191406, -16.276704788208008, -15.799771308898926, -15.322837829589844, -14.845904350280762, -14.36897087097168, -13.892038345336914, -13.415103912353516, -12.938170433044434, -12.461236953735352, -11.98430347442627, -11.507369995117188, -11.030436515808105, -10.553503036499023, -10.076570510864258, -9.599637031555176, -9.122703552246094, -8.645770072937012, -8.16883659362793, -7.691903114318848, -7.214969635009766, -6.738036632537842, -6.26110315322876, -5.784169673919678, -5.307236194610596, -4.830302715301514, -4.35336971282959, -3.8764359951019287, -3.3995025157928467, -2.9225692749023438, -2.4456357955932617, -1.9687023162841797, -1.4917688369750977, -1.0148354768753052, -0.5379021167755127, -0.060968637466430664, 0.41596484184265137, 0.8928980827331543, 1.3698315620422363, 1.8467650413513184, 2.3236985206604004, 2.8006319999694824, 3.2775652408599854, 3.7544987201690674, 4.23143196105957, 4.708365440368652, 5.185298919677734, 5.662232398986816, 6.139165878295898, 6.6160993576049805, 7.0930328369140625, 7.5699663162231445, 8.046899795532227, 8.523832321166992, 9.00076675415039, 9.477699279785156, 9.954632759094238, 10.43156623840332, 10.908499717712402, 11.385433197021484, 11.862366676330566, 12.339300155639648, 12.816232681274414, 13.293167114257812]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 12.0, 27.0, 34.0, 58.0, 154.0, 284.0, 757.0, 2727.0, 17440.0, 675521.0, 3461447.0, 30030.0, 3997.0, 1056.0, 372.0, 155.0, 83.0, 43.0, 35.0, 12.0, 13.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82421875, -7.5948486328125, -7.365478515625, -7.1361083984375, -6.90673828125, -6.6773681640625, -6.447998046875, -6.2186279296875, -5.9892578125, -5.7598876953125, -5.530517578125, -5.3011474609375, -5.07177734375, -4.8424072265625, -4.613037109375, -4.3836669921875, -4.154296875, -3.9249267578125, -3.695556640625, -3.4661865234375, -3.23681640625, -3.0074462890625, -2.778076171875, -2.5487060546875, -2.3193359375, -2.0899658203125, -1.860595703125, -1.6312255859375, -1.40185546875, -1.1724853515625, -0.943115234375, -0.7137451171875, -0.484375, -0.2550048828125, -0.025634765625, 0.2037353515625, 0.43310546875, 0.6624755859375, 0.891845703125, 1.1212158203125, 1.3505859375, 1.5799560546875, 1.809326171875, 2.0386962890625, 2.26806640625, 2.4974365234375, 2.726806640625, 2.9561767578125, 3.185546875, 3.4149169921875, 3.644287109375, 3.8736572265625, 4.10302734375, 4.3323974609375, 4.561767578125, 4.7911376953125, 5.0205078125, 5.2498779296875, 5.479248046875, 5.7086181640625, 5.93798828125, 6.1673583984375, 6.396728515625, 6.6260986328125, 6.85546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 11.0, 12.0, 19.0, 14.0, 30.0, 38.0, 66.0, 77.0, 105.0, 110.0, 118.0, 99.0, 86.0, 62.0, 31.0, 27.0, 21.0, 16.0, 9.0, 10.0, 11.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.921875, -3.806793212890625, -3.69171142578125, -3.576629638671875, -3.4615478515625, -3.346466064453125, -3.23138427734375, -3.116302490234375, -3.001220703125, -2.886138916015625, -2.77105712890625, -2.655975341796875, -2.5408935546875, -2.425811767578125, -2.31072998046875, -2.195648193359375, -2.08056640625, -1.965484619140625, -1.85040283203125, -1.735321044921875, -1.6202392578125, -1.505157470703125, -1.39007568359375, -1.274993896484375, -1.159912109375, -1.044830322265625, -0.92974853515625, -0.814666748046875, -0.6995849609375, -0.584503173828125, -0.46942138671875, -0.354339599609375, -0.2392578125, -0.124176025390625, -0.00909423828125, 0.105987548828125, 0.2210693359375, 0.336151123046875, 0.45123291015625, 0.566314697265625, 0.681396484375, 0.796478271484375, 0.91156005859375, 1.026641845703125, 1.1417236328125, 1.256805419921875, 1.37188720703125, 1.486968994140625, 1.60205078125, 1.717132568359375, 1.83221435546875, 1.947296142578125, 2.0623779296875, 2.177459716796875, 2.29254150390625, 2.407623291015625, 2.522705078125, 2.637786865234375, 2.75286865234375, 2.867950439453125, 2.9830322265625, 3.098114013671875, 3.21319580078125, 3.328277587890625, 3.443359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 21.0, 40.0, 65.0, 129.0, 286.0, 827.0, 3805.0, 53785.0, 4045245.0, 83654.0, 4847.0, 947.0, 296.0, 137.0, 65.0, 33.0, 27.0, 10.0, 5.0, 9.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0546875, -10.7821044921875, -10.509521484375, -10.2369384765625, -9.96435546875, -9.6917724609375, -9.419189453125, -9.1466064453125, -8.8740234375, -8.6014404296875, -8.328857421875, -8.0562744140625, -7.78369140625, -7.5111083984375, -7.238525390625, -6.9659423828125, -6.693359375, -6.4207763671875, -6.148193359375, -5.8756103515625, -5.60302734375, -5.3304443359375, -5.057861328125, -4.7852783203125, -4.5126953125, -4.2401123046875, -3.967529296875, -3.6949462890625, -3.42236328125, -3.1497802734375, -2.877197265625, -2.6046142578125, -2.33203125, -2.0594482421875, -1.786865234375, -1.5142822265625, -1.24169921875, -0.9691162109375, -0.696533203125, -0.4239501953125, -0.1513671875, 0.1212158203125, 0.393798828125, 0.6663818359375, 0.93896484375, 1.2115478515625, 1.484130859375, 1.7567138671875, 2.029296875, 2.3018798828125, 2.574462890625, 2.8470458984375, 3.11962890625, 3.3922119140625, 3.664794921875, 3.9373779296875, 4.2099609375, 4.4825439453125, 4.755126953125, 5.0277099609375, 5.30029296875, 5.5728759765625, 5.845458984375, 6.1180419921875, 6.390625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 10.0, 9.0, 16.0, 18.0, 21.0, 32.0, 53.0, 74.0, 119.0, 145.0, 289.0, 591.0, 1315.0, 559.0, 303.0, 142.0, 117.0, 63.0, 48.0, 39.0, 28.0, 18.0, 11.0, 10.0, 11.0, 7.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8154296875, -0.7846832275390625, -0.753936767578125, -0.7231903076171875, -0.69244384765625, -0.6616973876953125, -0.630950927734375, -0.6002044677734375, -0.5694580078125, -0.5387115478515625, -0.507965087890625, -0.4772186279296875, -0.44647216796875, -0.4157257080078125, -0.384979248046875, -0.3542327880859375, -0.323486328125, -0.2927398681640625, -0.261993408203125, -0.2312469482421875, -0.20050048828125, -0.1697540283203125, -0.139007568359375, -0.1082611083984375, -0.0775146484375, -0.0467681884765625, -0.016021728515625, 0.0147247314453125, 0.04547119140625, 0.0762176513671875, 0.106964111328125, 0.1377105712890625, 0.16845703125, 0.1992034912109375, 0.229949951171875, 0.2606964111328125, 0.29144287109375, 0.3221893310546875, 0.352935791015625, 0.3836822509765625, 0.4144287109375, 0.4451751708984375, 0.475921630859375, 0.5066680908203125, 0.53741455078125, 0.5681610107421875, 0.598907470703125, 0.6296539306640625, 0.660400390625, 0.6911468505859375, 0.721893310546875, 0.7526397705078125, 0.78338623046875, 0.8141326904296875, 0.844879150390625, 0.8756256103515625, 0.9063720703125, 0.9371185302734375, 0.967864990234375, 0.9986114501953125, 1.02935791015625, 1.0601043701171875, 1.090850830078125, 1.1215972900390625, 1.15234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 11.0, 8.0, 22.0, 40.0, 52.0, 94.0, 105.0, 141.0, 168.0, 103.0, 91.0, 43.0, 30.0, 25.0, 11.0, 7.0, 8.0, 6.0, 3.0, 0.0, 7.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.091717720031738, -4.932479381561279, -4.77324104309082, -4.614002704620361, -4.454764366149902, -4.295525550842285, -4.136287689208984, -3.977048873901367, -3.817810535430908, -3.658572196960449, -3.4993338584899902, -3.3400955200195312, -3.180856943130493, -3.021618604660034, -2.862380266189575, -2.703141689300537, -2.5439035892486572, -2.3846652507781982, -2.2254269123077393, -2.066188335418701, -1.9069499969482422, -1.7477116584777832, -1.5884733200073242, -1.4292348623275757, -1.2699965238571167, -1.1107581853866577, -0.9515197277069092, -0.7922813892364502, -0.6330429911613464, -0.4738045930862427, -0.3145662546157837, -0.15532779693603516, 0.003910541534423828, 0.1631489247083664, 0.32238730788230896, 0.48162567615509033, 0.6408640742301941, 0.8001024723052979, 0.9593408107757568, 1.1185792684555054, 1.2778176069259644, 1.4370559453964233, 1.5962944030761719, 1.7555327415466309, 1.9147710800170898, 2.074009418487549, 2.233247756958008, 2.392486333847046, 2.551724672317505, 2.710963010787964, 2.870201349258423, 3.029439926147461, 3.18867826461792, 3.347916603088379, 3.507154941558838, 3.666393280029297, 3.825631618499756, 3.984869956970215, 4.144108295440674, 4.303346633911133, 4.462584972381592, 4.621823310852051, 4.781062126159668, 4.940300464630127, 5.099538803100586]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 15.0, 18.0, 22.0, 36.0, 37.0, 54.0, 54.0, 61.0, 68.0, 74.0, 76.0, 97.0, 76.0, 65.0, 47.0, 36.0, 33.0, 22.0, 13.0, 20.0, 13.0, 11.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.7531285285949707, -3.6427433490753174, -3.532357931137085, -3.4219727516174316, -3.311587333679199, -3.201202154159546, -3.0908169746398926, -2.98043155670166, -2.8700461387634277, -2.7596609592437744, -2.649275541305542, -2.5388903617858887, -2.4285049438476562, -2.318119764328003, -2.2077345848083496, -2.097349166870117, -1.9869639873504639, -1.876578688621521, -1.7661933898925781, -1.6558082103729248, -1.5454227924346924, -1.435037612915039, -1.3246523141860962, -1.2142670154571533, -1.1038817167282104, -0.9934964179992676, -0.8831111192703247, -0.7727258801460266, -0.6623405814170837, -0.5519552826881409, -0.4415700435638428, -0.3311847448348999, -0.22079920768737793, -0.11041392385959625, -2.8640031814575195e-05, 0.11035662889480591, 0.22074192762374878, 0.33112722635269165, 0.44151246547698975, 0.5518977642059326, 0.6622830629348755, 0.7726683616638184, 0.8830536603927612, 0.9934388995170593, 1.1038241386413574, 1.2142095565795898, 1.3245947360992432, 1.434980034828186, 1.545365333557129, 1.6557506322860718, 1.7661359310150146, 1.876521110534668, 1.9869065284729004, 2.0972917079925537, 2.207676887512207, 2.3180623054504395, 2.428447723388672, 2.538832902908325, 2.6492183208465576, 2.759603500366211, 2.8699889183044434, 2.9803740978240967, 3.09075927734375, 3.2011446952819824, 3.3115298748016357]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 7.0, 13.0, 22.0, 18.0, 24.0, 53.0, 85.0, 103.0, 178.0, 313.0, 609.0, 1403.0, 4541.0, 20745.0, 343073.0, 637205.0, 31047.0, 5651.0, 1760.0, 754.0, 373.0, 210.0, 121.0, 64.0, 51.0, 36.0, 23.0, 16.0, 9.0, 10.0, 3.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.45671844482421875, -0.4424896240234375, -0.42826080322265625, -0.414031982421875, -0.39980316162109375, -0.3855743408203125, -0.37134552001953125, -0.35711669921875, -0.34288787841796875, -0.3286590576171875, -0.31443023681640625, -0.300201416015625, -0.28597259521484375, -0.2717437744140625, -0.25751495361328125, -0.2432861328125, -0.22905731201171875, -0.2148284912109375, -0.20059967041015625, -0.186370849609375, -0.17214202880859375, -0.1579132080078125, -0.14368438720703125, -0.12945556640625, -0.11522674560546875, -0.1009979248046875, -0.08676910400390625, -0.072540283203125, -0.05831146240234375, -0.0440826416015625, -0.02985382080078125, -0.015625, -0.00139617919921875, 0.0128326416015625, 0.02706146240234375, 0.041290283203125, 0.05551910400390625, 0.0697479248046875, 0.08397674560546875, 0.09820556640625, 0.11243438720703125, 0.1266632080078125, 0.14089202880859375, 0.155120849609375, 0.16934967041015625, 0.1835784912109375, 0.19780731201171875, 0.2120361328125, 0.22626495361328125, 0.2404937744140625, 0.25472259521484375, 0.268951416015625, 0.28318023681640625, 0.2974090576171875, 0.31163787841796875, 0.32586669921875, 0.34009552001953125, 0.3543243408203125, 0.36855316162109375, 0.382781982421875, 0.39701080322265625, 0.4112396240234375, 0.42546844482421875, 0.439697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 9.0, 12.0, 26.0, 24.0, 44.0, 59.0, 72.0, 78.0, 92.0, 117.0, 100.0, 93.0, 68.0, 51.0, 46.0, 22.0, 14.0, 13.0, 11.0, 9.0, 11.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.811981201171875, -2.71380615234375, -2.615631103515625, -2.5174560546875, -2.419281005859375, -2.32110595703125, -2.222930908203125, -2.124755859375, -2.026580810546875, -1.92840576171875, -1.830230712890625, -1.7320556640625, -1.633880615234375, -1.53570556640625, -1.437530517578125, -1.33935546875, -1.241180419921875, -1.14300537109375, -1.044830322265625, -0.9466552734375, -0.848480224609375, -0.75030517578125, -0.652130126953125, -0.553955078125, -0.455780029296875, -0.35760498046875, -0.259429931640625, -0.1612548828125, -0.063079833984375, 0.03509521484375, 0.133270263671875, 0.2314453125, 0.329620361328125, 0.42779541015625, 0.525970458984375, 0.6241455078125, 0.722320556640625, 0.82049560546875, 0.918670654296875, 1.016845703125, 1.115020751953125, 1.21319580078125, 1.311370849609375, 1.4095458984375, 1.507720947265625, 1.60589599609375, 1.704071044921875, 1.80224609375, 1.900421142578125, 1.99859619140625, 2.096771240234375, 2.1949462890625, 2.293121337890625, 2.39129638671875, 2.489471435546875, 2.587646484375, 2.685821533203125, 2.78399658203125, 2.882171630859375, 2.9803466796875, 3.078521728515625, 3.17669677734375, 3.274871826171875, 3.373046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 15.0, 18.0, 24.0, 32.0, 48.0, 48.0, 59.0, 101.0, 159.0, 248.0, 470.0, 1520.0, 13970.0, 567435.0, 451236.0, 10684.0, 1297.0, 456.0, 202.0, 130.0, 93.0, 84.0, 48.0, 38.0, 22.0, 19.0, 15.0, 12.0, 8.0, 8.0, 7.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4151115417480469, -0.40077972412109375, -0.3864479064941406, -0.3721160888671875, -0.3577842712402344, -0.34345245361328125, -0.3291206359863281, -0.314788818359375, -0.3004570007324219, -0.28612518310546875, -0.2717933654785156, -0.2574615478515625, -0.24312973022460938, -0.22879791259765625, -0.21446609497070312, -0.20013427734375, -0.18580245971679688, -0.17147064208984375, -0.15713882446289062, -0.1428070068359375, -0.12847518920898438, -0.11414337158203125, -0.09981155395507812, -0.085479736328125, -0.07114791870117188, -0.05681610107421875, -0.042484283447265625, -0.0281524658203125, -0.013820648193359375, 0.00051116943359375, 0.014842987060546875, 0.0291748046875, 0.043506622314453125, 0.05783843994140625, 0.07217025756835938, 0.0865020751953125, 0.10083389282226562, 0.11516571044921875, 0.12949752807617188, 0.143829345703125, 0.15816116333007812, 0.17249298095703125, 0.18682479858398438, 0.2011566162109375, 0.21548843383789062, 0.22982025146484375, 0.24415206909179688, 0.25848388671875, 0.2728157043457031, 0.28714752197265625, 0.3014793395996094, 0.3158111572265625, 0.3301429748535156, 0.34447479248046875, 0.3588066101074219, 0.373138427734375, 0.3874702453613281, 0.40180206298828125, 0.4161338806152344, 0.4304656982421875, 0.4447975158691406, 0.45912933349609375, 0.4734611511230469, 0.48779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 1.0, 5.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 12.0, 7.0, 7.0, 15.0, 24.0, 27.0, 25.0, 21.0, 30.0, 33.0, 30.0, 34.0, 31.0, 32.0, 42.0, 45.0, 40.0, 44.0, 46.0, 41.0, 40.0, 45.0, 37.0, 35.0, 20.0, 24.0, 24.0, 26.0, 17.0, 17.0, 22.0, 13.0, 11.0, 7.0, 8.0, 4.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.7933349609375, -2.701904296875, -2.6104736328125, -2.51904296875, -2.4276123046875, -2.336181640625, -2.2447509765625, -2.1533203125, -2.0618896484375, -1.970458984375, -1.8790283203125, -1.78759765625, -1.6961669921875, -1.604736328125, -1.5133056640625, -1.421875, -1.3304443359375, -1.239013671875, -1.1475830078125, -1.05615234375, -0.9647216796875, -0.873291015625, -0.7818603515625, -0.6904296875, -0.5989990234375, -0.507568359375, -0.4161376953125, -0.32470703125, -0.2332763671875, -0.141845703125, -0.0504150390625, 0.041015625, 0.1324462890625, 0.223876953125, 0.3153076171875, 0.40673828125, 0.4981689453125, 0.589599609375, 0.6810302734375, 0.7724609375, 0.8638916015625, 0.955322265625, 1.0467529296875, 1.13818359375, 1.2296142578125, 1.321044921875, 1.4124755859375, 1.50390625, 1.5953369140625, 1.686767578125, 1.7781982421875, 1.86962890625, 1.9610595703125, 2.052490234375, 2.1439208984375, 2.2353515625, 2.3267822265625, 2.418212890625, 2.5096435546875, 2.60107421875, 2.6925048828125, 2.783935546875, 2.8753662109375, 2.966796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 11.0, 17.0, 24.0, 53.0, 163.0, 471.0, 2773.0, 1041627.0, 2813.0, 388.0, 100.0, 43.0, 29.0, 14.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.30068206787109375, -0.2878875732421875, -0.27509307861328125, -0.262298583984375, -0.24950408935546875, -0.2367095947265625, -0.22391510009765625, -0.21112060546875, -0.19832611083984375, -0.1855316162109375, -0.17273712158203125, -0.159942626953125, -0.14714813232421875, -0.1343536376953125, -0.12155914306640625, -0.1087646484375, -0.09597015380859375, -0.0831756591796875, -0.07038116455078125, -0.057586669921875, -0.04479217529296875, -0.0319976806640625, -0.01920318603515625, -0.00640869140625, 0.00638580322265625, 0.0191802978515625, 0.03197479248046875, 0.044769287109375, 0.05756378173828125, 0.0703582763671875, 0.08315277099609375, 0.095947265625, 0.10874176025390625, 0.1215362548828125, 0.13433074951171875, 0.147125244140625, 0.15991973876953125, 0.1727142333984375, 0.18550872802734375, 0.19830322265625, 0.21109771728515625, 0.2238922119140625, 0.23668670654296875, 0.249481201171875, 0.26227569580078125, 0.2750701904296875, 0.28786468505859375, 0.3006591796875, 0.31345367431640625, 0.3262481689453125, 0.33904266357421875, 0.351837158203125, 0.36463165283203125, 0.3774261474609375, 0.39022064208984375, 0.40301513671875, 0.41580963134765625, 0.4286041259765625, 0.44139862060546875, 0.454193115234375, 0.46698760986328125, 0.4797821044921875, 0.49257659912109375, 0.50537109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 2.0, 10.0, 8.0, 20.0, 33.0, 70.0, 136.0, 175.0, 192.0, 134.0, 77.0, 55.0, 25.0, 17.0, 15.0, 14.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.638599395751953e-05, -5.504675209522247e-05, -5.3707510232925415e-05, -5.236826837062836e-05, -5.10290265083313e-05, -4.968978464603424e-05, -4.835054278373718e-05, -4.7011300921440125e-05, -4.5672059059143066e-05, -4.433281719684601e-05, -4.299357533454895e-05, -4.165433347225189e-05, -4.0315091609954834e-05, -3.8975849747657776e-05, -3.763660788536072e-05, -3.629736602306366e-05, -3.49581241607666e-05, -3.3618882298469543e-05, -3.2279640436172485e-05, -3.094039857387543e-05, -2.960115671157837e-05, -2.826191484928131e-05, -2.6922672986984253e-05, -2.5583431124687195e-05, -2.4244189262390137e-05, -2.290494740009308e-05, -2.156570553779602e-05, -2.0226463675498962e-05, -1.8887221813201904e-05, -1.7547979950904846e-05, -1.6208738088607788e-05, -1.486949622631073e-05, -1.3530254364013672e-05, -1.2191012501716614e-05, -1.0851770639419556e-05, -9.512528777122498e-06, -8.17328691482544e-06, -6.834045052528381e-06, -5.494803190231323e-06, -4.155561327934265e-06, -2.816319465637207e-06, -1.477077603340149e-06, -1.3783574104309082e-07, 1.2014061212539673e-06, 2.5406479835510254e-06, 3.8798898458480835e-06, 5.219131708145142e-06, 6.5583735704422e-06, 7.897615432739258e-06, 9.236857295036316e-06, 1.0576099157333374e-05, 1.1915341019630432e-05, 1.325458288192749e-05, 1.4593824744224548e-05, 1.5933066606521606e-05, 1.7272308468818665e-05, 1.8611550331115723e-05, 1.995079219341278e-05, 2.129003405570984e-05, 2.2629275918006897e-05, 2.3968517780303955e-05, 2.5307759642601013e-05, 2.664700150489807e-05, 2.798624336719513e-05, 2.9325485229492188e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 8.0, 15.0, 24.0, 41.0, 55.0, 127.0, 214.0, 533.0, 2383.0, 152376.0, 888482.0, 3145.0, 593.0, 260.0, 127.0, 59.0, 39.0, 24.0, 17.0, 6.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2529296875, -0.24196243286132812, -0.23099517822265625, -0.22002792358398438, -0.2090606689453125, -0.19809341430664062, -0.18712615966796875, -0.17615890502929688, -0.165191650390625, -0.15422439575195312, -0.14325714111328125, -0.13228988647460938, -0.1213226318359375, -0.11035537719726562, -0.09938812255859375, -0.08842086791992188, -0.07745361328125, -0.06648635864257812, -0.05551910400390625, -0.044551849365234375, -0.0335845947265625, -0.022617340087890625, -0.01165008544921875, -0.000682830810546875, 0.010284423828125, 0.021251678466796875, 0.03221893310546875, 0.043186187744140625, 0.0541534423828125, 0.06512069702148438, 0.07608795166015625, 0.08705520629882812, 0.0980224609375, 0.10898971557617188, 0.11995697021484375, 0.13092422485351562, 0.1418914794921875, 0.15285873413085938, 0.16382598876953125, 0.17479324340820312, 0.185760498046875, 0.19672775268554688, 0.20769500732421875, 0.21866226196289062, 0.2296295166015625, 0.24059677124023438, 0.25156402587890625, 0.2625312805175781, 0.27349853515625, 0.2844657897949219, 0.29543304443359375, 0.3064002990722656, 0.3173675537109375, 0.3283348083496094, 0.33930206298828125, 0.3502693176269531, 0.361236572265625, 0.3722038269042969, 0.38317108154296875, 0.3941383361816406, 0.4051055908203125, 0.4160728454589844, 0.42704010009765625, 0.4380073547363281, 0.448974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 12.0, 19.0, 34.0, 334.0, 518.0, 36.0, 21.0, 12.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12443161010742188, -0.12178802490234375, -0.11914443969726562, -0.1165008544921875, -0.11385726928710938, -0.11121368408203125, -0.10857009887695312, -0.105926513671875, -0.10328292846679688, -0.10063934326171875, -0.09799575805664062, -0.0953521728515625, -0.09270858764648438, -0.09006500244140625, -0.08742141723632812, -0.08477783203125, -0.08213424682617188, -0.07949066162109375, -0.07684707641601562, -0.0742034912109375, -0.07155990600585938, -0.06891632080078125, -0.06627273559570312, -0.063629150390625, -0.060985565185546875, -0.05834197998046875, -0.055698394775390625, -0.0530548095703125, -0.050411224365234375, -0.04776763916015625, -0.045124053955078125, -0.04248046875, -0.039836883544921875, -0.03719329833984375, -0.034549713134765625, -0.0319061279296875, -0.029262542724609375, -0.02661895751953125, -0.023975372314453125, -0.021331787109375, -0.018688201904296875, -0.01604461669921875, -0.013401031494140625, -0.0107574462890625, -0.008113861083984375, -0.00547027587890625, -0.002826690673828125, -0.00018310546875, 0.002460479736328125, 0.00510406494140625, 0.007747650146484375, 0.0103912353515625, 0.013034820556640625, 0.01567840576171875, 0.018321990966796875, 0.020965576171875, 0.023609161376953125, 0.02625274658203125, 0.028896331787109375, 0.0315399169921875, 0.034183502197265625, 0.03682708740234375, 0.039470672607421875, 0.0421142578125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 16.0, 19.0, 46.0, 77.0, 121.0, 182.0, 194.0, 137.0, 68.0, 42.0, 33.0, 8.0, 9.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8529906272888184, -3.7201764583587646, -3.58736252784729, -3.4545483589172363, -3.3217344284057617, -3.188920259475708, -3.0561060905456543, -2.9232921600341797, -2.790477991104126, -2.6576638221740723, -2.5248498916625977, -2.392035722732544, -2.2592215538024902, -2.1264076232910156, -1.993593454360962, -1.8607794046401978, -1.7279653549194336, -1.5951513051986694, -1.4623372554779053, -1.3295230865478516, -1.1967090368270874, -1.0638949871063232, -0.9310808777809143, -0.7982667684555054, -0.6654527187347412, -0.532638669013977, -0.3998245596885681, -0.26701048016548157, -0.13419640064239502, -0.0013823509216308594, 0.13143175840377808, 0.264245867729187, 0.3970603942871094, 0.5298744440078735, 0.6626885533332825, 0.7955026626586914, 0.9283167123794556, 1.0611307621002197, 1.1939449310302734, 1.3267589807510376, 1.4595730304718018, 1.592387080192566, 1.72520112991333, 1.8580152988433838, 1.990829348564148, 2.123643398284912, 2.256457567214966, 2.3892717361450195, 2.522085666656494, 2.654899835586548, 2.7877137660980225, 2.920527935028076, 3.053341865539551, 3.1861560344696045, 3.318970203399658, 3.451784133911133, 3.5845983028411865, 3.7174124717712402, 3.850226402282715, 3.9830405712127686, 4.115854740142822, 4.248668670654297, 4.3814826011657715, 4.514297008514404, 4.647110939025879]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 12.0, 24.0, 16.0, 23.0, 40.0, 52.0, 62.0, 74.0, 75.0, 92.0, 90.0, 101.0, 89.0, 55.0, 37.0, 45.0, 17.0, 18.0, 15.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6858091354370117, -2.6021041870117188, -2.5183990001678467, -2.4346940517425537, -2.3509888648986816, -2.2672839164733887, -2.1835789680480957, -2.0998737812042236, -2.0161685943603516, -1.932463526725769, -1.8487584590911865, -1.7650535106658936, -1.6813483238220215, -1.5976433753967285, -1.513938307762146, -1.4302332401275635, -1.3465282917022705, -1.262823224067688, -1.1791181564331055, -1.0954132080078125, -1.0117080211639404, -0.9280030131340027, -0.8442980051040649, -0.7605929374694824, -0.6768878698348999, -0.5931828022003174, -0.5094777345657349, -0.4257727265357971, -0.3420676589012146, -0.2583625912666321, -0.17465758323669434, -0.09095251560211182, -0.007247447967529297, 0.07645760476589203, 0.16016265749931335, 0.2438676953315735, 0.327572762966156, 0.4112778306007385, 0.49498283863067627, 0.5786879062652588, 0.6623929738998413, 0.7460980415344238, 0.8298031091690063, 0.9135081171989441, 0.9972131848335266, 1.080918312072754, 1.1646232604980469, 1.2483283281326294, 1.332033395767212, 1.4157384634017944, 1.499443531036377, 1.58314847946167, 1.666853666305542, 1.750558614730835, 1.8342636823654175, 1.91796875, 2.001673698425293, 2.085378646850586, 2.169083833694458, 2.252788782119751, 2.336493968963623, 2.420198917388916, 2.503903865814209, 2.587609052658081, 2.671314239501953]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 5.0, 16.0, 12.0, 24.0, 18.0, 38.0, 62.0, 70.0, 103.0, 173.0, 240.0, 438.0, 661.0, 1159.0, 2052.0, 4002.0, 8342.0, 20316.0, 63052.0, 420412.0, 425919.0, 63402.0, 20504.0, 8459.0, 3986.0, 2064.0, 1166.0, 682.0, 369.0, 264.0, 164.0, 119.0, 65.0, 55.0, 35.0, 22.0, 18.0, 14.0, 16.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.701171875, -1.64447021484375, -1.5877685546875, -1.53106689453125, -1.474365234375, -1.41766357421875, -1.3609619140625, -1.30426025390625, -1.24755859375, -1.19085693359375, -1.1341552734375, -1.07745361328125, -1.020751953125, -0.96405029296875, -0.9073486328125, -0.85064697265625, -0.7939453125, -0.73724365234375, -0.6805419921875, -0.62384033203125, -0.567138671875, -0.51043701171875, -0.4537353515625, -0.39703369140625, -0.34033203125, -0.28363037109375, -0.2269287109375, -0.17022705078125, -0.113525390625, -0.05682373046875, -0.0001220703125, 0.05657958984375, 0.11328125, 0.16998291015625, 0.2266845703125, 0.28338623046875, 0.340087890625, 0.39678955078125, 0.4534912109375, 0.51019287109375, 0.56689453125, 0.62359619140625, 0.6802978515625, 0.73699951171875, 0.793701171875, 0.85040283203125, 0.9071044921875, 0.96380615234375, 1.0205078125, 1.07720947265625, 1.1339111328125, 1.19061279296875, 1.247314453125, 1.30401611328125, 1.3607177734375, 1.41741943359375, 1.47412109375, 1.53082275390625, 1.5875244140625, 1.64422607421875, 1.700927734375, 1.75762939453125, 1.8143310546875, 1.87103271484375, 1.927734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 17.0, 14.0, 28.0, 43.0, 54.0, 52.0, 68.0, 66.0, 90.0, 89.0, 92.0, 65.0, 73.0, 47.0, 35.0, 24.0, 23.0, 18.0, 13.0, 13.0, 9.0, 4.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39178466796875, -4.2366943359375, -4.08160400390625, -3.926513671875, -3.77142333984375, -3.6163330078125, -3.46124267578125, -3.30615234375, -3.15106201171875, -2.9959716796875, -2.84088134765625, -2.685791015625, -2.53070068359375, -2.3756103515625, -2.22052001953125, -2.0654296875, -1.91033935546875, -1.7552490234375, -1.60015869140625, -1.445068359375, -1.28997802734375, -1.1348876953125, -0.97979736328125, -0.82470703125, -0.66961669921875, -0.5145263671875, -0.35943603515625, -0.204345703125, -0.04925537109375, 0.1058349609375, 0.26092529296875, 0.416015625, 0.57110595703125, 0.7261962890625, 0.88128662109375, 1.036376953125, 1.19146728515625, 1.3465576171875, 1.50164794921875, 1.65673828125, 1.81182861328125, 1.9669189453125, 2.12200927734375, 2.277099609375, 2.43218994140625, 2.5872802734375, 2.74237060546875, 2.8974609375, 3.05255126953125, 3.2076416015625, 3.36273193359375, 3.517822265625, 3.67291259765625, 3.8280029296875, 3.98309326171875, 4.13818359375, 4.29327392578125, 4.4483642578125, 4.60345458984375, 4.758544921875, 4.91363525390625, 5.0687255859375, 5.22381591796875, 5.37890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 10.0, 18.0, 25.0, 29.0, 29.0, 46.0, 55.0, 85.0, 104.0, 137.0, 212.0, 342.0, 582.0, 1362.0, 5242.0, 37042.0, 851899.0, 135123.0, 11589.0, 2359.0, 842.0, 429.0, 287.0, 202.0, 134.0, 89.0, 74.0, 40.0, 40.0, 28.0, 31.0, 10.0, 12.0, 9.0, 11.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.517578125, -3.416290283203125, -3.31500244140625, -3.213714599609375, -3.1124267578125, -3.011138916015625, -2.90985107421875, -2.808563232421875, -2.707275390625, -2.605987548828125, -2.50469970703125, -2.403411865234375, -2.3021240234375, -2.200836181640625, -2.09954833984375, -1.998260498046875, -1.89697265625, -1.795684814453125, -1.69439697265625, -1.593109130859375, -1.4918212890625, -1.390533447265625, -1.28924560546875, -1.187957763671875, -1.086669921875, -0.985382080078125, -0.88409423828125, -0.782806396484375, -0.6815185546875, -0.580230712890625, -0.47894287109375, -0.377655029296875, -0.2763671875, -0.175079345703125, -0.07379150390625, 0.027496337890625, 0.1287841796875, 0.230072021484375, 0.33135986328125, 0.432647705078125, 0.533935546875, 0.635223388671875, 0.73651123046875, 0.837799072265625, 0.9390869140625, 1.040374755859375, 1.14166259765625, 1.242950439453125, 1.34423828125, 1.445526123046875, 1.54681396484375, 1.648101806640625, 1.7493896484375, 1.850677490234375, 1.95196533203125, 2.053253173828125, 2.154541015625, 2.255828857421875, 2.35711669921875, 2.458404541015625, 2.5596923828125, 2.660980224609375, 2.76226806640625, 2.863555908203125, 2.96484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 7.0, 10.0, 6.0, 12.0, 8.0, 11.0, 23.0, 19.0, 24.0, 26.0, 37.0, 35.0, 40.0, 52.0, 55.0, 56.0, 58.0, 62.0, 54.0, 41.0, 62.0, 40.0, 48.0, 34.0, 37.0, 22.0, 18.0, 23.0, 23.0, 10.0, 14.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.79296875, -4.64007568359375, -4.4871826171875, -4.33428955078125, -4.181396484375, -4.02850341796875, -3.8756103515625, -3.72271728515625, -3.56982421875, -3.41693115234375, -3.2640380859375, -3.11114501953125, -2.958251953125, -2.80535888671875, -2.6524658203125, -2.49957275390625, -2.3466796875, -2.19378662109375, -2.0408935546875, -1.88800048828125, -1.735107421875, -1.58221435546875, -1.4293212890625, -1.27642822265625, -1.12353515625, -0.97064208984375, -0.8177490234375, -0.66485595703125, -0.511962890625, -0.35906982421875, -0.2061767578125, -0.05328369140625, 0.099609375, 0.25250244140625, 0.4053955078125, 0.55828857421875, 0.711181640625, 0.86407470703125, 1.0169677734375, 1.16986083984375, 1.32275390625, 1.47564697265625, 1.6285400390625, 1.78143310546875, 1.934326171875, 2.08721923828125, 2.2401123046875, 2.39300537109375, 2.5458984375, 2.69879150390625, 2.8516845703125, 3.00457763671875, 3.157470703125, 3.31036376953125, 3.4632568359375, 3.61614990234375, 3.76904296875, 3.92193603515625, 4.0748291015625, 4.22772216796875, 4.380615234375, 4.53350830078125, 4.6864013671875, 4.83929443359375, 4.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 15.0, 20.0, 35.0, 46.0, 120.0, 475.0, 2829.0, 131516.0, 907370.0, 5121.0, 677.0, 194.0, 50.0, 35.0, 17.0, 12.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.806793212890625, -4.68389892578125, -4.561004638671875, -4.4381103515625, -4.315216064453125, -4.19232177734375, -4.069427490234375, -3.946533203125, -3.823638916015625, -3.70074462890625, -3.577850341796875, -3.4549560546875, -3.332061767578125, -3.20916748046875, -3.086273193359375, -2.96337890625, -2.840484619140625, -2.71759033203125, -2.594696044921875, -2.4718017578125, -2.348907470703125, -2.22601318359375, -2.103118896484375, -1.980224609375, -1.857330322265625, -1.73443603515625, -1.611541748046875, -1.4886474609375, -1.365753173828125, -1.24285888671875, -1.119964599609375, -0.9970703125, -0.874176025390625, -0.75128173828125, -0.628387451171875, -0.5054931640625, -0.382598876953125, -0.25970458984375, -0.136810302734375, -0.013916015625, 0.108978271484375, 0.23187255859375, 0.354766845703125, 0.4776611328125, 0.600555419921875, 0.72344970703125, 0.846343994140625, 0.96923828125, 1.092132568359375, 1.21502685546875, 1.337921142578125, 1.4608154296875, 1.583709716796875, 1.70660400390625, 1.829498291015625, 1.952392578125, 2.075286865234375, 2.19818115234375, 2.321075439453125, 2.4439697265625, 2.566864013671875, 2.68975830078125, 2.812652587890625, 2.935546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 7.0, 16.0, 27.0, 28.0, 22.0, 33.0, 63.0, 130.0, 259.0, 159.0, 62.0, 40.0, 29.0, 21.0, 19.0, 20.0, 8.0, 13.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018334388732910156, -0.00017804093658924103, -0.0001727379858493805, -0.00016743503510951996, -0.00016213208436965942, -0.0001568291336297989, -0.00015152618288993835, -0.00014622323215007782, -0.00014092028141021729, -0.00013561733067035675, -0.00013031437993049622, -0.00012501142919063568, -0.00011970847845077515, -0.00011440552771091461, -0.00010910257697105408, -0.00010379962623119354, -9.849667549133301e-05, -9.319372475147247e-05, -8.789077401161194e-05, -8.25878232717514e-05, -7.728487253189087e-05, -7.198192179203033e-05, -6.66789710521698e-05, -6.137602031230927e-05, -5.607306957244873e-05, -5.0770118832588196e-05, -4.546716809272766e-05, -4.0164217352867126e-05, -3.486126661300659e-05, -2.9558315873146057e-05, -2.4255365133285522e-05, -1.8952414393424988e-05, -1.3649463653564453e-05, -8.346512913703918e-06, -3.043562173843384e-06, 2.259388566017151e-06, 7.5623393058776855e-06, 1.286529004573822e-05, 1.8168240785598755e-05, 2.347119152545929e-05, 2.8774142265319824e-05, 3.407709300518036e-05, 3.9380043745040894e-05, 4.468299448490143e-05, 4.998594522476196e-05, 5.52888959646225e-05, 6.059184670448303e-05, 6.589479744434357e-05, 7.11977481842041e-05, 7.650069892406464e-05, 8.180364966392517e-05, 8.71066004037857e-05, 9.240955114364624e-05, 9.771250188350677e-05, 0.00010301545262336731, 0.00010831840336322784, 0.00011362135410308838, 0.00011892430484294891, 0.00012422725558280945, 0.00012953020632266998, 0.00013483315706253052, 0.00014013610780239105, 0.0001454390585422516, 0.00015074200928211212, 0.00015604496002197266]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 15.0, 28.0, 60.0, 126.0, 326.0, 1337.0, 14282.0, 965597.0, 63070.0, 2884.0, 537.0, 148.0, 75.0, 27.0, 15.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.724853515625, -1.62158203125, -1.518310546875, -1.4150390625, -1.311767578125, -1.20849609375, -1.105224609375, -1.001953125, -0.898681640625, -0.79541015625, -0.692138671875, -0.5888671875, -0.485595703125, -0.38232421875, -0.279052734375, -0.17578125, -0.072509765625, 0.03076171875, 0.134033203125, 0.2373046875, 0.340576171875, 0.44384765625, 0.547119140625, 0.650390625, 0.753662109375, 0.85693359375, 0.960205078125, 1.0634765625, 1.166748046875, 1.27001953125, 1.373291015625, 1.4765625, 1.579833984375, 1.68310546875, 1.786376953125, 1.8896484375, 1.992919921875, 2.09619140625, 2.199462890625, 2.302734375, 2.406005859375, 2.50927734375, 2.612548828125, 2.7158203125, 2.819091796875, 2.92236328125, 3.025634765625, 3.12890625, 3.232177734375, 3.33544921875, 3.438720703125, 3.5419921875, 3.645263671875, 3.74853515625, 3.851806640625, 3.955078125, 4.058349609375, 4.16162109375, 4.264892578125, 4.3681640625, 4.471435546875, 4.57470703125, 4.677978515625, 4.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 14.0, 22.0, 41.0, 41.0, 104.0, 529.0, 91.0, 54.0, 37.0, 26.0, 14.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.498046875, -1.4658050537109375, -1.433563232421875, -1.4013214111328125, -1.36907958984375, -1.3368377685546875, -1.304595947265625, -1.2723541259765625, -1.2401123046875, -1.2078704833984375, -1.175628662109375, -1.1433868408203125, -1.11114501953125, -1.0789031982421875, -1.046661376953125, -1.0144195556640625, -0.982177734375, -0.9499359130859375, -0.917694091796875, -0.8854522705078125, -0.85321044921875, -0.8209686279296875, -0.788726806640625, -0.7564849853515625, -0.7242431640625, -0.6920013427734375, -0.659759521484375, -0.6275177001953125, -0.59527587890625, -0.5630340576171875, -0.530792236328125, -0.4985504150390625, -0.46630859375, -0.4340667724609375, -0.401824951171875, -0.3695831298828125, -0.33734130859375, -0.3050994873046875, -0.272857666015625, -0.2406158447265625, -0.2083740234375, -0.1761322021484375, -0.143890380859375, -0.1116485595703125, -0.07940673828125, -0.0471649169921875, -0.014923095703125, 0.0173187255859375, 0.049560546875, 0.0818023681640625, 0.114044189453125, 0.1462860107421875, 0.17852783203125, 0.2107696533203125, 0.243011474609375, 0.2752532958984375, 0.3074951171875, 0.3397369384765625, 0.371978759765625, 0.4042205810546875, 0.43646240234375, 0.4687042236328125, 0.500946044921875, 0.5331878662109375, 0.5654296875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 11.0, 10.0, 30.0, 74.0, 146.0, 263.0, 232.0, 111.0, 59.0, 30.0, 10.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.956765651702881, -7.55506706237793, -7.1533684730529785, -6.751669883728027, -6.349970817565918, -5.948272705078125, -5.546573638916016, -5.1448750495910645, -4.743176460266113, -4.341477870941162, -3.939779281616211, -3.5380804538726807, -3.1363818645477295, -2.7346832752227783, -2.332984447479248, -1.9312858581542969, -1.5295872688293457, -1.1278886795043945, -0.7261899709701538, -0.3244912624359131, 0.07720732688903809, 0.47890591621398926, 0.8806047439575195, 1.2823033332824707, 1.6840019226074219, 2.085700511932373, 2.487399101257324, 2.8890979290008545, 3.2907965183258057, 3.692495107650757, 4.094193935394287, 4.495892524719238, 4.897590637207031, 5.299289226531982, 5.700987815856934, 6.102686882019043, 6.504384994506836, 6.906084060668945, 7.3077826499938965, 7.709481239318848, 8.11117935180664, 8.51287841796875, 8.914576530456543, 9.316275596618652, 9.717973709106445, 10.119672775268555, 10.521371841430664, 10.923069953918457, 11.324769020080566, 11.726468086242676, 12.128166198730469, 12.529865264892578, 12.931563377380371, 13.33326244354248, 13.734960556030273, 14.136659622192383, 14.538358688354492, 14.940057754516602, 15.341755867004395, 15.743454933166504, 16.145153045654297, 16.546852111816406, 16.948551177978516, 17.350250244140625, 17.7519474029541]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 19.0, 12.0, 20.0, 10.0, 19.0, 18.0, 20.0, 24.0, 28.0, 40.0, 32.0, 40.0, 32.0, 41.0, 39.0, 34.0, 51.0, 43.0, 46.0, 35.0, 39.0, 48.0, 37.0, 32.0, 31.0, 25.0, 27.0, 18.0, 14.0, 15.0, 15.0, 16.0, 15.0, 4.0, 12.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.197763442993164, -5.985151290893555, -5.772539138793945, -5.559926509857178, -5.347314357757568, -5.134702205657959, -4.922089576721191, -4.709477424621582, -4.496865272521973, -4.284253120422363, -4.071640968322754, -3.8590283393859863, -3.646416187286377, -3.4338040351867676, -3.221191644668579, -3.0085792541503906, -2.7959671020507812, -2.583354949951172, -2.3707425594329834, -2.158130168914795, -1.9455180168151855, -1.7329057455062866, -1.5202934741973877, -1.3076812028884888, -1.0950689315795898, -0.8824566602706909, -0.669844388961792, -0.45723211765289307, -0.24461984634399414, -0.032007575035095215, 0.1806046962738037, 0.39321696758270264, 0.6058297157287598, 0.8184419870376587, 1.0310542583465576, 1.2436665296554565, 1.4562788009643555, 1.6688910722732544, 1.8815033435821533, 2.094115734100342, 2.306727886199951, 2.5193400382995605, 2.731952428817749, 2.9445648193359375, 3.157176971435547, 3.3697891235351562, 3.5824015140533447, 3.795013904571533, 4.007626056671143, 4.220238208770752, 4.4328508377075195, 4.645462989807129, 4.858075141906738, 5.070687294006348, 5.283299446105957, 5.495912075042725, 5.708524227142334, 5.921136379241943, 6.133749008178711, 6.34636116027832, 6.55897331237793, 6.771585464477539, 6.984197616577148, 7.196810245513916, 7.409422397613525]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 11.0, 16.0, 15.0, 14.0, 18.0, 30.0, 24.0, 35.0, 58.0, 92.0, 165.0, 356.0, 1154.0, 6310.0, 129744.0, 4008755.0, 42009.0, 3837.0, 872.0, 282.0, 130.0, 60.0, 57.0, 32.0, 21.0, 28.0, 18.0, 15.0, 14.0, 9.0, 9.0, 13.0, 7.0, 10.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4765625, -8.214599609375, -7.95263671875, -7.690673828125, -7.4287109375, -7.166748046875, -6.90478515625, -6.642822265625, -6.380859375, -6.118896484375, -5.85693359375, -5.594970703125, -5.3330078125, -5.071044921875, -4.80908203125, -4.547119140625, -4.28515625, -4.023193359375, -3.76123046875, -3.499267578125, -3.2373046875, -2.975341796875, -2.71337890625, -2.451416015625, -2.189453125, -1.927490234375, -1.66552734375, -1.403564453125, -1.1416015625, -0.879638671875, -0.61767578125, -0.355712890625, -0.09375, 0.168212890625, 0.43017578125, 0.692138671875, 0.9541015625, 1.216064453125, 1.47802734375, 1.739990234375, 2.001953125, 2.263916015625, 2.52587890625, 2.787841796875, 3.0498046875, 3.311767578125, 3.57373046875, 3.835693359375, 4.09765625, 4.359619140625, 4.62158203125, 4.883544921875, 5.1455078125, 5.407470703125, 5.66943359375, 5.931396484375, 6.193359375, 6.455322265625, 6.71728515625, 6.979248046875, 7.2412109375, 7.503173828125, 7.76513671875, 8.027099609375, 8.2890625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 19.0, 13.0, 19.0, 23.0, 29.0, 39.0, 49.0, 77.0, 87.0, 82.0, 94.0, 98.0, 93.0, 52.0, 49.0, 33.0, 31.0, 18.0, 18.0, 19.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.345703125, -3.253631591796875, -3.16156005859375, -3.069488525390625, -2.9774169921875, -2.885345458984375, -2.79327392578125, -2.701202392578125, -2.609130859375, -2.517059326171875, -2.42498779296875, -2.332916259765625, -2.2408447265625, -2.148773193359375, -2.05670166015625, -1.964630126953125, -1.87255859375, -1.780487060546875, -1.68841552734375, -1.596343994140625, -1.5042724609375, -1.412200927734375, -1.32012939453125, -1.228057861328125, -1.135986328125, -1.043914794921875, -0.95184326171875, -0.859771728515625, -0.7677001953125, -0.675628662109375, -0.58355712890625, -0.491485595703125, -0.3994140625, -0.307342529296875, -0.21527099609375, -0.123199462890625, -0.0311279296875, 0.060943603515625, 0.15301513671875, 0.245086669921875, 0.337158203125, 0.429229736328125, 0.52130126953125, 0.613372802734375, 0.7054443359375, 0.797515869140625, 0.88958740234375, 0.981658935546875, 1.07373046875, 1.165802001953125, 1.25787353515625, 1.349945068359375, 1.4420166015625, 1.534088134765625, 1.62615966796875, 1.718231201171875, 1.810302734375, 1.902374267578125, 1.99444580078125, 2.086517333984375, 2.1785888671875, 2.270660400390625, 2.36273193359375, 2.454803466796875, 2.546875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 2.0, 11.0, 9.0, 17.0, 36.0, 61.0, 104.0, 250.0, 767.0, 3878.0, 53158.0, 3983295.0, 144280.0, 6655.0, 1133.0, 315.0, 149.0, 56.0, 35.0, 19.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.890625, -10.62255859375, -10.3544921875, -10.08642578125, -9.818359375, -9.55029296875, -9.2822265625, -9.01416015625, -8.74609375, -8.47802734375, -8.2099609375, -7.94189453125, -7.673828125, -7.40576171875, -7.1376953125, -6.86962890625, -6.6015625, -6.33349609375, -6.0654296875, -5.79736328125, -5.529296875, -5.26123046875, -4.9931640625, -4.72509765625, -4.45703125, -4.18896484375, -3.9208984375, -3.65283203125, -3.384765625, -3.11669921875, -2.8486328125, -2.58056640625, -2.3125, -2.04443359375, -1.7763671875, -1.50830078125, -1.240234375, -0.97216796875, -0.7041015625, -0.43603515625, -0.16796875, 0.10009765625, 0.3681640625, 0.63623046875, 0.904296875, 1.17236328125, 1.4404296875, 1.70849609375, 1.9765625, 2.24462890625, 2.5126953125, 2.78076171875, 3.048828125, 3.31689453125, 3.5849609375, 3.85302734375, 4.12109375, 4.38916015625, 4.6572265625, 4.92529296875, 5.193359375, 5.46142578125, 5.7294921875, 5.99755859375, 6.265625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 9.0, 6.0, 5.0, 6.0, 8.0, 21.0, 27.0, 28.0, 30.0, 46.0, 54.0, 91.0, 111.0, 153.0, 227.0, 356.0, 705.0, 815.0, 442.0, 255.0, 186.0, 100.0, 109.0, 46.0, 46.0, 38.0, 30.0, 27.0, 15.0, 20.0, 16.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7553558349609375, -0.731903076171875, -0.7084503173828125, -0.68499755859375, -0.6615447998046875, -0.638092041015625, -0.6146392822265625, -0.5911865234375, -0.5677337646484375, -0.544281005859375, -0.5208282470703125, -0.49737548828125, -0.4739227294921875, -0.450469970703125, -0.4270172119140625, -0.403564453125, -0.3801116943359375, -0.356658935546875, -0.3332061767578125, -0.30975341796875, -0.2863006591796875, -0.262847900390625, -0.2393951416015625, -0.2159423828125, -0.1924896240234375, -0.169036865234375, -0.1455841064453125, -0.12213134765625, -0.0986785888671875, -0.075225830078125, -0.0517730712890625, -0.0283203125, -0.0048675537109375, 0.018585205078125, 0.0420379638671875, 0.06549072265625, 0.0889434814453125, 0.112396240234375, 0.1358489990234375, 0.1593017578125, 0.1827545166015625, 0.206207275390625, 0.2296600341796875, 0.25311279296875, 0.2765655517578125, 0.300018310546875, 0.3234710693359375, 0.346923828125, 0.3703765869140625, 0.393829345703125, 0.4172821044921875, 0.44073486328125, 0.4641876220703125, 0.487640380859375, 0.5110931396484375, 0.5345458984375, 0.5579986572265625, 0.581451416015625, 0.6049041748046875, 0.62835693359375, 0.6518096923828125, 0.675262451171875, 0.6987152099609375, 0.72216796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 7.0, 16.0, 14.0, 32.0, 47.0, 103.0, 94.0, 188.0, 147.0, 122.0, 83.0, 53.0, 38.0, 12.0, 17.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.128007411956787, -4.951148986816406, -4.774291038513184, -4.597433090209961, -4.42057466506958, -4.243716239929199, -4.066858291625977, -3.890000104904175, -3.713141918182373, -3.5362837314605713, -3.3594255447387695, -3.1825673580169678, -3.005709171295166, -2.8288509845733643, -2.6519927978515625, -2.4751346111297607, -2.298276424407959, -2.1214182376861572, -1.9445600509643555, -1.7677018642425537, -1.590843677520752, -1.4139854907989502, -1.2371273040771484, -1.0602691173553467, -0.8834109306335449, -0.7065527439117432, -0.5296945571899414, -0.35283637046813965, -0.1759781837463379, 0.0008800029754638672, 0.17773818969726562, 0.3545963764190674, 0.5314550399780273, 0.7083132266998291, 0.8851714134216309, 1.0620296001434326, 1.2388877868652344, 1.4157459735870361, 1.592604160308838, 1.7694623470306396, 1.9463205337524414, 2.123178720474243, 2.300036907196045, 2.4768950939178467, 2.6537532806396484, 2.83061146736145, 3.007469654083252, 3.1843278408050537, 3.3611860275268555, 3.5380442142486572, 3.714902400970459, 3.8917605876922607, 4.0686187744140625, 4.245476722717285, 4.422335147857666, 4.599193572998047, 4.7760515213012695, 4.952909469604492, 5.129767894744873, 5.306626319885254, 5.483484268188477, 5.660342216491699, 5.83720064163208, 6.014059066772461, 6.190917015075684]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 6.0, 10.0, 27.0, 25.0, 25.0, 41.0, 44.0, 54.0, 50.0, 57.0, 74.0, 67.0, 63.0, 64.0, 63.0, 53.0, 47.0, 41.0, 25.0, 33.0, 23.0, 18.0, 16.0, 21.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3691611289978027, -3.271679639816284, -3.1741981506347656, -3.076716899871826, -2.9792354106903076, -2.881753921508789, -2.7842724323272705, -2.686790943145752, -2.5893096923828125, -2.491828203201294, -2.3943467140197754, -2.296865463256836, -2.1993839740753174, -2.101902484893799, -2.0044209957122803, -1.9069395065307617, -1.8094580173492432, -1.7119765281677246, -1.6144951581954956, -1.517013669013977, -1.419532299041748, -1.3220508098602295, -1.224569320678711, -1.1270878314971924, -1.0296064615249634, -0.9321250319480896, -0.8346436023712158, -0.7371621131896973, -0.6396806836128235, -0.5421992540359497, -0.44471776485443115, -0.3472363352775574, -0.2497551441192627, -0.15227369964122772, -0.05479225516319275, 0.04268920421600342, 0.1401706337928772, 0.23765206336975098, 0.33513355255126953, 0.4326149821281433, 0.5300964117050171, 0.6275778412818909, 0.7250592708587646, 0.8225407600402832, 0.920022189617157, 1.0175036191940308, 1.1149851083755493, 1.2124664783477783, 1.3099479675292969, 1.4074294567108154, 1.5049108266830444, 1.602392315864563, 1.699873685836792, 1.7973551750183105, 1.894836664199829, 1.9923181533813477, 2.089799404144287, 2.1872808933258057, 2.284762382507324, 2.3822436332702637, 2.4797251224517822, 2.577206611633301, 2.6746881008148193, 2.772169589996338, 2.8696510791778564]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 3.0, 7.0, 2.0, 11.0, 9.0, 12.0, 20.0, 27.0, 21.0, 43.0, 54.0, 88.0, 125.0, 156.0, 243.0, 388.0, 677.0, 1202.0, 2827.0, 10487.0, 82099.0, 787532.0, 141285.0, 14280.0, 3578.0, 1322.0, 731.0, 444.0, 249.0, 170.0, 122.0, 84.0, 74.0, 46.0, 34.0, 24.0, 18.0, 13.0, 9.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.5146484375, -0.49835968017578125, -0.4820709228515625, -0.46578216552734375, -0.449493408203125, -0.43320465087890625, -0.4169158935546875, -0.40062713623046875, -0.38433837890625, -0.36804962158203125, -0.3517608642578125, -0.33547210693359375, -0.319183349609375, -0.30289459228515625, -0.2866058349609375, -0.27031707763671875, -0.2540283203125, -0.23773956298828125, -0.2214508056640625, -0.20516204833984375, -0.188873291015625, -0.17258453369140625, -0.1562957763671875, -0.14000701904296875, -0.12371826171875, -0.10742950439453125, -0.0911407470703125, -0.07485198974609375, -0.058563232421875, -0.04227447509765625, -0.0259857177734375, -0.00969696044921875, 0.006591796875, 0.02288055419921875, 0.0391693115234375, 0.05545806884765625, 0.071746826171875, 0.08803558349609375, 0.1043243408203125, 0.12061309814453125, 0.13690185546875, 0.15319061279296875, 0.1694793701171875, 0.18576812744140625, 0.202056884765625, 0.21834564208984375, 0.2346343994140625, 0.25092315673828125, 0.2672119140625, 0.28350067138671875, 0.2997894287109375, 0.31607818603515625, 0.332366943359375, 0.34865570068359375, 0.3649444580078125, 0.38123321533203125, 0.39752197265625, 0.41381072998046875, 0.4300994873046875, 0.44638824462890625, 0.462677001953125, 0.47896575927734375, 0.4952545166015625, 0.5115432739257812, 0.52783203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 6.0, 17.0, 17.0, 22.0, 33.0, 36.0, 60.0, 53.0, 50.0, 79.0, 61.0, 67.0, 88.0, 59.0, 60.0, 49.0, 41.0, 35.0, 40.0, 21.0, 10.0, 24.0, 13.0, 16.0, 3.0, 8.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4765625, -2.395904541015625, -2.31524658203125, -2.234588623046875, -2.1539306640625, -2.073272705078125, -1.99261474609375, -1.911956787109375, -1.831298828125, -1.750640869140625, -1.66998291015625, -1.589324951171875, -1.5086669921875, -1.428009033203125, -1.34735107421875, -1.266693115234375, -1.18603515625, -1.105377197265625, -1.02471923828125, -0.944061279296875, -0.8634033203125, -0.782745361328125, -0.70208740234375, -0.621429443359375, -0.540771484375, -0.460113525390625, -0.37945556640625, -0.298797607421875, -0.2181396484375, -0.137481689453125, -0.05682373046875, 0.023834228515625, 0.1044921875, 0.185150146484375, 0.26580810546875, 0.346466064453125, 0.4271240234375, 0.507781982421875, 0.58843994140625, 0.669097900390625, 0.749755859375, 0.830413818359375, 0.91107177734375, 0.991729736328125, 1.0723876953125, 1.153045654296875, 1.23370361328125, 1.314361572265625, 1.39501953125, 1.475677490234375, 1.55633544921875, 1.636993408203125, 1.7176513671875, 1.798309326171875, 1.87896728515625, 1.959625244140625, 2.040283203125, 2.120941162109375, 2.20159912109375, 2.282257080078125, 2.3629150390625, 2.443572998046875, 2.52423095703125, 2.604888916015625, 2.685546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 12.0, 10.0, 30.0, 18.0, 37.0, 37.0, 55.0, 73.0, 109.0, 142.0, 193.0, 318.0, 453.0, 977.0, 3896.0, 44037.0, 605906.0, 365427.0, 22320.0, 2430.0, 738.0, 399.0, 262.0, 194.0, 123.0, 74.0, 61.0, 52.0, 44.0, 19.0, 29.0, 14.0, 15.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.35931396484375, -0.3472900390625, -0.33526611328125, -0.3232421875, -0.31121826171875, -0.2991943359375, -0.28717041015625, -0.275146484375, -0.26312255859375, -0.2510986328125, -0.23907470703125, -0.22705078125, -0.21502685546875, -0.2030029296875, -0.19097900390625, -0.178955078125, -0.16693115234375, -0.1549072265625, -0.14288330078125, -0.130859375, -0.11883544921875, -0.1068115234375, -0.09478759765625, -0.082763671875, -0.07073974609375, -0.0587158203125, -0.04669189453125, -0.03466796875, -0.02264404296875, -0.0106201171875, 0.00140380859375, 0.013427734375, 0.02545166015625, 0.0374755859375, 0.04949951171875, 0.0615234375, 0.07354736328125, 0.0855712890625, 0.09759521484375, 0.109619140625, 0.12164306640625, 0.1336669921875, 0.14569091796875, 0.15771484375, 0.16973876953125, 0.1817626953125, 0.19378662109375, 0.205810546875, 0.21783447265625, 0.2298583984375, 0.24188232421875, 0.25390625, 0.26593017578125, 0.2779541015625, 0.28997802734375, 0.302001953125, 0.31402587890625, 0.3260498046875, 0.33807373046875, 0.35009765625, 0.36212158203125, 0.3741455078125, 0.38616943359375, 0.398193359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 4.0, 9.0, 18.0, 15.0, 21.0, 28.0, 23.0, 26.0, 31.0, 38.0, 31.0, 34.0, 32.0, 31.0, 39.0, 42.0, 49.0, 58.0, 50.0, 45.0, 46.0, 39.0, 34.0, 34.0, 27.0, 24.0, 23.0, 20.0, 19.0, 20.0, 13.0, 11.0, 21.0, 2.0, 9.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.17578125, -4.0543212890625, -3.932861328125, -3.8114013671875, -3.68994140625, -3.5684814453125, -3.447021484375, -3.3255615234375, -3.2041015625, -3.0826416015625, -2.961181640625, -2.8397216796875, -2.71826171875, -2.5968017578125, -2.475341796875, -2.3538818359375, -2.232421875, -2.1109619140625, -1.989501953125, -1.8680419921875, -1.74658203125, -1.6251220703125, -1.503662109375, -1.3822021484375, -1.2607421875, -1.1392822265625, -1.017822265625, -0.8963623046875, -0.77490234375, -0.6534423828125, -0.531982421875, -0.4105224609375, -0.2890625, -0.1676025390625, -0.046142578125, 0.0753173828125, 0.19677734375, 0.3182373046875, 0.439697265625, 0.5611572265625, 0.6826171875, 0.8040771484375, 0.925537109375, 1.0469970703125, 1.16845703125, 1.2899169921875, 1.411376953125, 1.5328369140625, 1.654296875, 1.7757568359375, 1.897216796875, 2.0186767578125, 2.14013671875, 2.2615966796875, 2.383056640625, 2.5045166015625, 2.6259765625, 2.7474365234375, 2.868896484375, 2.9903564453125, 3.11181640625, 3.2332763671875, 3.354736328125, 3.4761962890625, 3.59765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 3.0, 8.0, 8.0, 11.0, 14.0, 23.0, 19.0, 22.0, 32.0, 38.0, 50.0, 73.0, 103.0, 178.0, 398.0, 1437.0, 12721.0, 993715.0, 35986.0, 2423.0, 577.0, 225.0, 134.0, 91.0, 63.0, 37.0, 34.0, 21.0, 16.0, 15.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.14024066925048828, -0.13607215881347656, -0.13190364837646484, -0.12773513793945312, -0.1235666275024414, -0.11939811706542969, -0.11522960662841797, -0.11106109619140625, -0.10689258575439453, -0.10272407531738281, -0.0985555648803711, -0.09438705444335938, -0.09021854400634766, -0.08605003356933594, -0.08188152313232422, -0.0777130126953125, -0.07354450225830078, -0.06937599182128906, -0.06520748138427734, -0.061038970947265625, -0.056870460510253906, -0.05270195007324219, -0.04853343963623047, -0.04436492919921875, -0.04019641876220703, -0.03602790832519531, -0.031859397888183594, -0.027690887451171875, -0.023522377014160156, -0.019353866577148438, -0.015185356140136719, -0.011016845703125, -0.006848335266113281, -0.0026798248291015625, 0.0014886856079101562, 0.005657196044921875, 0.009825706481933594, 0.013994216918945312, 0.01816272735595703, 0.02233123779296875, 0.02649974822998047, 0.030668258666992188, 0.034836769104003906, 0.039005279541015625, 0.043173789978027344, 0.04734230041503906, 0.05151081085205078, 0.0556793212890625, 0.05984783172607422, 0.06401634216308594, 0.06818485260009766, 0.07235336303710938, 0.0765218734741211, 0.08069038391113281, 0.08485889434814453, 0.08902740478515625, 0.09319591522216797, 0.09736442565917969, 0.1015329360961914, 0.10570144653320312, 0.10986995697021484, 0.11403846740722656, 0.11820697784423828, 0.12237548828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 9.0, 4.0, 5.0, 13.0, 22.0, 25.0, 23.0, 36.0, 36.0, 63.0, 78.0, 111.0, 120.0, 124.0, 97.0, 69.0, 45.0, 23.0, 22.0, 12.0, 20.0, 7.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8312206268310547e-05, -2.734735608100891e-05, -2.6382505893707275e-05, -2.541765570640564e-05, -2.4452805519104004e-05, -2.3487955331802368e-05, -2.2523105144500732e-05, -2.1558254957199097e-05, -2.059340476989746e-05, -1.9628554582595825e-05, -1.866370439529419e-05, -1.7698854207992554e-05, -1.6734004020690918e-05, -1.5769153833389282e-05, -1.4804303646087646e-05, -1.383945345878601e-05, -1.2874603271484375e-05, -1.190975308418274e-05, -1.0944902896881104e-05, -9.980052709579468e-06, -9.015202522277832e-06, -8.050352334976196e-06, -7.0855021476745605e-06, -6.120651960372925e-06, -5.155801773071289e-06, -4.190951585769653e-06, -3.2261013984680176e-06, -2.261251211166382e-06, -1.296401023864746e-06, -3.3155083656311035e-07, 6.332993507385254e-07, 1.5981495380401611e-06, 2.562999725341797e-06, 3.5278499126434326e-06, 4.492700099945068e-06, 5.457550287246704e-06, 6.42240047454834e-06, 7.387250661849976e-06, 8.352100849151611e-06, 9.316951036453247e-06, 1.0281801223754883e-05, 1.1246651411056519e-05, 1.2211501598358154e-05, 1.317635178565979e-05, 1.4141201972961426e-05, 1.5106052160263062e-05, 1.6070902347564697e-05, 1.7035752534866333e-05, 1.800060272216797e-05, 1.8965452909469604e-05, 1.993030309677124e-05, 2.0895153284072876e-05, 2.1860003471374512e-05, 2.2824853658676147e-05, 2.3789703845977783e-05, 2.475455403327942e-05, 2.5719404220581055e-05, 2.668425440788269e-05, 2.7649104595184326e-05, 2.8613954782485962e-05, 2.9578804969787598e-05, 3.0543655157089233e-05, 3.150850534439087e-05, 3.2473355531692505e-05, 3.343820571899414e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 13.0, 20.0, 16.0, 29.0, 44.0, 72.0, 132.0, 174.0, 388.0, 731.0, 1692.0, 5169.0, 28057.0, 877363.0, 118427.0, 10979.0, 2899.0, 1080.0, 531.0, 297.0, 159.0, 95.0, 64.0, 45.0, 31.0, 14.0, 12.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14711952209472656, -0.14262771606445312, -0.1381359100341797, -0.13364410400390625, -0.1291522979736328, -0.12466049194335938, -0.12016868591308594, -0.1156768798828125, -0.11118507385253906, -0.10669326782226562, -0.10220146179199219, -0.09770965576171875, -0.09321784973144531, -0.08872604370117188, -0.08423423767089844, -0.079742431640625, -0.07525062561035156, -0.07075881958007812, -0.06626701354980469, -0.06177520751953125, -0.05728340148925781, -0.052791595458984375, -0.04829978942871094, -0.0438079833984375, -0.03931617736816406, -0.034824371337890625, -0.030332565307617188, -0.02584075927734375, -0.021348953247070312, -0.016857147216796875, -0.012365341186523438, -0.00787353515625, -0.0033817291259765625, 0.001110076904296875, 0.0056018829345703125, 0.01009368896484375, 0.014585494995117188, 0.019077301025390625, 0.023569107055664062, 0.0280609130859375, 0.03255271911621094, 0.037044525146484375, 0.04153633117675781, 0.04602813720703125, 0.05051994323730469, 0.055011749267578125, 0.05950355529785156, 0.063995361328125, 0.06848716735839844, 0.07297897338867188, 0.07747077941894531, 0.08196258544921875, 0.08645439147949219, 0.09094619750976562, 0.09543800354003906, 0.0999298095703125, 0.10442161560058594, 0.10891342163085938, 0.11340522766113281, 0.11789703369140625, 0.12238883972167969, 0.12688064575195312, 0.13137245178222656, 0.1358642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 8.0, 12.0, 15.0, 23.0, 39.0, 98.0, 268.0, 270.0, 106.0, 48.0, 32.0, 15.0, 13.0, 9.0, 6.0, 5.0, 1.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0355224609375, -0.034297943115234375, -0.03307342529296875, -0.031848907470703125, -0.0306243896484375, -0.029399871826171875, -0.02817535400390625, -0.026950836181640625, -0.025726318359375, -0.024501800537109375, -0.02327728271484375, -0.022052764892578125, -0.0208282470703125, -0.019603729248046875, -0.01837921142578125, -0.017154693603515625, -0.01593017578125, -0.014705657958984375, -0.01348114013671875, -0.012256622314453125, -0.0110321044921875, -0.009807586669921875, -0.00858306884765625, -0.007358551025390625, -0.006134033203125, -0.004909515380859375, -0.00368499755859375, -0.002460479736328125, -0.0012359619140625, -1.1444091796875e-05, 0.00121307373046875, 0.002437591552734375, 0.003662109375, 0.004886627197265625, 0.00611114501953125, 0.007335662841796875, 0.0085601806640625, 0.009784698486328125, 0.01100921630859375, 0.012233734130859375, 0.013458251953125, 0.014682769775390625, 0.01590728759765625, 0.017131805419921875, 0.0183563232421875, 0.019580841064453125, 0.02080535888671875, 0.022029876708984375, 0.02325439453125, 0.024478912353515625, 0.02570343017578125, 0.026927947998046875, 0.0281524658203125, 0.029376983642578125, 0.03060150146484375, 0.031826019287109375, 0.033050537109375, 0.034275054931640625, 0.03549957275390625, 0.036724090576171875, 0.0379486083984375, 0.039173126220703125, 0.04039764404296875, 0.041622161865234375, 0.0428466796875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 19.0, 40.0, 65.0, 106.0, 134.0, 198.0, 147.0, 99.0, 69.0, 41.0, 20.0, 10.0, 12.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455575704574585, -3.3145558834075928, -3.1735360622406006, -3.0325162410736084, -2.891496181488037, -2.750476360321045, -2.6094565391540527, -2.4684367179870605, -2.3274168968200684, -2.186397075653076, -2.045377254486084, -1.9043573141098022, -1.76333749294281, -1.6223176717758179, -1.4812977313995361, -1.340277910232544, -1.1992580890655518, -1.0582382678985596, -0.9172183871269226, -0.7761985063552856, -0.6351786851882935, -0.49415886402130127, -0.3531389832496643, -0.21211910247802734, -0.07109928131103516, 0.06992056965827942, 0.210940420627594, 0.35196027159690857, 0.49298012256622314, 0.6339999437332153, 0.7750198245048523, 0.9160397052764893, 1.0570592880249023, 1.1980791091918945, 1.3390989303588867, 1.4801188707351685, 1.6211386919021606, 1.7621585130691528, 1.9031784534454346, 2.0441982746124268, 2.185218095779419, 2.326237916946411, 2.4672577381134033, 2.6082775592803955, 2.749297618865967, 2.890317440032959, 3.031337261199951, 3.1723570823669434, 3.3133769035339355, 3.4543967247009277, 3.59541654586792, 3.736436367034912, 3.8774561882019043, 4.0184760093688965, 4.159495830535889, 4.300516128540039, 4.441535949707031, 4.582555770874023, 4.723575592041016, 4.864595413208008, 5.005615234375, 5.146635055541992, 5.287654876708984, 5.428674697875977, 5.569694519042969]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 10.0, 7.0, 20.0, 21.0, 28.0, 41.0, 49.0, 52.0, 44.0, 72.0, 70.0, 78.0, 86.0, 55.0, 58.0, 64.0, 45.0, 36.0, 31.0, 28.0, 16.0, 20.0, 14.0, 11.0, 11.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5668931007385254, -2.4891254901885986, -2.411357879638672, -2.333590269088745, -2.2558226585388184, -2.1780550479888916, -2.100287437438965, -2.022520065307617, -1.9447523355484009, -1.8669847249984741, -1.7892171144485474, -1.7114495038986206, -1.6336820125579834, -1.5559144020080566, -1.4781467914581299, -1.4003791809082031, -1.3226115703582764, -1.2448439598083496, -1.1670763492584229, -1.089308738708496, -1.0115411281585693, -0.9337735772132874, -0.8560060262680054, -0.7782384157180786, -0.7004708051681519, -0.6227031946182251, -0.5449355840682983, -0.46716803312301636, -0.3894004225730896, -0.31163281202316284, -0.23386523127555847, -0.1560976505279541, -0.07833027839660645, -0.0005626827478408813, 0.07720491290092468, 0.15497250854969025, 0.2327401041984558, 0.31050771474838257, 0.38827529549598694, 0.4660428762435913, 0.5438104867935181, 0.6215780973434448, 0.6993457078933716, 0.7771132588386536, 0.8548808693885803, 0.9326484799385071, 1.010416030883789, 1.0881836414337158, 1.1659512519836426, 1.2437188625335693, 1.321486473083496, 1.3992540836334229, 1.4770216941833496, 1.5547893047332764, 1.6325567960739136, 1.7103244066238403, 1.788092017173767, 1.8658596277236938, 1.9436272382736206, 2.021394729614258, 2.0991623401641846, 2.1769299507141113, 2.254697561264038, 2.332465171813965, 2.4102327823638916]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 14.0, 15.0, 21.0, 29.0, 68.0, 99.0, 160.0, 229.0, 436.0, 766.0, 1539.0, 3103.0, 7016.0, 18436.0, 59039.0, 312341.0, 521738.0, 82709.0, 24174.0, 8938.0, 3760.0, 1758.0, 898.0, 474.0, 284.0, 191.0, 107.0, 66.0, 41.0, 31.0, 17.0, 18.0, 9.0, 1.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.17828369140625, -2.1104736328125, -2.04266357421875, -1.974853515625, -1.90704345703125, -1.8392333984375, -1.77142333984375, -1.70361328125, -1.63580322265625, -1.5679931640625, -1.50018310546875, -1.432373046875, -1.36456298828125, -1.2967529296875, -1.22894287109375, -1.1611328125, -1.09332275390625, -1.0255126953125, -0.95770263671875, -0.889892578125, -0.82208251953125, -0.7542724609375, -0.68646240234375, -0.61865234375, -0.55084228515625, -0.4830322265625, -0.41522216796875, -0.347412109375, -0.27960205078125, -0.2117919921875, -0.14398193359375, -0.076171875, -0.00836181640625, 0.0594482421875, 0.12725830078125, 0.195068359375, 0.26287841796875, 0.3306884765625, 0.39849853515625, 0.46630859375, 0.53411865234375, 0.6019287109375, 0.66973876953125, 0.737548828125, 0.80535888671875, 0.8731689453125, 0.94097900390625, 1.0087890625, 1.07659912109375, 1.1444091796875, 1.21221923828125, 1.280029296875, 1.34783935546875, 1.4156494140625, 1.48345947265625, 1.55126953125, 1.61907958984375, 1.6868896484375, 1.75469970703125, 1.822509765625, 1.89031982421875, 1.9581298828125, 2.02593994140625, 2.09375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 9.0, 10.0, 13.0, 18.0, 28.0, 36.0, 24.0, 57.0, 54.0, 67.0, 74.0, 73.0, 81.0, 80.0, 89.0, 55.0, 54.0, 38.0, 32.0, 23.0, 25.0, 12.0, 14.0, 10.0, 4.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.890625, -5.723388671875, -5.55615234375, -5.388916015625, -5.2216796875, -5.054443359375, -4.88720703125, -4.719970703125, -4.552734375, -4.385498046875, -4.21826171875, -4.051025390625, -3.8837890625, -3.716552734375, -3.54931640625, -3.382080078125, -3.21484375, -3.047607421875, -2.88037109375, -2.713134765625, -2.5458984375, -2.378662109375, -2.21142578125, -2.044189453125, -1.876953125, -1.709716796875, -1.54248046875, -1.375244140625, -1.2080078125, -1.040771484375, -0.87353515625, -0.706298828125, -0.5390625, -0.371826171875, -0.20458984375, -0.037353515625, 0.1298828125, 0.297119140625, 0.46435546875, 0.631591796875, 0.798828125, 0.966064453125, 1.13330078125, 1.300537109375, 1.4677734375, 1.635009765625, 1.80224609375, 1.969482421875, 2.13671875, 2.303955078125, 2.47119140625, 2.638427734375, 2.8056640625, 2.972900390625, 3.14013671875, 3.307373046875, 3.474609375, 3.641845703125, 3.80908203125, 3.976318359375, 4.1435546875, 4.310791015625, 4.47802734375, 4.645263671875, 4.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 17.0, 17.0, 26.0, 36.0, 52.0, 69.0, 84.0, 167.0, 265.0, 596.0, 2942.0, 64487.0, 946373.0, 30370.0, 1848.0, 461.0, 247.0, 138.0, 99.0, 69.0, 50.0, 33.0, 33.0, 23.0, 12.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.3359375, -7.1226806640625, -6.909423828125, -6.6961669921875, -6.48291015625, -6.2696533203125, -6.056396484375, -5.8431396484375, -5.6298828125, -5.4166259765625, -5.203369140625, -4.9901123046875, -4.77685546875, -4.5635986328125, -4.350341796875, -4.1370849609375, -3.923828125, -3.7105712890625, -3.497314453125, -3.2840576171875, -3.07080078125, -2.8575439453125, -2.644287109375, -2.4310302734375, -2.2177734375, -2.0045166015625, -1.791259765625, -1.5780029296875, -1.36474609375, -1.1514892578125, -0.938232421875, -0.7249755859375, -0.51171875, -0.2984619140625, -0.085205078125, 0.1280517578125, 0.34130859375, 0.5545654296875, 0.767822265625, 0.9810791015625, 1.1943359375, 1.4075927734375, 1.620849609375, 1.8341064453125, 2.04736328125, 2.2606201171875, 2.473876953125, 2.6871337890625, 2.900390625, 3.1136474609375, 3.326904296875, 3.5401611328125, 3.75341796875, 3.9666748046875, 4.179931640625, 4.3931884765625, 4.6064453125, 4.8197021484375, 5.032958984375, 5.2462158203125, 5.45947265625, 5.6727294921875, 5.885986328125, 6.0992431640625, 6.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 11.0, 16.0, 27.0, 19.0, 22.0, 25.0, 22.0, 36.0, 39.0, 49.0, 44.0, 48.0, 56.0, 48.0, 46.0, 44.0, 37.0, 43.0, 42.0, 42.0, 44.0, 34.0, 23.0, 25.0, 15.0, 25.0, 21.0, 16.0, 4.0, 10.0, 12.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.3046875, -5.14898681640625, -4.9932861328125, -4.83758544921875, -4.681884765625, -4.52618408203125, -4.3704833984375, -4.21478271484375, -4.05908203125, -3.90338134765625, -3.7476806640625, -3.59197998046875, -3.436279296875, -3.28057861328125, -3.1248779296875, -2.96917724609375, -2.8134765625, -2.65777587890625, -2.5020751953125, -2.34637451171875, -2.190673828125, -2.03497314453125, -1.8792724609375, -1.72357177734375, -1.56787109375, -1.41217041015625, -1.2564697265625, -1.10076904296875, -0.945068359375, -0.78936767578125, -0.6336669921875, -0.47796630859375, -0.322265625, -0.16656494140625, -0.0108642578125, 0.14483642578125, 0.300537109375, 0.45623779296875, 0.6119384765625, 0.76763916015625, 0.92333984375, 1.07904052734375, 1.2347412109375, 1.39044189453125, 1.546142578125, 1.70184326171875, 1.8575439453125, 2.01324462890625, 2.1689453125, 2.32464599609375, 2.4803466796875, 2.63604736328125, 2.791748046875, 2.94744873046875, 3.1031494140625, 3.25885009765625, 3.41455078125, 3.57025146484375, 3.7259521484375, 3.88165283203125, 4.037353515625, 4.19305419921875, 4.3487548828125, 4.50445556640625, 4.66015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 14.0, 20.0, 23.0, 25.0, 69.0, 102.0, 153.0, 290.0, 663.0, 1721.0, 6887.0, 42876.0, 559776.0, 391368.0, 35843.0, 5926.0, 1536.0, 579.0, 267.0, 135.0, 95.0, 58.0, 30.0, 20.0, 14.0, 12.0, 6.0, 8.0, 0.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.00189208984375, -0.9647216796875, -0.92755126953125, -0.890380859375, -0.85321044921875, -0.8160400390625, -0.77886962890625, -0.74169921875, -0.70452880859375, -0.6673583984375, -0.63018798828125, -0.593017578125, -0.55584716796875, -0.5186767578125, -0.48150634765625, -0.4443359375, -0.40716552734375, -0.3699951171875, -0.33282470703125, -0.295654296875, -0.25848388671875, -0.2213134765625, -0.18414306640625, -0.14697265625, -0.10980224609375, -0.0726318359375, -0.03546142578125, 0.001708984375, 0.03887939453125, 0.0760498046875, 0.11322021484375, 0.150390625, 0.18756103515625, 0.2247314453125, 0.26190185546875, 0.299072265625, 0.33624267578125, 0.3734130859375, 0.41058349609375, 0.44775390625, 0.48492431640625, 0.5220947265625, 0.55926513671875, 0.596435546875, 0.63360595703125, 0.6707763671875, 0.70794677734375, 0.7451171875, 0.78228759765625, 0.8194580078125, 0.85662841796875, 0.893798828125, 0.93096923828125, 0.9681396484375, 1.00531005859375, 1.04248046875, 1.07965087890625, 1.1168212890625, 1.15399169921875, 1.191162109375, 1.22833251953125, 1.2655029296875, 1.30267333984375, 1.33984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 31.0, 27.0, 38.0, 66.0, 74.0, 120.0, 206.0, 123.0, 84.0, 43.0, 38.0, 29.0, 20.0, 13.0, 12.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015592575073242188, -0.0001504272222518921, -0.0001449286937713623, -0.00013943016529083252, -0.00013393163681030273, -0.00012843310832977295, -0.00012293457984924316, -0.00011743605136871338, -0.0001119375228881836, -0.00010643899440765381, -0.00010094046592712402, -9.544193744659424e-05, -8.994340896606445e-05, -8.444488048553467e-05, -7.894635200500488e-05, -7.34478235244751e-05, -6.794929504394531e-05, -6.245076656341553e-05, -5.695223808288574e-05, -5.145370960235596e-05, -4.595518112182617e-05, -4.045665264129639e-05, -3.49581241607666e-05, -2.9459595680236816e-05, -2.396106719970703e-05, -1.8462538719177246e-05, -1.2964010238647461e-05, -7.465481758117676e-06, -1.9669532775878906e-06, 3.5315752029418945e-06, 9.03010368347168e-06, 1.4528632164001465e-05, 2.002716064453125e-05, 2.5525689125061035e-05, 3.102421760559082e-05, 3.6522746086120605e-05, 4.202127456665039e-05, 4.7519803047180176e-05, 5.301833152770996e-05, 5.8516860008239746e-05, 6.401538848876953e-05, 6.951391696929932e-05, 7.50124454498291e-05, 8.051097393035889e-05, 8.600950241088867e-05, 9.150803089141846e-05, 9.700655937194824e-05, 0.00010250508785247803, 0.00010800361633300781, 0.0001135021448135376, 0.00011900067329406738, 0.00012449920177459717, 0.00012999773025512695, 0.00013549625873565674, 0.00014099478721618652, 0.0001464933156967163, 0.0001519918441772461, 0.00015749037265777588, 0.00016298890113830566, 0.00016848742961883545, 0.00017398595809936523, 0.00017948448657989502, 0.0001849830150604248, 0.0001904815435409546, 0.00019598007202148438]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 10.0, 4.0, 5.0, 16.0, 19.0, 19.0, 35.0, 86.0, 176.0, 510.0, 1764.0, 10758.0, 149510.0, 825689.0, 52930.0, 5290.0, 1093.0, 339.0, 151.0, 57.0, 33.0, 22.0, 13.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.4168701171875, -1.363037109375, -1.3092041015625, -1.25537109375, -1.2015380859375, -1.147705078125, -1.0938720703125, -1.0400390625, -0.9862060546875, -0.932373046875, -0.8785400390625, -0.82470703125, -0.7708740234375, -0.717041015625, -0.6632080078125, -0.609375, -0.5555419921875, -0.501708984375, -0.4478759765625, -0.39404296875, -0.3402099609375, -0.286376953125, -0.2325439453125, -0.1787109375, -0.1248779296875, -0.071044921875, -0.0172119140625, 0.03662109375, 0.0904541015625, 0.144287109375, 0.1981201171875, 0.251953125, 0.3057861328125, 0.359619140625, 0.4134521484375, 0.46728515625, 0.5211181640625, 0.574951171875, 0.6287841796875, 0.6826171875, 0.7364501953125, 0.790283203125, 0.8441162109375, 0.89794921875, 0.9517822265625, 1.005615234375, 1.0594482421875, 1.11328125, 1.1671142578125, 1.220947265625, 1.2747802734375, 1.32861328125, 1.3824462890625, 1.436279296875, 1.4901123046875, 1.5439453125, 1.5977783203125, 1.651611328125, 1.7054443359375, 1.75927734375, 1.8131103515625, 1.866943359375, 1.9207763671875, 1.974609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 8.0, 14.0, 16.0, 27.0, 47.0, 51.0, 91.0, 119.0, 196.0, 129.0, 95.0, 60.0, 46.0, 24.0, 20.0, 18.0, 12.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4609375, -0.44217681884765625, -0.4234161376953125, -0.40465545654296875, -0.385894775390625, -0.36713409423828125, -0.3483734130859375, -0.32961273193359375, -0.31085205078125, -0.29209136962890625, -0.2733306884765625, -0.25457000732421875, -0.235809326171875, -0.21704864501953125, -0.1982879638671875, -0.17952728271484375, -0.1607666015625, -0.14200592041015625, -0.1232452392578125, -0.10448455810546875, -0.085723876953125, -0.06696319580078125, -0.0482025146484375, -0.02944183349609375, -0.01068115234375, 0.00807952880859375, 0.0268402099609375, 0.04560089111328125, 0.064361572265625, 0.08312225341796875, 0.1018829345703125, 0.12064361572265625, 0.139404296875, 0.15816497802734375, 0.1769256591796875, 0.19568634033203125, 0.214447021484375, 0.23320770263671875, 0.2519683837890625, 0.27072906494140625, 0.28948974609375, 0.30825042724609375, 0.3270111083984375, 0.34577178955078125, 0.364532470703125, 0.38329315185546875, 0.4020538330078125, 0.42081451416015625, 0.4395751953125, 0.45833587646484375, 0.4770965576171875, 0.49585723876953125, 0.514617919921875, 0.5333786010742188, 0.5521392822265625, 0.5708999633789062, 0.58966064453125, 0.6084213256835938, 0.6271820068359375, 0.6459426879882812, 0.664703369140625, 0.6834640502929688, 0.7022247314453125, 0.7209854125976562, 0.73974609375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 13.0, 29.0, 119.0, 324.0, 331.0, 137.0, 33.0, 13.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.941051483154297, -31.231830596923828, -30.52260971069336, -29.81338882446289, -29.104167938232422, -28.394948959350586, -27.685728073120117, -26.97650718688965, -26.26728630065918, -25.55806541442871, -24.848844528198242, -24.139623641967773, -23.430404663085938, -22.72118377685547, -22.011962890625, -21.30274200439453, -20.593521118164062, -19.884300231933594, -19.175079345703125, -18.465858459472656, -17.756637573242188, -17.04741859436035, -16.338197708129883, -15.628976821899414, -14.919755935668945, -14.210535049438477, -13.501314163208008, -12.792094230651855, -12.082873344421387, -11.373652458190918, -10.664432525634766, -9.955211639404297, -9.245990753173828, -8.53676986694336, -7.827549457550049, -7.118329048156738, -6.4091081619262695, -5.699887275695801, -4.99066686630249, -4.28144645690918, -3.572225570678711, -2.8630049228668213, -2.1537842750549316, -1.444563627243042, -0.7353429794311523, -0.026122331619262695, 0.683098316192627, 1.3923187255859375, 2.1015396118164062, 2.810760259628296, 3.5199809074401855, 4.229201316833496, 4.938422203063965, 5.647643089294434, 6.356863498687744, 7.066083908081055, 7.775304794311523, 8.484525680541992, 9.193746566772461, 9.902966499328613, 10.612187385559082, 11.32140827178955, 12.030628204345703, 12.739849090576172, 13.44906997680664]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 13.0, 6.0, 14.0, 10.0, 18.0, 15.0, 24.0, 25.0, 26.0, 33.0, 26.0, 31.0, 37.0, 37.0, 31.0, 52.0, 39.0, 36.0, 44.0, 44.0, 43.0, 44.0, 30.0, 40.0, 28.0, 28.0, 30.0, 18.0, 27.0, 15.0, 20.0, 19.0, 15.0, 14.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.344343185424805, -8.106801986694336, -7.869259834289551, -7.631718158721924, -7.394176483154297, -7.156635284423828, -6.919093132019043, -6.681551933288574, -6.444010257720947, -6.20646858215332, -5.968926906585693, -5.731385231018066, -5.4938435554504395, -5.2563018798828125, -5.018760681152344, -4.781219005584717, -4.54367733001709, -4.306135654449463, -4.068593978881836, -3.831052303314209, -3.593510866165161, -3.355969190597534, -3.1184275150299072, -2.8808860778808594, -2.643343925476074, -2.4058022499084473, -2.1682605743408203, -1.930719017982483, -1.6931774616241455, -1.4556357860565186, -1.2180941104888916, -0.9805525541305542, -0.7430109977722168, -0.5054693818092346, -0.26792773604393005, -0.03038609027862549, 0.2071555256843567, 0.44469714164733887, 0.6822388172149658, 0.9197803735733032, 1.1573220491409302, 1.3948637247085571, 1.6324052810668945, 1.8699469566345215, 2.1074886322021484, 2.3450303077697754, 2.5825719833374023, 2.82011342048645, 3.057655096054077, 3.295196771621704, 3.532738447189331, 3.770279884338379, 4.007821559906006, 4.245363235473633, 4.48290491104126, 4.720446586608887, 4.957988262176514, 5.195529937744141, 5.433071613311768, 5.6706132888793945, 5.9081549644470215, 6.145696640014648, 6.383237838745117, 6.620779514312744, 6.858321189880371]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 8.0, 15.0, 16.0, 20.0, 26.0, 36.0, 51.0, 56.0, 68.0, 97.0, 144.0, 195.0, 342.0, 600.0, 1406.0, 3536.0, 12440.0, 68072.0, 1622412.0, 2382369.0, 80353.0, 14476.0, 4140.0, 1488.0, 737.0, 363.0, 243.0, 149.0, 111.0, 65.0, 63.0, 33.0, 28.0, 27.0, 22.0, 9.0, 12.0, 8.0, 9.0, 5.0, 5.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.1112060546875, -3.964599609375, -3.8179931640625, -3.67138671875, -3.5247802734375, -3.378173828125, -3.2315673828125, -3.0849609375, -2.9383544921875, -2.791748046875, -2.6451416015625, -2.49853515625, -2.3519287109375, -2.205322265625, -2.0587158203125, -1.912109375, -1.7655029296875, -1.618896484375, -1.4722900390625, -1.32568359375, -1.1790771484375, -1.032470703125, -0.8858642578125, -0.7392578125, -0.5926513671875, -0.446044921875, -0.2994384765625, -0.15283203125, -0.0062255859375, 0.140380859375, 0.2869873046875, 0.43359375, 0.5802001953125, 0.726806640625, 0.8734130859375, 1.02001953125, 1.1666259765625, 1.313232421875, 1.4598388671875, 1.6064453125, 1.7530517578125, 1.899658203125, 2.0462646484375, 2.19287109375, 2.3394775390625, 2.486083984375, 2.6326904296875, 2.779296875, 2.9259033203125, 3.072509765625, 3.2191162109375, 3.36572265625, 3.5123291015625, 3.658935546875, 3.8055419921875, 3.9521484375, 4.0987548828125, 4.245361328125, 4.3919677734375, 4.53857421875, 4.6851806640625, 4.831787109375, 4.9783935546875, 5.125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 10.0, 9.0, 14.0, 18.0, 26.0, 28.0, 57.0, 56.0, 56.0, 71.0, 88.0, 88.0, 80.0, 78.0, 68.0, 57.0, 52.0, 29.0, 32.0, 17.0, 21.0, 7.0, 12.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.115234375, -3.030364990234375, -2.94549560546875, -2.860626220703125, -2.7757568359375, -2.690887451171875, -2.60601806640625, -2.521148681640625, -2.436279296875, -2.351409912109375, -2.26654052734375, -2.181671142578125, -2.0968017578125, -2.011932373046875, -1.92706298828125, -1.842193603515625, -1.75732421875, -1.672454833984375, -1.58758544921875, -1.502716064453125, -1.4178466796875, -1.332977294921875, -1.24810791015625, -1.163238525390625, -1.078369140625, -0.993499755859375, -0.90863037109375, -0.823760986328125, -0.7388916015625, -0.654022216796875, -0.56915283203125, -0.484283447265625, -0.3994140625, -0.314544677734375, -0.22967529296875, -0.144805908203125, -0.0599365234375, 0.024932861328125, 0.10980224609375, 0.194671630859375, 0.279541015625, 0.364410400390625, 0.44927978515625, 0.534149169921875, 0.6190185546875, 0.703887939453125, 0.78875732421875, 0.873626708984375, 0.95849609375, 1.043365478515625, 1.12823486328125, 1.213104248046875, 1.2979736328125, 1.382843017578125, 1.46771240234375, 1.552581787109375, 1.637451171875, 1.722320556640625, 1.80718994140625, 1.892059326171875, 1.9769287109375, 2.061798095703125, 2.14666748046875, 2.231536865234375, 2.31640625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 10.0, 8.0, 23.0, 23.0, 52.0, 78.0, 89.0, 199.0, 467.0, 1752.0, 13068.0, 423458.0, 3698368.0, 50967.0, 4186.0, 827.0, 296.0, 151.0, 78.0, 51.0, 41.0, 31.0, 13.0, 12.0, 8.0, 7.0, 9.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.5703125, -10.29388427734375, -10.0174560546875, -9.74102783203125, -9.464599609375, -9.18817138671875, -8.9117431640625, -8.63531494140625, -8.35888671875, -8.08245849609375, -7.8060302734375, -7.52960205078125, -7.253173828125, -6.97674560546875, -6.7003173828125, -6.42388916015625, -6.1474609375, -5.87103271484375, -5.5946044921875, -5.31817626953125, -5.041748046875, -4.76531982421875, -4.4888916015625, -4.21246337890625, -3.93603515625, -3.65960693359375, -3.3831787109375, -3.10675048828125, -2.830322265625, -2.55389404296875, -2.2774658203125, -2.00103759765625, -1.724609375, -1.44818115234375, -1.1717529296875, -0.89532470703125, -0.618896484375, -0.34246826171875, -0.0660400390625, 0.21038818359375, 0.48681640625, 0.76324462890625, 1.0396728515625, 1.31610107421875, 1.592529296875, 1.86895751953125, 2.1453857421875, 2.42181396484375, 2.6982421875, 2.97467041015625, 3.2510986328125, 3.52752685546875, 3.803955078125, 4.08038330078125, 4.3568115234375, 4.63323974609375, 4.90966796875, 5.18609619140625, 5.4625244140625, 5.73895263671875, 6.015380859375, 6.29180908203125, 6.5682373046875, 6.84466552734375, 7.12109375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 2.0, 9.0, 11.0, 13.0, 19.0, 25.0, 25.0, 39.0, 49.0, 70.0, 108.0, 150.0, 235.0, 363.0, 579.0, 749.0, 525.0, 329.0, 221.0, 155.0, 108.0, 76.0, 52.0, 41.0, 27.0, 22.0, 19.0, 12.0, 8.0, 6.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.16015625, -1.1254730224609375, -1.090789794921875, -1.0561065673828125, -1.02142333984375, -0.9867401123046875, -0.952056884765625, -0.9173736572265625, -0.8826904296875, -0.8480072021484375, -0.813323974609375, -0.7786407470703125, -0.74395751953125, -0.7092742919921875, -0.674591064453125, -0.6399078369140625, -0.605224609375, -0.5705413818359375, -0.535858154296875, -0.5011749267578125, -0.46649169921875, -0.4318084716796875, -0.397125244140625, -0.3624420166015625, -0.3277587890625, -0.2930755615234375, -0.258392333984375, -0.2237091064453125, -0.18902587890625, -0.1543426513671875, -0.119659423828125, -0.0849761962890625, -0.05029296875, -0.0156097412109375, 0.019073486328125, 0.0537567138671875, 0.08843994140625, 0.1231231689453125, 0.157806396484375, 0.1924896240234375, 0.2271728515625, 0.2618560791015625, 0.296539306640625, 0.3312225341796875, 0.36590576171875, 0.4005889892578125, 0.435272216796875, 0.4699554443359375, 0.504638671875, 0.5393218994140625, 0.574005126953125, 0.6086883544921875, 0.64337158203125, 0.6780548095703125, 0.712738037109375, 0.7474212646484375, 0.7821044921875, 0.8167877197265625, 0.851470947265625, 0.8861541748046875, 0.92083740234375, 0.9555206298828125, 0.990203857421875, 1.0248870849609375, 1.0595703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 11.0, 10.0, 17.0, 27.0, 21.0, 36.0, 46.0, 61.0, 77.0, 81.0, 70.0, 81.0, 83.0, 71.0, 80.0, 59.0, 38.0, 25.0, 20.0, 18.0, 16.0, 16.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.030686855316162, -3.9129021167755127, -3.7951176166534424, -3.677332878112793, -3.5595483779907227, -3.4417636394500732, -3.323978900909424, -3.2061944007873535, -3.088409662246704, -2.9706249237060547, -2.8528404235839844, -2.735055685043335, -2.6172709465026855, -2.4994864463806152, -2.381701707839966, -2.2639169692993164, -2.146132469177246, -2.0283477306365967, -1.9105632305145264, -1.792778491973877, -1.674993872642517, -1.5572092533111572, -1.4394245147705078, -1.321639895439148, -1.203855276107788, -1.0860706567764282, -0.9682859778404236, -0.850501298904419, -0.7327166795730591, -0.6149320602416992, -0.4971473813056946, -0.37936270236968994, -0.261577844619751, -0.14379319548606873, -0.026008546352386475, 0.09177610278129578, 0.20956075191497803, 0.3273453712463379, 0.44513005018234253, 0.5629147291183472, 0.680699348449707, 0.7984839677810669, 0.9162686467170715, 1.0340533256530762, 1.151837944984436, 1.269622564315796, 1.3874073028564453, 1.5051919221878052, 1.622976541519165, 1.740761160850525, 1.8585457801818848, 1.9763305187225342, 2.0941152572631836, 2.211899757385254, 2.3296844959259033, 2.4474692344665527, 2.565253734588623, 2.6830384731292725, 2.8008229732513428, 2.918607711791992, 3.0363922119140625, 3.154176950454712, 3.2719616889953613, 3.3897461891174316, 3.507530927658081]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 4.0, 7.0, 11.0, 13.0, 13.0, 24.0, 26.0, 26.0, 22.0, 35.0, 39.0, 32.0, 57.0, 44.0, 49.0, 37.0, 42.0, 48.0, 47.0, 46.0, 46.0, 39.0, 36.0, 22.0, 39.0, 35.0, 24.0, 36.0, 15.0, 18.0, 10.0, 15.0, 9.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8297390937805176, -2.747905731201172, -2.6660726070404053, -2.5842392444610596, -2.502406120300293, -2.4205727577209473, -2.3387393951416016, -2.256906032562256, -2.1750729084014893, -2.0932395458221436, -2.011406421661377, -1.9295730590820312, -1.847739815711975, -1.765906572341919, -1.6840732097625732, -1.602239966392517, -1.520406723022461, -1.4385734796524048, -1.3567402362823486, -1.274906873703003, -1.1930736303329468, -1.1112403869628906, -1.029407024383545, -0.9475737810134888, -0.8657405376434326, -0.7839072942733765, -0.7020739912986755, -0.6202406883239746, -0.5384074449539185, -0.4565741717815399, -0.3747408986091614, -0.29290759563446045, -0.2110745906829834, -0.12924131751060486, -0.04740804433822632, 0.03442522883415222, 0.11625850200653076, 0.1980917751789093, 0.27992504835128784, 0.36175835132598877, 0.4435915946960449, 0.5254248380661011, 0.607258141040802, 0.6890914440155029, 0.7709246873855591, 0.8527579307556152, 0.9345912337303162, 1.016424536705017, 1.0982577800750732, 1.1800910234451294, 1.2619242668151855, 1.3437576293945312, 1.4255908727645874, 1.5074241161346436, 1.5892574787139893, 1.6710907220840454, 1.7529239654541016, 1.8347572088241577, 1.9165904521942139, 1.9984238147735596, 2.080256938934326, 2.162090301513672, 2.2439236640930176, 2.3257570266723633, 2.40759015083313]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 8.0, 15.0, 14.0, 11.0, 28.0, 43.0, 73.0, 92.0, 147.0, 216.0, 453.0, 1133.0, 3461.0, 15577.0, 163361.0, 770657.0, 79017.0, 9986.0, 2393.0, 862.0, 418.0, 219.0, 129.0, 74.0, 44.0, 35.0, 20.0, 18.0, 10.0, 10.0, 5.0, 7.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6796875, -0.6614990234375, -0.643310546875, -0.6251220703125, -0.60693359375, -0.5887451171875, -0.570556640625, -0.5523681640625, -0.5341796875, -0.5159912109375, -0.497802734375, -0.4796142578125, -0.46142578125, -0.4432373046875, -0.425048828125, -0.4068603515625, -0.388671875, -0.3704833984375, -0.352294921875, -0.3341064453125, -0.31591796875, -0.2977294921875, -0.279541015625, -0.2613525390625, -0.2431640625, -0.2249755859375, -0.206787109375, -0.1885986328125, -0.17041015625, -0.1522216796875, -0.134033203125, -0.1158447265625, -0.09765625, -0.0794677734375, -0.061279296875, -0.0430908203125, -0.02490234375, -0.0067138671875, 0.011474609375, 0.0296630859375, 0.0478515625, 0.0660400390625, 0.084228515625, 0.1024169921875, 0.12060546875, 0.1387939453125, 0.156982421875, 0.1751708984375, 0.193359375, 0.2115478515625, 0.229736328125, 0.2479248046875, 0.26611328125, 0.2843017578125, 0.302490234375, 0.3206787109375, 0.3388671875, 0.3570556640625, 0.375244140625, 0.3934326171875, 0.41162109375, 0.4298095703125, 0.447998046875, 0.4661865234375, 0.484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 9.0, 14.0, 16.0, 20.0, 27.0, 31.0, 35.0, 39.0, 40.0, 70.0, 61.0, 57.0, 57.0, 53.0, 49.0, 49.0, 56.0, 42.0, 39.0, 52.0, 39.0, 34.0, 25.0, 19.0, 11.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.375, -2.3097686767578125, -2.244537353515625, -2.1793060302734375, -2.11407470703125, -2.0488433837890625, -1.983612060546875, -1.9183807373046875, -1.8531494140625, -1.7879180908203125, -1.722686767578125, -1.6574554443359375, -1.59222412109375, -1.5269927978515625, -1.461761474609375, -1.3965301513671875, -1.331298828125, -1.2660675048828125, -1.200836181640625, -1.1356048583984375, -1.07037353515625, -1.0051422119140625, -0.939910888671875, -0.8746795654296875, -0.8094482421875, -0.7442169189453125, -0.678985595703125, -0.6137542724609375, -0.54852294921875, -0.4832916259765625, -0.418060302734375, -0.3528289794921875, -0.28759765625, -0.2223663330078125, -0.157135009765625, -0.0919036865234375, -0.02667236328125, 0.0385589599609375, 0.103790283203125, 0.1690216064453125, 0.2342529296875, 0.2994842529296875, 0.364715576171875, 0.4299468994140625, 0.49517822265625, 0.5604095458984375, 0.625640869140625, 0.6908721923828125, 0.756103515625, 0.8213348388671875, 0.886566162109375, 0.9517974853515625, 1.01702880859375, 1.0822601318359375, 1.147491455078125, 1.2127227783203125, 1.2779541015625, 1.3431854248046875, 1.408416748046875, 1.4736480712890625, 1.53887939453125, 1.6041107177734375, 1.669342041015625, 1.7345733642578125, 1.7998046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 2.0, 12.0, 17.0, 19.0, 20.0, 22.0, 42.0, 43.0, 71.0, 104.0, 124.0, 186.0, 247.0, 421.0, 649.0, 1958.0, 16362.0, 364427.0, 628969.0, 29768.0, 2769.0, 805.0, 482.0, 269.0, 222.0, 144.0, 105.0, 76.0, 61.0, 44.0, 22.0, 17.0, 15.0, 13.0, 9.0, 8.0, 6.0, 2.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40625, -0.3927574157714844, -0.37926483154296875, -0.3657722473144531, -0.3522796630859375, -0.3387870788574219, -0.32529449462890625, -0.3118019104003906, -0.298309326171875, -0.2848167419433594, -0.27132415771484375, -0.2578315734863281, -0.2443389892578125, -0.23084640502929688, -0.21735382080078125, -0.20386123657226562, -0.19036865234375, -0.17687606811523438, -0.16338348388671875, -0.14989089965820312, -0.1363983154296875, -0.12290573120117188, -0.10941314697265625, -0.09592056274414062, -0.082427978515625, -0.06893539428710938, -0.05544281005859375, -0.041950225830078125, -0.0284576416015625, -0.014965057373046875, -0.00147247314453125, 0.012020111083984375, 0.0255126953125, 0.039005279541015625, 0.05249786376953125, 0.06599044799804688, 0.0794830322265625, 0.09297561645507812, 0.10646820068359375, 0.11996078491210938, 0.133453369140625, 0.14694595336914062, 0.16043853759765625, 0.17393112182617188, 0.1874237060546875, 0.20091629028320312, 0.21440887451171875, 0.22790145874023438, 0.24139404296875, 0.2548866271972656, 0.26837921142578125, 0.2818717956542969, 0.2953643798828125, 0.3088569641113281, 0.32234954833984375, 0.3358421325683594, 0.349334716796875, 0.3628273010253906, 0.37631988525390625, 0.3898124694824219, 0.4033050537109375, 0.4167976379394531, 0.43029022216796875, 0.4437828063964844, 0.457275390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 16.0, 13.0, 13.0, 11.0, 15.0, 10.0, 26.0, 20.0, 22.0, 27.0, 34.0, 38.0, 44.0, 46.0, 56.0, 46.0, 53.0, 44.0, 50.0, 52.0, 38.0, 39.0, 34.0, 27.0, 31.0, 31.0, 24.0, 20.0, 19.0, 18.0, 12.0, 10.0, 8.0, 6.0, 8.0, 6.0, 2.0, 4.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.11328125, -3.012359619140625, -2.91143798828125, -2.810516357421875, -2.7095947265625, -2.608673095703125, -2.50775146484375, -2.406829833984375, -2.305908203125, -2.204986572265625, -2.10406494140625, -2.003143310546875, -1.9022216796875, -1.801300048828125, -1.70037841796875, -1.599456787109375, -1.49853515625, -1.397613525390625, -1.29669189453125, -1.195770263671875, -1.0948486328125, -0.993927001953125, -0.89300537109375, -0.792083740234375, -0.691162109375, -0.590240478515625, -0.48931884765625, -0.388397216796875, -0.2874755859375, -0.186553955078125, -0.08563232421875, 0.015289306640625, 0.1162109375, 0.217132568359375, 0.31805419921875, 0.418975830078125, 0.5198974609375, 0.620819091796875, 0.72174072265625, 0.822662353515625, 0.923583984375, 1.024505615234375, 1.12542724609375, 1.226348876953125, 1.3272705078125, 1.428192138671875, 1.52911376953125, 1.630035400390625, 1.73095703125, 1.831878662109375, 1.93280029296875, 2.033721923828125, 2.1346435546875, 2.235565185546875, 2.33648681640625, 2.437408447265625, 2.538330078125, 2.639251708984375, 2.74017333984375, 2.841094970703125, 2.9420166015625, 3.042938232421875, 3.14385986328125, 3.244781494140625, 3.345703125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 7.0, 11.0, 23.0, 13.0, 30.0, 33.0, 43.0, 73.0, 79.0, 101.0, 129.0, 188.0, 337.0, 758.0, 3397.0, 48043.0, 957843.0, 32812.0, 2943.0, 698.0, 271.0, 176.0, 137.0, 100.0, 70.0, 48.0, 42.0, 27.0, 24.0, 18.0, 15.0, 11.0, 5.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1070556640625, -0.10385417938232422, -0.10065269470214844, -0.09745121002197266, -0.09424972534179688, -0.0910482406616211, -0.08784675598144531, -0.08464527130126953, -0.08144378662109375, -0.07824230194091797, -0.07504081726074219, -0.0718393325805664, -0.06863784790039062, -0.06543636322021484, -0.06223487854003906, -0.05903339385986328, -0.0558319091796875, -0.05263042449951172, -0.04942893981933594, -0.046227455139160156, -0.043025970458984375, -0.039824485778808594, -0.03662300109863281, -0.03342151641845703, -0.03022003173828125, -0.02701854705810547, -0.023817062377929688, -0.020615577697753906, -0.017414093017578125, -0.014212608337402344, -0.011011123657226562, -0.007809638977050781, -0.004608154296875, -0.0014066696166992188, 0.0017948150634765625, 0.004996299743652344, 0.008197784423828125, 0.011399269104003906, 0.014600753784179688, 0.01780223846435547, 0.02100372314453125, 0.02420520782470703, 0.027406692504882812, 0.030608177185058594, 0.033809661865234375, 0.037011146545410156, 0.04021263122558594, 0.04341411590576172, 0.0466156005859375, 0.04981708526611328, 0.05301856994628906, 0.056220054626464844, 0.059421539306640625, 0.0626230239868164, 0.06582450866699219, 0.06902599334716797, 0.07222747802734375, 0.07542896270751953, 0.07863044738769531, 0.0818319320678711, 0.08503341674804688, 0.08823490142822266, 0.09143638610839844, 0.09463787078857422, 0.09783935546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 3.0, 8.0, 12.0, 16.0, 12.0, 29.0, 46.0, 65.0, 99.0, 135.0, 145.0, 123.0, 92.0, 57.0, 51.0, 25.0, 17.0, 15.0, 10.0, 5.0, 6.0, 6.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.286823630332947e-05, -3.1463801860809326e-05, -3.0059367418289185e-05, -2.8654932975769043e-05, -2.72504985332489e-05, -2.584606409072876e-05, -2.4441629648208618e-05, -2.3037195205688477e-05, -2.1632760763168335e-05, -2.0228326320648193e-05, -1.8823891878128052e-05, -1.741945743560791e-05, -1.601502299308777e-05, -1.4610588550567627e-05, -1.3206154108047485e-05, -1.1801719665527344e-05, -1.0397285223007202e-05, -8.99285078048706e-06, -7.588416337966919e-06, -6.183981895446777e-06, -4.779547452926636e-06, -3.375113010406494e-06, -1.9706785678863525e-06, -5.662441253662109e-07, 8.381903171539307e-07, 2.2426247596740723e-06, 3.647059202194214e-06, 5.0514936447143555e-06, 6.455928087234497e-06, 7.860362529754639e-06, 9.26479697227478e-06, 1.0669231414794922e-05, 1.2073665857315063e-05, 1.3478100299835205e-05, 1.4882534742355347e-05, 1.6286969184875488e-05, 1.769140362739563e-05, 1.909583806991577e-05, 2.0500272512435913e-05, 2.1904706954956055e-05, 2.3309141397476196e-05, 2.4713575839996338e-05, 2.611801028251648e-05, 2.752244472503662e-05, 2.8926879167556763e-05, 3.0331313610076904e-05, 3.1735748052597046e-05, 3.314018249511719e-05, 3.454461693763733e-05, 3.594905138015747e-05, 3.735348582267761e-05, 3.8757920265197754e-05, 4.0162354707717896e-05, 4.156678915023804e-05, 4.297122359275818e-05, 4.437565803527832e-05, 4.578009247779846e-05, 4.7184526920318604e-05, 4.8588961362838745e-05, 4.999339580535889e-05, 5.139783024787903e-05, 5.280226469039917e-05, 5.420669913291931e-05, 5.561113357543945e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 15.0, 20.0, 32.0, 38.0, 58.0, 98.0, 107.0, 169.0, 270.0, 394.0, 591.0, 950.0, 1776.0, 3961.0, 11438.0, 49538.0, 733485.0, 206628.0, 25215.0, 7246.0, 2778.0, 1416.0, 805.0, 462.0, 333.0, 204.0, 159.0, 113.0, 71.0, 53.0, 28.0, 23.0, 12.0, 14.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.0985250473022461, -0.09542655944824219, -0.09232807159423828, -0.08922958374023438, -0.08613109588623047, -0.08303260803222656, -0.07993412017822266, -0.07683563232421875, -0.07373714447021484, -0.07063865661621094, -0.06754016876220703, -0.06444168090820312, -0.06134319305419922, -0.05824470520019531, -0.055146217346191406, -0.0520477294921875, -0.048949241638183594, -0.04585075378417969, -0.04275226593017578, -0.039653778076171875, -0.03655529022216797, -0.03345680236816406, -0.030358314514160156, -0.02725982666015625, -0.024161338806152344, -0.021062850952148438, -0.01796436309814453, -0.014865875244140625, -0.011767387390136719, -0.008668899536132812, -0.005570411682128906, -0.002471923828125, 0.0006265640258789062, 0.0037250518798828125, 0.006823539733886719, 0.009922027587890625, 0.013020515441894531, 0.016119003295898438, 0.019217491149902344, 0.02231597900390625, 0.025414466857910156, 0.028512954711914062, 0.03161144256591797, 0.034709930419921875, 0.03780841827392578, 0.04090690612792969, 0.044005393981933594, 0.0471038818359375, 0.050202369689941406, 0.05330085754394531, 0.05639934539794922, 0.059497833251953125, 0.06259632110595703, 0.06569480895996094, 0.06879329681396484, 0.07189178466796875, 0.07499027252197266, 0.07808876037597656, 0.08118724822998047, 0.08428573608398438, 0.08738422393798828, 0.09048271179199219, 0.0935811996459961, 0.0966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 13.0, 9.0, 19.0, 19.0, 28.0, 44.0, 73.0, 150.0, 313.0, 124.0, 73.0, 40.0, 20.0, 23.0, 10.0, 11.0, 6.0, 7.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.020904541015625, -0.020277976989746094, -0.019651412963867188, -0.01902484893798828, -0.018398284912109375, -0.01777172088623047, -0.017145156860351562, -0.016518592834472656, -0.01589202880859375, -0.015265464782714844, -0.014638900756835938, -0.014012336730957031, -0.013385772705078125, -0.012759208679199219, -0.012132644653320312, -0.011506080627441406, -0.0108795166015625, -0.010252952575683594, -0.009626388549804688, -0.008999824523925781, -0.008373260498046875, -0.007746696472167969, -0.0071201324462890625, -0.006493568420410156, -0.00586700439453125, -0.005240440368652344, -0.0046138763427734375, -0.003987312316894531, -0.003360748291015625, -0.0027341842651367188, -0.0021076202392578125, -0.0014810562133789062, -0.0008544921875, -0.00022792816162109375, 0.0003986358642578125, 0.0010251998901367188, 0.001651763916015625, 0.0022783279418945312, 0.0029048919677734375, 0.0035314559936523438, 0.00415802001953125, 0.004784584045410156, 0.0054111480712890625, 0.006037712097167969, 0.006664276123046875, 0.007290840148925781, 0.007917404174804688, 0.008543968200683594, 0.0091705322265625, 0.009797096252441406, 0.010423660278320312, 0.011050224304199219, 0.011676788330078125, 0.012303352355957031, 0.012929916381835938, 0.013556480407714844, 0.01418304443359375, 0.014809608459472656, 0.015436172485351562, 0.01606273651123047, 0.016689300537109375, 0.01731586456298828, 0.017942428588867188, 0.018568992614746094, 0.019195556640625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 4.0, 7.0, 10.0, 12.0, 15.0, 19.0, 24.0, 26.0, 40.0, 60.0, 73.0, 71.0, 67.0, 82.0, 84.0, 73.0, 78.0, 69.0, 43.0, 36.0, 16.0, 20.0, 14.0, 15.0, 11.0, 11.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5374808311462402, -2.4661457538604736, -2.394810438156128, -2.3234753608703613, -2.2521400451660156, -2.180804967880249, -2.1094696521759033, -2.0381345748901367, -1.9667993783950806, -1.8954641819000244, -1.8241289854049683, -1.752793788909912, -1.6814587116241455, -1.6101233959197998, -1.5387883186340332, -1.467453122138977, -1.396117925643921, -1.3247827291488647, -1.2534475326538086, -1.1821123361587524, -1.1107771396636963, -1.0394420623779297, -0.9681068658828735, -0.8967716693878174, -0.8254364728927612, -0.7541012763977051, -0.6827660799026489, -0.6114309430122375, -0.5400957465171814, -0.46876055002212524, -0.3974253833293915, -0.3260902166366577, -0.25475478172302246, -0.1834196001291275, -0.11208441853523254, -0.040749236941337585, 0.030585944652557373, 0.10192114114761353, 0.1732563078403473, 0.24459147453308105, 0.3159266710281372, 0.38726186752319336, 0.4585970342159271, 0.5299322009086609, 0.601267397403717, 0.6726025938987732, 0.7439377307891846, 0.8152729272842407, 0.8866081237792969, 0.957943320274353, 1.0292785167694092, 1.1006137132644653, 1.1719489097595215, 1.243283987045288, 1.3146191835403442, 1.3859543800354004, 1.4572895765304565, 1.5286247730255127, 1.5999599695205688, 1.671295166015625, 1.7426302433013916, 1.8139655590057373, 1.885300636291504, 1.95663583278656, 2.027971029281616]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 11.0, 6.0, 9.0, 13.0, 16.0, 20.0, 31.0, 28.0, 28.0, 46.0, 48.0, 49.0, 55.0, 55.0, 38.0, 51.0, 55.0, 52.0, 59.0, 40.0, 34.0, 37.0, 35.0, 28.0, 40.0, 24.0, 20.0, 14.0, 13.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.021963596343994, -1.965125560760498, -1.908287525177002, -1.8514493703842163, -1.7946113348007202, -1.7377732992172241, -1.680935263633728, -1.6240971088409424, -1.5672590732574463, -1.5104210376739502, -1.453583002090454, -1.3967448472976685, -1.3399068117141724, -1.2830687761306763, -1.2262307405471802, -1.1693925857543945, -1.1125545501708984, -1.0557165145874023, -0.9988784193992615, -0.9420403838157654, -0.8852022886276245, -0.8283642530441284, -0.7715262174606323, -0.7146881222724915, -0.6578501462936401, -0.601012110710144, -0.5441740155220032, -0.4873359799385071, -0.4304978847503662, -0.3736598491668701, -0.31682178378105164, -0.25998371839523315, -0.20314562320709229, -0.1463075578212738, -0.08946949988603592, -0.032631441950798035, 0.024206623435020447, 0.08104467391967773, 0.13788273930549622, 0.1947208046913147, 0.2515588700771332, 0.30839693546295166, 0.36523500084877014, 0.4220730662345886, 0.4789111018180847, 0.5357491970062256, 0.5925872325897217, 0.6494252681732178, 0.7062633633613586, 0.7631013989448547, 0.8199394941329956, 0.8767775297164917, 0.9336156249046326, 0.9904536604881287, 1.0472917556762695, 1.1041297912597656, 1.1609678268432617, 1.2178058624267578, 1.274643898010254, 1.3314820528030396, 1.3883200883865356, 1.4451581239700317, 1.5019961595535278, 1.5588343143463135, 1.6156723499298096]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 10.0, 12.0, 23.0, 34.0, 54.0, 81.0, 134.0, 217.0, 370.0, 702.0, 1362.0, 2771.0, 5869.0, 13882.0, 34635.0, 95545.0, 393401.0, 354280.0, 88529.0, 32467.0, 13193.0, 5569.0, 2573.0, 1231.0, 683.0, 377.0, 206.0, 128.0, 77.0, 47.0, 37.0, 18.0, 12.0, 6.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.3515625, -3.269744873046875, -3.18792724609375, -3.106109619140625, -3.0242919921875, -2.942474365234375, -2.86065673828125, -2.778839111328125, -2.697021484375, -2.615203857421875, -2.53338623046875, -2.451568603515625, -2.3697509765625, -2.287933349609375, -2.20611572265625, -2.124298095703125, -2.04248046875, -1.960662841796875, -1.87884521484375, -1.797027587890625, -1.7152099609375, -1.633392333984375, -1.55157470703125, -1.469757080078125, -1.387939453125, -1.306121826171875, -1.22430419921875, -1.142486572265625, -1.0606689453125, -0.978851318359375, -0.89703369140625, -0.815216064453125, -0.7333984375, -0.651580810546875, -0.56976318359375, -0.487945556640625, -0.4061279296875, -0.324310302734375, -0.24249267578125, -0.160675048828125, -0.078857421875, 0.002960205078125, 0.08477783203125, 0.166595458984375, 0.2484130859375, 0.330230712890625, 0.41204833984375, 0.493865966796875, 0.57568359375, 0.657501220703125, 0.73931884765625, 0.821136474609375, 0.9029541015625, 0.984771728515625, 1.06658935546875, 1.148406982421875, 1.230224609375, 1.312042236328125, 1.39385986328125, 1.475677490234375, 1.5574951171875, 1.639312744140625, 1.72113037109375, 1.802947998046875, 1.884765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 12.0, 9.0, 15.0, 20.0, 20.0, 29.0, 38.0, 43.0, 47.0, 59.0, 50.0, 67.0, 75.0, 54.0, 65.0, 60.0, 45.0, 48.0, 36.0, 36.0, 42.0, 16.0, 22.0, 18.0, 12.0, 8.0, 8.0, 11.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.57232666015625, -4.4337158203125, -4.29510498046875, -4.156494140625, -4.01788330078125, -3.8792724609375, -3.74066162109375, -3.60205078125, -3.46343994140625, -3.3248291015625, -3.18621826171875, -3.047607421875, -2.90899658203125, -2.7703857421875, -2.63177490234375, -2.4931640625, -2.35455322265625, -2.2159423828125, -2.07733154296875, -1.938720703125, -1.80010986328125, -1.6614990234375, -1.52288818359375, -1.38427734375, -1.24566650390625, -1.1070556640625, -0.96844482421875, -0.829833984375, -0.69122314453125, -0.5526123046875, -0.41400146484375, -0.275390625, -0.13677978515625, 0.0018310546875, 0.14044189453125, 0.279052734375, 0.41766357421875, 0.5562744140625, 0.69488525390625, 0.83349609375, 0.97210693359375, 1.1107177734375, 1.24932861328125, 1.387939453125, 1.52655029296875, 1.6651611328125, 1.80377197265625, 1.9423828125, 2.08099365234375, 2.2196044921875, 2.35821533203125, 2.496826171875, 2.63543701171875, 2.7740478515625, 2.91265869140625, 3.05126953125, 3.18988037109375, 3.3284912109375, 3.46710205078125, 3.605712890625, 3.74432373046875, 3.8829345703125, 4.02154541015625, 4.16015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 10.0, 7.0, 12.0, 21.0, 31.0, 42.0, 89.0, 164.0, 336.0, 861.0, 3169.0, 16124.0, 107810.0, 764585.0, 130658.0, 19225.0, 3662.0, 992.0, 320.0, 159.0, 96.0, 59.0, 33.0, 24.0, 14.0, 9.0, 7.0, 8.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.22314453125, -4.0751953125, -3.92724609375, -3.779296875, -3.63134765625, -3.4833984375, -3.33544921875, -3.1875, -3.03955078125, -2.8916015625, -2.74365234375, -2.595703125, -2.44775390625, -2.2998046875, -2.15185546875, -2.00390625, -1.85595703125, -1.7080078125, -1.56005859375, -1.412109375, -1.26416015625, -1.1162109375, -0.96826171875, -0.8203125, -0.67236328125, -0.5244140625, -0.37646484375, -0.228515625, -0.08056640625, 0.0673828125, 0.21533203125, 0.36328125, 0.51123046875, 0.6591796875, 0.80712890625, 0.955078125, 1.10302734375, 1.2509765625, 1.39892578125, 1.546875, 1.69482421875, 1.8427734375, 1.99072265625, 2.138671875, 2.28662109375, 2.4345703125, 2.58251953125, 2.73046875, 2.87841796875, 3.0263671875, 3.17431640625, 3.322265625, 3.47021484375, 3.6181640625, 3.76611328125, 3.9140625, 4.06201171875, 4.2099609375, 4.35791015625, 4.505859375, 4.65380859375, 4.8017578125, 4.94970703125, 5.09765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 8.0, 5.0, 3.0, 5.0, 10.0, 12.0, 15.0, 19.0, 19.0, 29.0, 20.0, 24.0, 32.0, 32.0, 38.0, 34.0, 37.0, 41.0, 45.0, 45.0, 45.0, 35.0, 50.0, 40.0, 41.0, 50.0, 44.0, 35.0, 23.0, 25.0, 20.0, 30.0, 14.0, 10.0, 12.0, 11.0, 3.0, 12.0, 6.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0], "bins": [-4.8984375, -4.76483154296875, -4.6312255859375, -4.49761962890625, -4.364013671875, -4.23040771484375, -4.0968017578125, -3.96319580078125, -3.82958984375, -3.69598388671875, -3.5623779296875, -3.42877197265625, -3.295166015625, -3.16156005859375, -3.0279541015625, -2.89434814453125, -2.7607421875, -2.62713623046875, -2.4935302734375, -2.35992431640625, -2.226318359375, -2.09271240234375, -1.9591064453125, -1.82550048828125, -1.69189453125, -1.55828857421875, -1.4246826171875, -1.29107666015625, -1.157470703125, -1.02386474609375, -0.8902587890625, -0.75665283203125, -0.623046875, -0.48944091796875, -0.3558349609375, -0.22222900390625, -0.088623046875, 0.04498291015625, 0.1785888671875, 0.31219482421875, 0.44580078125, 0.57940673828125, 0.7130126953125, 0.84661865234375, 0.980224609375, 1.11383056640625, 1.2474365234375, 1.38104248046875, 1.5146484375, 1.64825439453125, 1.7818603515625, 1.91546630859375, 2.049072265625, 2.18267822265625, 2.3162841796875, 2.44989013671875, 2.58349609375, 2.71710205078125, 2.8507080078125, 2.98431396484375, 3.117919921875, 3.25152587890625, 3.3851318359375, 3.51873779296875, 3.65234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 11.0, 10.0, 14.0, 24.0, 54.0, 88.0, 237.0, 796.0, 3262.0, 19248.0, 298202.0, 681017.0, 38633.0, 5137.0, 1263.0, 325.0, 121.0, 51.0, 25.0, 19.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.9510345458984375, -1.888397216796875, -1.8257598876953125, -1.76312255859375, -1.7004852294921875, -1.637847900390625, -1.5752105712890625, -1.5125732421875, -1.4499359130859375, -1.387298583984375, -1.3246612548828125, -1.26202392578125, -1.1993865966796875, -1.136749267578125, -1.0741119384765625, -1.011474609375, -0.9488372802734375, -0.886199951171875, -0.8235626220703125, -0.76092529296875, -0.6982879638671875, -0.635650634765625, -0.5730133056640625, -0.5103759765625, -0.4477386474609375, -0.385101318359375, -0.3224639892578125, -0.25982666015625, -0.1971893310546875, -0.134552001953125, -0.0719146728515625, -0.00927734375, 0.0533599853515625, 0.115997314453125, 0.1786346435546875, 0.24127197265625, 0.3039093017578125, 0.366546630859375, 0.4291839599609375, 0.4918212890625, 0.5544586181640625, 0.617095947265625, 0.6797332763671875, 0.74237060546875, 0.8050079345703125, 0.867645263671875, 0.9302825927734375, 0.992919921875, 1.0555572509765625, 1.118194580078125, 1.1808319091796875, 1.24346923828125, 1.3061065673828125, 1.368743896484375, 1.4313812255859375, 1.4940185546875, 1.5566558837890625, 1.619293212890625, 1.6819305419921875, 1.74456787109375, 1.8072052001953125, 1.869842529296875, 1.9324798583984375, 1.9951171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 9.0, 3.0, 4.0, 17.0, 14.0, 21.0, 50.0, 44.0, 67.0, 86.0, 121.0, 149.0, 98.0, 91.0, 54.0, 54.0, 35.0, 17.0, 18.0, 10.0, 8.0, 7.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002124309539794922, -0.00020492449402809143, -0.00019741803407669067, -0.00018991157412528992, -0.00018240511417388916, -0.0001748986542224884, -0.00016739219427108765, -0.0001598857343196869, -0.00015237927436828613, -0.00014487281441688538, -0.00013736635446548462, -0.00012985989451408386, -0.0001223534345626831, -0.00011484697461128235, -0.00010734051465988159, -9.983405470848083e-05, -9.232759475708008e-05, -8.482113480567932e-05, -7.731467485427856e-05, -6.980821490287781e-05, -6.230175495147705e-05, -5.4795295000076294e-05, -4.728883504867554e-05, -3.978237509727478e-05, -3.2275915145874023e-05, -2.4769455194473267e-05, -1.726299524307251e-05, -9.756535291671753e-06, -2.250075340270996e-06, 5.256384611129761e-06, 1.2762844562530518e-05, 2.0269304513931274e-05, 2.777576446533203e-05, 3.528222441673279e-05, 4.2788684368133545e-05, 5.02951443195343e-05, 5.780160427093506e-05, 6.530806422233582e-05, 7.281452417373657e-05, 8.032098412513733e-05, 8.782744407653809e-05, 9.533390402793884e-05, 0.0001028403639793396, 0.00011034682393074036, 0.00011785328388214111, 0.00012535974383354187, 0.00013286620378494263, 0.00014037266373634338, 0.00014787912368774414, 0.0001553855836391449, 0.00016289204359054565, 0.0001703985035419464, 0.00017790496349334717, 0.00018541142344474792, 0.00019291788339614868, 0.00020042434334754944, 0.0002079308032989502, 0.00021543726325035095, 0.0002229437232017517, 0.00023045018315315247, 0.00023795664310455322, 0.000245463103055954, 0.00025296956300735474, 0.0002604760229587555, 0.00026798248291015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 5.0, 15.0, 16.0, 23.0, 26.0, 50.0, 59.0, 99.0, 171.0, 373.0, 742.0, 1611.0, 3779.0, 10657.0, 38340.0, 188881.0, 596461.0, 157847.0, 33429.0, 9475.0, 3485.0, 1523.0, 680.0, 322.0, 171.0, 112.0, 59.0, 42.0, 31.0, 21.0, 12.0, 8.0, 7.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9521484375, -0.91473388671875, -0.8773193359375, -0.83990478515625, -0.802490234375, -0.76507568359375, -0.7276611328125, -0.69024658203125, -0.65283203125, -0.61541748046875, -0.5780029296875, -0.54058837890625, -0.503173828125, -0.46575927734375, -0.4283447265625, -0.39093017578125, -0.353515625, -0.31610107421875, -0.2786865234375, -0.24127197265625, -0.203857421875, -0.16644287109375, -0.1290283203125, -0.09161376953125, -0.05419921875, -0.01678466796875, 0.0206298828125, 0.05804443359375, 0.095458984375, 0.13287353515625, 0.1702880859375, 0.20770263671875, 0.2451171875, 0.28253173828125, 0.3199462890625, 0.35736083984375, 0.394775390625, 0.43218994140625, 0.4696044921875, 0.50701904296875, 0.54443359375, 0.58184814453125, 0.6192626953125, 0.65667724609375, 0.694091796875, 0.73150634765625, 0.7689208984375, 0.80633544921875, 0.84375, 0.88116455078125, 0.9185791015625, 0.95599365234375, 0.993408203125, 1.03082275390625, 1.0682373046875, 1.10565185546875, 1.14306640625, 1.18048095703125, 1.2178955078125, 1.25531005859375, 1.292724609375, 1.33013916015625, 1.3675537109375, 1.40496826171875, 1.4423828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 8.0, 15.0, 7.0, 18.0, 17.0, 20.0, 36.0, 39.0, 34.0, 51.0, 67.0, 86.0, 79.0, 104.0, 86.0, 71.0, 50.0, 43.0, 45.0, 22.0, 25.0, 24.0, 9.0, 6.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4755973815917969, -0.45925140380859375, -0.4429054260253906, -0.4265594482421875, -0.4102134704589844, -0.39386749267578125, -0.3775215148925781, -0.361175537109375, -0.3448295593261719, -0.32848358154296875, -0.3121376037597656, -0.2957916259765625, -0.2794456481933594, -0.26309967041015625, -0.24675369262695312, -0.23040771484375, -0.21406173706054688, -0.19771575927734375, -0.18136978149414062, -0.1650238037109375, -0.14867782592773438, -0.13233184814453125, -0.11598587036132812, -0.099639892578125, -0.08329391479492188, -0.06694793701171875, -0.050601959228515625, -0.0342559814453125, -0.017910003662109375, -0.00156402587890625, 0.014781951904296875, 0.0311279296875, 0.047473907470703125, 0.06381988525390625, 0.08016586303710938, 0.0965118408203125, 0.11285781860351562, 0.12920379638671875, 0.14554977416992188, 0.161895751953125, 0.17824172973632812, 0.19458770751953125, 0.21093368530273438, 0.2272796630859375, 0.24362564086914062, 0.25997161865234375, 0.2763175964355469, 0.29266357421875, 0.3090095520019531, 0.32535552978515625, 0.3417015075683594, 0.3580474853515625, 0.3743934631347656, 0.39073944091796875, 0.4070854187011719, 0.423431396484375, 0.4397773742675781, 0.45612335205078125, 0.4724693298339844, 0.4888153076171875, 0.5051612854003906, 0.5215072631835938, 0.5378532409667969, 0.55419921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 10.0, 34.0, 139.0, 350.0, 345.0, 107.0, 25.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12266731262207, -3.290733575820923, -2.4587998390197754, -1.626866102218628, -0.7949323654174805, 0.037001609802246094, 0.8689351081848145, 1.7008686065673828, 2.5328025817871094, 3.364736318588257, 4.196670055389404, 5.028603553771973, 5.860537528991699, 6.692471504211426, 7.524405002593994, 8.356338500976562, 9.188272476196289, 10.020206451416016, 10.852140426635742, 11.684073448181152, 12.516007423400879, 13.347941398620605, 14.179874420166016, 15.011808395385742, 15.843742370605469, 16.675676345825195, 17.507610321044922, 18.33954429626465, 19.171478271484375, 20.00341033935547, 20.835344314575195, 21.667278289794922, 22.499210357666016, 23.331144332885742, 24.16307830810547, 24.995012283325195, 25.826946258544922, 26.658878326416016, 27.490812301635742, 28.32274627685547, 29.154680252075195, 29.986614227294922, 30.81854820251465, 31.650482177734375, 32.48241424560547, 33.31435012817383, 34.14628219604492, 34.97821807861328, 35.810150146484375, 36.64208221435547, 37.47401809692383, 38.30595016479492, 39.13788604736328, 39.969818115234375, 40.801753997802734, 41.63368606567383, 42.46562194824219, 43.29755401611328, 44.12948989868164, 44.961421966552734, 45.793357849121094, 46.62528991699219, 47.45722579956055, 48.28915786743164, 49.121089935302734]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 9.0, 6.0, 5.0, 9.0, 5.0, 10.0, 8.0, 21.0, 20.0, 21.0, 27.0, 26.0, 33.0, 28.0, 26.0, 25.0, 28.0, 36.0, 25.0, 32.0, 40.0, 45.0, 45.0, 33.0, 33.0, 29.0, 36.0, 38.0, 38.0, 24.0, 31.0, 38.0, 21.0, 22.0, 21.0, 22.0, 11.0, 16.0, 10.0, 13.0, 9.0, 11.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.895088195800781, -6.673768997192383, -6.452449321746826, -6.231130123138428, -6.009810447692871, -5.788491249084473, -5.567172050476074, -5.345852851867676, -5.124533176422119, -4.903213977813721, -4.681894302368164, -4.460575103759766, -4.239255905151367, -4.0179362297058105, -3.796617031097412, -3.5752975940704346, -3.353978157043457, -3.1326587200164795, -2.911339282989502, -2.6900200843811035, -2.468700647354126, -2.2473812103271484, -2.02606201171875, -1.8047425746917725, -1.583423137664795, -1.3621037006378174, -1.1407843828201294, -0.9194650053977966, -0.6981456279754639, -0.47682619094848633, -0.25550687313079834, -0.03418755531311035, 0.1871318817138672, 0.40845125913619995, 0.6297706365585327, 0.8510900139808655, 1.0724093914031982, 1.2937288284301758, 1.5150481462478638, 1.7363674640655518, 1.9576869010925293, 2.179006338119507, 2.4003257751464844, 2.621644973754883, 2.8429644107818604, 3.064283847808838, 3.2856030464172363, 3.506922483444214, 3.7282419204711914, 3.949561357498169, 4.1708807945251465, 4.392199993133545, 4.613519668579102, 4.8348388671875, 5.056158065795898, 5.277477264404297, 5.4987969398498535, 5.720116138458252, 5.941435813903809, 6.162755012512207, 6.3840742111206055, 6.605393886566162, 6.8267130851745605, 7.048032760620117, 7.269351959228516]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 3.0, 4.0, 12.0, 10.0, 14.0, 18.0, 19.0, 32.0, 37.0, 42.0, 77.0, 113.0, 249.0, 529.0, 1460.0, 5537.0, 31550.0, 481842.0, 3501949.0, 149303.0, 16097.0, 3361.0, 1030.0, 427.0, 171.0, 118.0, 60.0, 50.0, 37.0, 27.0, 23.0, 18.0, 16.0, 13.0, 7.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-7.06640625, -6.88671875, -6.70703125, -6.52734375, -6.34765625, -6.16796875, -5.98828125, -5.80859375, -5.62890625, -5.44921875, -5.26953125, -5.08984375, -4.91015625, -4.73046875, -4.55078125, -4.37109375, -4.19140625, -4.01171875, -3.83203125, -3.65234375, -3.47265625, -3.29296875, -3.11328125, -2.93359375, -2.75390625, -2.57421875, -2.39453125, -2.21484375, -2.03515625, -1.85546875, -1.67578125, -1.49609375, -1.31640625, -1.13671875, -0.95703125, -0.77734375, -0.59765625, -0.41796875, -0.23828125, -0.05859375, 0.12109375, 0.30078125, 0.48046875, 0.66015625, 0.83984375, 1.01953125, 1.19921875, 1.37890625, 1.55859375, 1.73828125, 1.91796875, 2.09765625, 2.27734375, 2.45703125, 2.63671875, 2.81640625, 2.99609375, 3.17578125, 3.35546875, 3.53515625, 3.71484375, 3.89453125, 4.07421875, 4.25390625, 4.43359375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 8.0, 7.0, 6.0, 5.0, 11.0, 13.0, 18.0, 13.0, 15.0, 18.0, 39.0, 37.0, 37.0, 30.0, 49.0, 45.0, 36.0, 41.0, 38.0, 50.0, 52.0, 57.0, 42.0, 37.0, 40.0, 31.0, 33.0, 27.0, 28.0, 23.0, 17.0, 19.0, 15.0, 18.0, 7.0, 6.0, 5.0, 11.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.501953125, -1.457000732421875, -1.41204833984375, -1.367095947265625, -1.3221435546875, -1.277191162109375, -1.23223876953125, -1.187286376953125, -1.142333984375, -1.097381591796875, -1.05242919921875, -1.007476806640625, -0.9625244140625, -0.917572021484375, -0.87261962890625, -0.827667236328125, -0.78271484375, -0.737762451171875, -0.69281005859375, -0.647857666015625, -0.6029052734375, -0.557952880859375, -0.51300048828125, -0.468048095703125, -0.423095703125, -0.378143310546875, -0.33319091796875, -0.288238525390625, -0.2432861328125, -0.198333740234375, -0.15338134765625, -0.108428955078125, -0.0634765625, -0.018524169921875, 0.02642822265625, 0.071380615234375, 0.1163330078125, 0.161285400390625, 0.20623779296875, 0.251190185546875, 0.296142578125, 0.341094970703125, 0.38604736328125, 0.430999755859375, 0.4759521484375, 0.520904541015625, 0.56585693359375, 0.610809326171875, 0.65576171875, 0.700714111328125, 0.74566650390625, 0.790618896484375, 0.8355712890625, 0.880523681640625, 0.92547607421875, 0.970428466796875, 1.015380859375, 1.060333251953125, 1.10528564453125, 1.150238037109375, 1.1951904296875, 1.240142822265625, 1.28509521484375, 1.330047607421875, 1.375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 7.0, 11.0, 8.0, 13.0, 20.0, 16.0, 36.0, 46.0, 60.0, 105.0, 148.0, 273.0, 661.0, 2364.0, 11201.0, 87820.0, 1748714.0, 2222833.0, 103102.0, 12791.0, 2518.0, 717.0, 329.0, 175.0, 89.0, 66.0, 40.0, 32.0, 16.0, 18.0, 11.0, 7.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.35235595703125, -4.1851806640625, -4.01800537109375, -3.850830078125, -3.68365478515625, -3.5164794921875, -3.34930419921875, -3.18212890625, -3.01495361328125, -2.8477783203125, -2.68060302734375, -2.513427734375, -2.34625244140625, -2.1790771484375, -2.01190185546875, -1.8447265625, -1.67755126953125, -1.5103759765625, -1.34320068359375, -1.176025390625, -1.00885009765625, -0.8416748046875, -0.67449951171875, -0.50732421875, -0.34014892578125, -0.1729736328125, -0.00579833984375, 0.161376953125, 0.32855224609375, 0.4957275390625, 0.66290283203125, 0.830078125, 0.99725341796875, 1.1644287109375, 1.33160400390625, 1.498779296875, 1.66595458984375, 1.8331298828125, 2.00030517578125, 2.16748046875, 2.33465576171875, 2.5018310546875, 2.66900634765625, 2.836181640625, 3.00335693359375, 3.1705322265625, 3.33770751953125, 3.5048828125, 3.67205810546875, 3.8392333984375, 4.00640869140625, 4.173583984375, 4.34075927734375, 4.5079345703125, 4.67510986328125, 4.84228515625, 5.00946044921875, 5.1766357421875, 5.34381103515625, 5.510986328125, 5.67816162109375, 5.8453369140625, 6.01251220703125, 6.1796875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 11.0, 16.0, 24.0, 34.0, 47.0, 55.0, 72.0, 122.0, 139.0, 189.0, 244.0, 346.0, 470.0, 551.0, 442.0, 326.0, 270.0, 163.0, 132.0, 95.0, 74.0, 48.0, 38.0, 28.0, 23.0, 16.0, 12.0, 15.0, 7.0, 6.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.1943359375, -1.1624298095703125, -1.130523681640625, -1.0986175537109375, -1.06671142578125, -1.0348052978515625, -1.002899169921875, -0.9709930419921875, -0.9390869140625, -0.9071807861328125, -0.875274658203125, -0.8433685302734375, -0.81146240234375, -0.7795562744140625, -0.747650146484375, -0.7157440185546875, -0.683837890625, -0.6519317626953125, -0.620025634765625, -0.5881195068359375, -0.55621337890625, -0.5243072509765625, -0.492401123046875, -0.4604949951171875, -0.4285888671875, -0.3966827392578125, -0.364776611328125, -0.3328704833984375, -0.30096435546875, -0.2690582275390625, -0.237152099609375, -0.2052459716796875, -0.17333984375, -0.1414337158203125, -0.109527587890625, -0.0776214599609375, -0.04571533203125, -0.0138092041015625, 0.018096923828125, 0.0500030517578125, 0.0819091796875, 0.1138153076171875, 0.145721435546875, 0.1776275634765625, 0.20953369140625, 0.2414398193359375, 0.273345947265625, 0.3052520751953125, 0.337158203125, 0.3690643310546875, 0.400970458984375, 0.4328765869140625, 0.46478271484375, 0.4966888427734375, 0.528594970703125, 0.5605010986328125, 0.5924072265625, 0.6243133544921875, 0.656219482421875, 0.6881256103515625, 0.72003173828125, 0.7519378662109375, 0.783843994140625, 0.8157501220703125, 0.84765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 5.0, 5.0, 5.0, 8.0, 11.0, 14.0, 17.0, 13.0, 18.0, 19.0, 28.0, 38.0, 27.0, 34.0, 27.0, 42.0, 31.0, 46.0, 42.0, 37.0, 42.0, 40.0, 46.0, 50.0, 43.0, 42.0, 37.0, 36.0, 32.0, 21.0, 21.0, 13.0, 21.0, 9.0, 13.0, 13.0, 5.0, 8.0, 4.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.2177224159240723, -2.1481213569641113, -2.0785205364227295, -2.0089194774627686, -1.9393186569213867, -1.8697177171707153, -1.800116777420044, -1.730515718460083, -1.6609148979187012, -1.5913139581680298, -1.5217130184173584, -1.452112078666687, -1.3825111389160156, -1.3129101991653442, -1.2433092594146729, -1.173708200454712, -1.1041072607040405, -1.0345063209533691, -0.9649053812026978, -0.8953044414520264, -0.825703501701355, -0.7561025619506836, -0.6865015625953674, -0.616900622844696, -0.5472996830940247, -0.47769874334335327, -0.4080978035926819, -0.3384968340396881, -0.2688958942890167, -0.19929495453834534, -0.12969398498535156, -0.060093045234680176, 0.009507894515991211, 0.0791088417172432, 0.14870978891849518, 0.21831074357032776, 0.28791168332099915, 0.35751262307167053, 0.4271135926246643, 0.4967145323753357, 0.5663154721260071, 0.6359164118766785, 0.7055173516273499, 0.775118350982666, 0.8447192907333374, 0.9143202304840088, 0.9839211702346802, 1.0535221099853516, 1.123123049736023, 1.1927239894866943, 1.2623249292373657, 1.331925868988037, 1.4015268087387085, 1.4711277484893799, 1.5407288074493408, 1.6103296279907227, 1.6799306869506836, 1.749531626701355, 1.8191325664520264, 1.8887335062026978, 1.9583344459533691, 2.02793550491333, 2.097536325454712, 2.167137384414673, 2.2367382049560547]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 1.0, 0.0, 6.0, 8.0, 9.0, 20.0, 17.0, 19.0, 25.0, 28.0, 26.0, 38.0, 37.0, 42.0, 27.0, 27.0, 38.0, 27.0, 51.0, 41.0, 31.0, 42.0, 40.0, 39.0, 42.0, 30.0, 28.0, 35.0, 51.0, 29.0, 18.0, 18.0, 20.0, 21.0, 11.0, 14.0, 6.0, 11.0, 5.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.814331531524658, -2.73667573928833, -2.659019947052002, -2.581364393234253, -2.503708600997925, -2.4260528087615967, -2.3483972549438477, -2.2707414627075195, -2.1930856704711914, -2.1154298782348633, -2.037774085998535, -1.9601185321807861, -1.882462739944458, -1.8048069477081299, -1.7271512746810913, -1.6494956016540527, -1.5718398094177246, -1.4941840171813965, -1.416528344154358, -1.3388726711273193, -1.2612168788909912, -1.183561086654663, -1.1059054136276245, -1.028249740600586, -0.9505939483642578, -0.8729382157325745, -0.7952824831008911, -0.7176267504692078, -0.6399710178375244, -0.5623152852058411, -0.4846595525741577, -0.40700381994247437, -0.3293483257293701, -0.25169259309768677, -0.17403686046600342, -0.09638112783432007, -0.01872539520263672, 0.05893033742904663, 0.13658607006072998, 0.21424180269241333, 0.2918975353240967, 0.36955326795578003, 0.4472090005874634, 0.5248647332191467, 0.6025204658508301, 0.6801761984825134, 0.7578319311141968, 0.8354876637458801, 0.9131433963775635, 0.9907991290092468, 1.0684548616409302, 1.1461105346679688, 1.2237663269042969, 1.301422119140625, 1.3790777921676636, 1.4567334651947021, 1.5343892574310303, 1.6120450496673584, 1.689700722694397, 1.7673563957214355, 1.8450121879577637, 1.9226679801940918, 2.00032377243042, 2.077979326248169, 2.155635118484497]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 5.0, 8.0, 12.0, 10.0, 25.0, 30.0, 39.0, 48.0, 63.0, 92.0, 113.0, 159.0, 254.0, 388.0, 695.0, 1503.0, 10324.0, 612096.0, 411642.0, 7783.0, 1380.0, 656.0, 349.0, 262.0, 172.0, 105.0, 82.0, 65.0, 46.0, 28.0, 28.0, 18.0, 17.0, 17.0, 11.0, 5.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94580078125, -0.9142227172851562, -0.8826446533203125, -0.8510665893554688, -0.819488525390625, -0.7879104614257812, -0.7563323974609375, -0.7247543334960938, -0.69317626953125, -0.6615982055664062, -0.6300201416015625, -0.5984420776367188, -0.566864013671875, -0.5352859497070312, -0.5037078857421875, -0.47212982177734375, -0.4405517578125, -0.40897369384765625, -0.3773956298828125, -0.34581756591796875, -0.314239501953125, -0.28266143798828125, -0.2510833740234375, -0.21950531005859375, -0.18792724609375, -0.15634918212890625, -0.1247711181640625, -0.09319305419921875, -0.061614990234375, -0.03003692626953125, 0.0015411376953125, 0.03311920166015625, 0.064697265625, 0.09627532958984375, 0.1278533935546875, 0.15943145751953125, 0.191009521484375, 0.22258758544921875, 0.2541656494140625, 0.28574371337890625, 0.31732177734375, 0.34889984130859375, 0.3804779052734375, 0.41205596923828125, 0.443634033203125, 0.47521209716796875, 0.5067901611328125, 0.5383682250976562, 0.5699462890625, 0.6015243530273438, 0.6331024169921875, 0.6646804809570312, 0.696258544921875, 0.7278366088867188, 0.7594146728515625, 0.7909927368164062, 0.82257080078125, 0.8541488647460938, 0.8857269287109375, 0.9173049926757812, 0.948883056640625, 0.9804611206054688, 1.0120391845703125, 1.0436172485351562, 1.0751953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 5.0, 8.0, 11.0, 14.0, 14.0, 15.0, 21.0, 28.0, 25.0, 26.0, 32.0, 44.0, 39.0, 37.0, 44.0, 44.0, 36.0, 42.0, 36.0, 39.0, 46.0, 44.0, 36.0, 40.0, 34.0, 30.0, 33.0, 32.0, 23.0, 23.0, 21.0, 21.0, 14.0, 8.0, 11.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.02734375, -1.9683074951171875, -1.909271240234375, -1.8502349853515625, -1.79119873046875, -1.7321624755859375, -1.673126220703125, -1.6140899658203125, -1.5550537109375, -1.4960174560546875, -1.436981201171875, -1.3779449462890625, -1.31890869140625, -1.2598724365234375, -1.200836181640625, -1.1417999267578125, -1.082763671875, -1.0237274169921875, -0.964691162109375, -0.9056549072265625, -0.84661865234375, -0.7875823974609375, -0.728546142578125, -0.6695098876953125, -0.6104736328125, -0.5514373779296875, -0.492401123046875, -0.4333648681640625, -0.37432861328125, -0.3152923583984375, -0.256256103515625, -0.1972198486328125, -0.13818359375, -0.0791473388671875, -0.020111083984375, 0.0389251708984375, 0.09796142578125, 0.1569976806640625, 0.216033935546875, 0.2750701904296875, 0.3341064453125, 0.3931427001953125, 0.452178955078125, 0.5112152099609375, 0.57025146484375, 0.6292877197265625, 0.688323974609375, 0.7473602294921875, 0.806396484375, 0.8654327392578125, 0.924468994140625, 0.9835052490234375, 1.04254150390625, 1.1015777587890625, 1.160614013671875, 1.2196502685546875, 1.2786865234375, 1.3377227783203125, 1.396759033203125, 1.4557952880859375, 1.51483154296875, 1.5738677978515625, 1.632904052734375, 1.6919403076171875, 1.7509765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 5.0, 1.0, 6.0, 4.0, 7.0, 8.0, 10.0, 15.0, 9.0, 17.0, 20.0, 22.0, 41.0, 36.0, 57.0, 85.0, 104.0, 144.0, 199.0, 324.0, 599.0, 1770.0, 10051.0, 106609.0, 756260.0, 155296.0, 12789.0, 2191.0, 726.0, 351.0, 217.0, 146.0, 110.0, 78.0, 59.0, 42.0, 41.0, 25.0, 25.0, 17.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.417236328125, -0.40358734130859375, -0.3899383544921875, -0.37628936767578125, -0.362640380859375, -0.34899139404296875, -0.3353424072265625, -0.32169342041015625, -0.30804443359375, -0.29439544677734375, -0.2807464599609375, -0.26709747314453125, -0.253448486328125, -0.23979949951171875, -0.2261505126953125, -0.21250152587890625, -0.1988525390625, -0.18520355224609375, -0.1715545654296875, -0.15790557861328125, -0.144256591796875, -0.13060760498046875, -0.1169586181640625, -0.10330963134765625, -0.08966064453125, -0.07601165771484375, -0.0623626708984375, -0.04871368408203125, -0.035064697265625, -0.02141571044921875, -0.0077667236328125, 0.00588226318359375, 0.01953125, 0.03318023681640625, 0.0468292236328125, 0.06047821044921875, 0.074127197265625, 0.08777618408203125, 0.1014251708984375, 0.11507415771484375, 0.12872314453125, 0.14237213134765625, 0.1560211181640625, 0.16967010498046875, 0.183319091796875, 0.19696807861328125, 0.2106170654296875, 0.22426605224609375, 0.2379150390625, 0.25156402587890625, 0.2652130126953125, 0.27886199951171875, 0.292510986328125, 0.30615997314453125, 0.3198089599609375, 0.33345794677734375, 0.34710693359375, 0.36075592041015625, 0.3744049072265625, 0.38805389404296875, 0.401702880859375, 0.41535186767578125, 0.4290008544921875, 0.44264984130859375, 0.456298828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 7.0, 8.0, 16.0, 16.0, 17.0, 26.0, 19.0, 30.0, 27.0, 35.0, 37.0, 48.0, 47.0, 42.0, 60.0, 46.0, 50.0, 67.0, 45.0, 52.0, 52.0, 34.0, 43.0, 25.0, 28.0, 27.0, 20.0, 13.0, 14.0, 9.0, 5.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.6053466796875, -4.441162109375, -4.2769775390625, -4.11279296875, -3.9486083984375, -3.784423828125, -3.6202392578125, -3.4560546875, -3.2918701171875, -3.127685546875, -2.9635009765625, -2.79931640625, -2.6351318359375, -2.470947265625, -2.3067626953125, -2.142578125, -1.9783935546875, -1.814208984375, -1.6500244140625, -1.48583984375, -1.3216552734375, -1.157470703125, -0.9932861328125, -0.8291015625, -0.6649169921875, -0.500732421875, -0.3365478515625, -0.17236328125, -0.0081787109375, 0.156005859375, 0.3201904296875, 0.484375, 0.6485595703125, 0.812744140625, 0.9769287109375, 1.14111328125, 1.3052978515625, 1.469482421875, 1.6336669921875, 1.7978515625, 1.9620361328125, 2.126220703125, 2.2904052734375, 2.45458984375, 2.6187744140625, 2.782958984375, 2.9471435546875, 3.111328125, 3.2755126953125, 3.439697265625, 3.6038818359375, 3.76806640625, 3.9322509765625, 4.096435546875, 4.2606201171875, 4.4248046875, 4.5889892578125, 4.753173828125, 4.9173583984375, 5.08154296875, 5.2457275390625, 5.409912109375, 5.5740966796875, 5.73828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 3.0, 8.0, 9.0, 10.0, 17.0, 22.0, 29.0, 27.0, 49.0, 72.0, 109.0, 175.0, 341.0, 772.0, 2832.0, 41238.0, 979586.0, 19584.0, 2113.0, 740.0, 313.0, 147.0, 103.0, 58.0, 51.0, 28.0, 34.0, 16.0, 18.0, 11.0, 11.0, 4.0, 5.0, 2.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.14269065856933594, -0.13828659057617188, -0.1338825225830078, -0.12947845458984375, -0.1250743865966797, -0.12067031860351562, -0.11626625061035156, -0.1118621826171875, -0.10745811462402344, -0.10305404663085938, -0.09864997863769531, -0.09424591064453125, -0.08984184265136719, -0.08543777465820312, -0.08103370666503906, -0.076629638671875, -0.07222557067871094, -0.06782150268554688, -0.06341743469238281, -0.05901336669921875, -0.05460929870605469, -0.050205230712890625, -0.04580116271972656, -0.0413970947265625, -0.03699302673339844, -0.032588958740234375, -0.028184890747070312, -0.02378082275390625, -0.019376754760742188, -0.014972686767578125, -0.010568618774414062, -0.00616455078125, -0.0017604827880859375, 0.002643585205078125, 0.0070476531982421875, 0.01145172119140625, 0.015855789184570312, 0.020259857177734375, 0.024663925170898438, 0.0290679931640625, 0.03347206115722656, 0.037876129150390625, 0.04228019714355469, 0.04668426513671875, 0.05108833312988281, 0.055492401123046875, 0.05989646911621094, 0.064300537109375, 0.06870460510253906, 0.07310867309570312, 0.07751274108886719, 0.08191680908203125, 0.08632087707519531, 0.09072494506835938, 0.09512901306152344, 0.0995330810546875, 0.10393714904785156, 0.10834121704101562, 0.11274528503417969, 0.11714935302734375, 0.12155342102050781, 0.12595748901367188, 0.13036155700683594, 0.134765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 20.0, 27.0, 32.0, 63.0, 61.0, 89.0, 119.0, 111.0, 107.0, 95.0, 72.0, 48.0, 38.0, 26.0, 14.0, 15.0, 9.0, 6.0, 7.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.458427429199219e-05, -4.312768578529358e-05, -4.167109727859497e-05, -4.021450877189636e-05, -3.8757920265197754e-05, -3.7301331758499146e-05, -3.584474325180054e-05, -3.438815474510193e-05, -3.293156623840332e-05, -3.147497773170471e-05, -3.0018389225006104e-05, -2.8561800718307495e-05, -2.7105212211608887e-05, -2.564862370491028e-05, -2.419203519821167e-05, -2.273544669151306e-05, -2.1278858184814453e-05, -1.9822269678115845e-05, -1.8365681171417236e-05, -1.6909092664718628e-05, -1.545250415802002e-05, -1.3995915651321411e-05, -1.2539327144622803e-05, -1.1082738637924194e-05, -9.626150131225586e-06, -8.169561624526978e-06, -6.712973117828369e-06, -5.256384611129761e-06, -3.7997961044311523e-06, -2.343207597732544e-06, -8.866190910339355e-07, 5.699694156646729e-07, 2.0265579223632812e-06, 3.4831464290618896e-06, 4.939734935760498e-06, 6.3963234424591064e-06, 7.852911949157715e-06, 9.309500455856323e-06, 1.0766088962554932e-05, 1.222267746925354e-05, 1.3679265975952148e-05, 1.5135854482650757e-05, 1.6592442989349365e-05, 1.8049031496047974e-05, 1.9505620002746582e-05, 2.096220850944519e-05, 2.24187970161438e-05, 2.3875385522842407e-05, 2.5331974029541016e-05, 2.6788562536239624e-05, 2.8245151042938232e-05, 2.970173954963684e-05, 3.115832805633545e-05, 3.261491656303406e-05, 3.4071505069732666e-05, 3.5528093576431274e-05, 3.698468208312988e-05, 3.844127058982849e-05, 3.98978590965271e-05, 4.135444760322571e-05, 4.2811036109924316e-05, 4.4267624616622925e-05, 4.572421312332153e-05, 4.718080163002014e-05, 4.863739013671875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 15.0, 20.0, 27.0, 31.0, 44.0, 42.0, 68.0, 86.0, 126.0, 151.0, 209.0, 302.0, 390.0, 593.0, 852.0, 1523.0, 2442.0, 4342.0, 8595.0, 20762.0, 69702.0, 583233.0, 278408.0, 44790.0, 15116.0, 6961.0, 3673.0, 2106.0, 1284.0, 816.0, 522.0, 354.0, 251.0, 174.0, 116.0, 103.0, 67.0, 65.0, 47.0, 17.0, 25.0, 24.0, 22.0, 11.0, 8.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.07769775390625, -0.07540225982666016, -0.07310676574707031, -0.07081127166748047, -0.06851577758789062, -0.06622028350830078, -0.06392478942871094, -0.061629295349121094, -0.05933380126953125, -0.057038307189941406, -0.05474281311035156, -0.05244731903076172, -0.050151824951171875, -0.04785633087158203, -0.04556083679199219, -0.043265342712402344, -0.0409698486328125, -0.038674354553222656, -0.03637886047363281, -0.03408336639404297, -0.031787872314453125, -0.02949237823486328, -0.027196884155273438, -0.024901390075683594, -0.02260589599609375, -0.020310401916503906, -0.018014907836914062, -0.01571941375732422, -0.013423919677734375, -0.011128425598144531, -0.008832931518554688, -0.006537437438964844, -0.004241943359375, -0.0019464492797851562, 0.0003490447998046875, 0.0026445388793945312, 0.004940032958984375, 0.007235527038574219, 0.009531021118164062, 0.011826515197753906, 0.01412200927734375, 0.016417503356933594, 0.018712997436523438, 0.02100849151611328, 0.023303985595703125, 0.02559947967529297, 0.027894973754882812, 0.030190467834472656, 0.0324859619140625, 0.034781455993652344, 0.03707695007324219, 0.03937244415283203, 0.041667938232421875, 0.04396343231201172, 0.04625892639160156, 0.048554420471191406, 0.05084991455078125, 0.053145408630371094, 0.05544090270996094, 0.05773639678955078, 0.060031890869140625, 0.06232738494873047, 0.06462287902832031, 0.06691837310791016, 0.0692138671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 10.0, 12.0, 19.0, 11.0, 24.0, 53.0, 75.0, 154.0, 271.0, 137.0, 79.0, 44.0, 32.0, 10.0, 9.0, 11.0, 3.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026171207427978516, -0.02536487579345703, -0.024558544158935547, -0.023752212524414062, -0.022945880889892578, -0.022139549255371094, -0.02133321762084961, -0.020526885986328125, -0.01972055435180664, -0.018914222717285156, -0.018107891082763672, -0.017301559448242188, -0.016495227813720703, -0.01568889617919922, -0.014882564544677734, -0.01407623291015625, -0.013269901275634766, -0.012463569641113281, -0.011657238006591797, -0.010850906372070312, -0.010044574737548828, -0.009238243103027344, -0.00843191146850586, -0.007625579833984375, -0.006819248199462891, -0.006012916564941406, -0.005206584930419922, -0.0044002532958984375, -0.003593921661376953, -0.0027875900268554688, -0.0019812583923339844, -0.0011749267578125, -0.0003685951232910156, 0.00043773651123046875, 0.0012440681457519531, 0.0020503997802734375, 0.002856731414794922, 0.0036630630493164062, 0.004469394683837891, 0.005275726318359375, 0.006082057952880859, 0.006888389587402344, 0.007694721221923828, 0.008501052856445312, 0.009307384490966797, 0.010113716125488281, 0.010920047760009766, 0.01172637939453125, 0.012532711029052734, 0.013339042663574219, 0.014145374298095703, 0.014951705932617188, 0.015758037567138672, 0.016564369201660156, 0.01737070083618164, 0.018177032470703125, 0.01898336410522461, 0.019789695739746094, 0.020596027374267578, 0.021402359008789062, 0.022208690643310547, 0.02301502227783203, 0.023821353912353516, 0.024627685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 7.0, 5.0, 13.0, 19.0, 14.0, 22.0, 24.0, 23.0, 24.0, 41.0, 32.0, 38.0, 44.0, 38.0, 31.0, 47.0, 52.0, 41.0, 42.0, 39.0, 56.0, 48.0, 43.0, 42.0, 28.0, 31.0, 24.0, 27.0, 11.0, 8.0, 9.0, 6.0, 12.0, 8.0, 6.0, 4.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4931228160858154, -1.4449156522750854, -1.3967084884643555, -1.348501443862915, -1.300294280052185, -1.252087116241455, -1.2038800716400146, -1.1556729078292847, -1.1074657440185547, -1.0592585802078247, -1.0110514163970947, -0.9628443717956543, -0.9146372079849243, -0.8664300441741943, -0.8182229399681091, -0.7700158357620239, -0.721808671951294, -0.673601508140564, -0.6253944039344788, -0.5771872997283936, -0.5289801359176636, -0.480773001909256, -0.4325658679008484, -0.3843587338924408, -0.3361515998840332, -0.2879444658756256, -0.23973733186721802, -0.19153019785881042, -0.14332306385040283, -0.09511592984199524, -0.046908795833587646, 0.0012983381748199463, 0.04950559139251709, 0.09771272540092468, 0.14591985940933228, 0.19412699341773987, 0.24233412742614746, 0.29054126143455505, 0.33874839544296265, 0.38695552945137024, 0.43516266345977783, 0.4833697974681854, 0.531576931476593, 0.5797840356826782, 0.6279911994934082, 0.6761983633041382, 0.7244054675102234, 0.7726125717163086, 0.8208197355270386, 0.8690268993377686, 0.9172340035438538, 0.965441107749939, 1.013648271560669, 1.061855435371399, 1.110062599182129, 1.1582696437835693, 1.2064768075942993, 1.2546839714050293, 1.3028910160064697, 1.3510981798171997, 1.3993053436279297, 1.4475125074386597, 1.4957196712493896, 1.54392671585083, 1.59213387966156]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 20.0, 17.0, 15.0, 28.0, 23.0, 27.0, 47.0, 41.0, 48.0, 24.0, 43.0, 33.0, 37.0, 49.0, 42.0, 47.0, 35.0, 45.0, 42.0, 35.0, 40.0, 38.0, 41.0, 25.0, 19.0, 17.0, 21.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.1137325763702393, -2.0571537017822266, -2.000574827194214, -1.9439959526062012, -1.887417197227478, -1.8308383226394653, -1.7742594480514526, -1.71768057346344, -1.6611018180847168, -1.604522943496704, -1.5479440689086914, -1.4913651943206787, -1.4347864389419556, -1.3782075643539429, -1.3216286897659302, -1.2650498151779175, -1.2084709405899048, -1.151892066001892, -1.0953131914138794, -1.0387344360351562, -0.9821555614471436, -0.9255766868591309, -0.8689978122711182, -0.8124189376831055, -0.7558401226997375, -0.6992612481117249, -0.6426824331283569, -0.5861035585403442, -0.5295246839523315, -0.4729458689689636, -0.4163669943809509, -0.3597881495952606, -0.3032093048095703, -0.24663046002388, -0.1900516003370285, -0.133472740650177, -0.0768938958644867, -0.020315051078796387, 0.03626382350921631, 0.09284266829490662, 0.14942151308059692, 0.20600035786628723, 0.26257920265197754, 0.31915807723999023, 0.37573692202568054, 0.43231576681137085, 0.48889464139938354, 0.5454734563827515, 0.6020523309707642, 0.6586312055587769, 0.7152100205421448, 0.7717888951301575, 0.8283677101135254, 0.8849465847015381, 0.9415254592895508, 0.9981043338775635, 1.0546832084655762, 1.1112620830535889, 1.1678409576416016, 1.2244198322296143, 1.2809985876083374, 1.33757746219635, 1.3941563367843628, 1.4507352113723755, 1.5073139667510986]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 11.0, 11.0, 11.0, 21.0, 36.0, 74.0, 87.0, 151.0, 260.0, 424.0, 903.0, 1820.0, 3947.0, 9477.0, 25303.0, 75614.0, 238026.0, 431038.0, 173132.0, 55413.0, 19025.0, 7268.0, 3260.0, 1529.0, 754.0, 382.0, 223.0, 137.0, 92.0, 44.0, 36.0, 10.0, 12.0, 14.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.586090087890625, -3.48468017578125, -3.383270263671875, -3.2818603515625, -3.180450439453125, -3.07904052734375, -2.977630615234375, -2.876220703125, -2.774810791015625, -2.67340087890625, -2.571990966796875, -2.4705810546875, -2.369171142578125, -2.26776123046875, -2.166351318359375, -2.06494140625, -1.963531494140625, -1.86212158203125, -1.760711669921875, -1.6593017578125, -1.557891845703125, -1.45648193359375, -1.355072021484375, -1.253662109375, -1.152252197265625, -1.05084228515625, -0.949432373046875, -0.8480224609375, -0.746612548828125, -0.64520263671875, -0.543792724609375, -0.4423828125, -0.340972900390625, -0.23956298828125, -0.138153076171875, -0.0367431640625, 0.064666748046875, 0.16607666015625, 0.267486572265625, 0.368896484375, 0.470306396484375, 0.57171630859375, 0.673126220703125, 0.7745361328125, 0.875946044921875, 0.97735595703125, 1.078765869140625, 1.18017578125, 1.281585693359375, 1.38299560546875, 1.484405517578125, 1.5858154296875, 1.687225341796875, 1.78863525390625, 1.890045166015625, 1.991455078125, 2.092864990234375, 2.19427490234375, 2.295684814453125, 2.3970947265625, 2.498504638671875, 2.59991455078125, 2.701324462890625, 2.802734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 4.0, 12.0, 12.0, 16.0, 16.0, 23.0, 24.0, 23.0, 39.0, 28.0, 37.0, 38.0, 49.0, 39.0, 49.0, 38.0, 33.0, 49.0, 41.0, 48.0, 42.0, 42.0, 34.0, 36.0, 31.0, 29.0, 34.0, 25.0, 17.0, 11.0, 11.0, 15.0, 11.0, 13.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.064453125, -2.971832275390625, -2.87921142578125, -2.786590576171875, -2.6939697265625, -2.601348876953125, -2.50872802734375, -2.416107177734375, -2.323486328125, -2.230865478515625, -2.13824462890625, -2.045623779296875, -1.9530029296875, -1.860382080078125, -1.76776123046875, -1.675140380859375, -1.58251953125, -1.489898681640625, -1.39727783203125, -1.304656982421875, -1.2120361328125, -1.119415283203125, -1.02679443359375, -0.934173583984375, -0.841552734375, -0.748931884765625, -0.65631103515625, -0.563690185546875, -0.4710693359375, -0.378448486328125, -0.28582763671875, -0.193206787109375, -0.1005859375, -0.007965087890625, 0.08465576171875, 0.177276611328125, 0.2698974609375, 0.362518310546875, 0.45513916015625, 0.547760009765625, 0.640380859375, 0.733001708984375, 0.82562255859375, 0.918243408203125, 1.0108642578125, 1.103485107421875, 1.19610595703125, 1.288726806640625, 1.38134765625, 1.473968505859375, 1.56658935546875, 1.659210205078125, 1.7518310546875, 1.844451904296875, 1.93707275390625, 2.029693603515625, 2.122314453125, 2.214935302734375, 2.30755615234375, 2.400177001953125, 2.4927978515625, 2.585418701171875, 2.67803955078125, 2.770660400390625, 2.86328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 3.0, 10.0, 21.0, 22.0, 23.0, 36.0, 42.0, 90.0, 113.0, 181.0, 279.0, 440.0, 769.0, 1249.0, 2252.0, 4063.0, 7739.0, 15297.0, 31272.0, 65920.0, 137460.0, 276749.0, 259481.0, 125250.0, 59939.0, 29237.0, 14348.0, 7230.0, 3926.0, 2081.0, 1200.0, 670.0, 403.0, 240.0, 169.0, 110.0, 58.0, 62.0, 36.0, 22.0, 18.0, 16.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9814453125, -1.9174041748046875, -1.853363037109375, -1.7893218994140625, -1.72528076171875, -1.6612396240234375, -1.597198486328125, -1.5331573486328125, -1.4691162109375, -1.4050750732421875, -1.341033935546875, -1.2769927978515625, -1.21295166015625, -1.1489105224609375, -1.084869384765625, -1.0208282470703125, -0.956787109375, -0.8927459716796875, -0.828704833984375, -0.7646636962890625, -0.70062255859375, -0.6365814208984375, -0.572540283203125, -0.5084991455078125, -0.4444580078125, -0.3804168701171875, -0.316375732421875, -0.2523345947265625, -0.18829345703125, -0.1242523193359375, -0.060211181640625, 0.0038299560546875, 0.06787109375, 0.1319122314453125, 0.195953369140625, 0.2599945068359375, 0.32403564453125, 0.3880767822265625, 0.452117919921875, 0.5161590576171875, 0.5802001953125, 0.6442413330078125, 0.708282470703125, 0.7723236083984375, 0.83636474609375, 0.9004058837890625, 0.964447021484375, 1.0284881591796875, 1.092529296875, 1.1565704345703125, 1.220611572265625, 1.2846527099609375, 1.34869384765625, 1.4127349853515625, 1.476776123046875, 1.5408172607421875, 1.6048583984375, 1.6688995361328125, 1.732940673828125, 1.7969818115234375, 1.86102294921875, 1.9250640869140625, 1.989105224609375, 2.0531463623046875, 2.1171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 7.0, 10.0, 11.0, 9.0, 12.0, 19.0, 22.0, 20.0, 20.0, 25.0, 36.0, 29.0, 27.0, 28.0, 32.0, 47.0, 49.0, 43.0, 51.0, 43.0, 42.0, 38.0, 37.0, 33.0, 45.0, 28.0, 33.0, 30.0, 19.0, 20.0, 14.0, 20.0, 14.0, 10.0, 11.0, 6.0, 10.0, 7.0, 4.0, 10.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-3.890625, -3.774749755859375, -3.65887451171875, -3.542999267578125, -3.4271240234375, -3.311248779296875, -3.19537353515625, -3.079498291015625, -2.963623046875, -2.847747802734375, -2.73187255859375, -2.615997314453125, -2.5001220703125, -2.384246826171875, -2.26837158203125, -2.152496337890625, -2.03662109375, -1.920745849609375, -1.80487060546875, -1.688995361328125, -1.5731201171875, -1.457244873046875, -1.34136962890625, -1.225494384765625, -1.109619140625, -0.993743896484375, -0.87786865234375, -0.761993408203125, -0.6461181640625, -0.530242919921875, -0.41436767578125, -0.298492431640625, -0.1826171875, -0.066741943359375, 0.04913330078125, 0.165008544921875, 0.2808837890625, 0.396759033203125, 0.51263427734375, 0.628509521484375, 0.744384765625, 0.860260009765625, 0.97613525390625, 1.092010498046875, 1.2078857421875, 1.323760986328125, 1.43963623046875, 1.555511474609375, 1.67138671875, 1.787261962890625, 1.90313720703125, 2.019012451171875, 2.1348876953125, 2.250762939453125, 2.36663818359375, 2.482513427734375, 2.598388671875, 2.714263916015625, 2.83013916015625, 2.946014404296875, 3.0618896484375, 3.177764892578125, 3.29364013671875, 3.409515380859375, 3.525390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 10.0, 8.0, 14.0, 29.0, 38.0, 46.0, 68.0, 101.0, 137.0, 200.0, 353.0, 536.0, 852.0, 1353.0, 2184.0, 3600.0, 6010.0, 10157.0, 17796.0, 30975.0, 56903.0, 104562.0, 189649.0, 263425.0, 161248.0, 87277.0, 47779.0, 26319.0, 14996.0, 8619.0, 5065.0, 3034.0, 1917.0, 1204.0, 732.0, 445.0, 306.0, 191.0, 147.0, 81.0, 64.0, 38.0, 33.0, 15.0, 17.0, 4.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.4150390625, -0.40259552001953125, -0.3901519775390625, -0.37770843505859375, -0.365264892578125, -0.35282135009765625, -0.3403778076171875, -0.32793426513671875, -0.31549072265625, -0.30304718017578125, -0.2906036376953125, -0.27816009521484375, -0.265716552734375, -0.25327301025390625, -0.2408294677734375, -0.22838592529296875, -0.2159423828125, -0.20349884033203125, -0.1910552978515625, -0.17861175537109375, -0.166168212890625, -0.15372467041015625, -0.1412811279296875, -0.12883758544921875, -0.11639404296875, -0.10395050048828125, -0.0915069580078125, -0.07906341552734375, -0.066619873046875, -0.05417633056640625, -0.0417327880859375, -0.02928924560546875, -0.016845703125, -0.00440216064453125, 0.0080413818359375, 0.02048492431640625, 0.032928466796875, 0.04537200927734375, 0.0578155517578125, 0.07025909423828125, 0.08270263671875, 0.09514617919921875, 0.1075897216796875, 0.12003326416015625, 0.132476806640625, 0.14492034912109375, 0.1573638916015625, 0.16980743408203125, 0.1822509765625, 0.19469451904296875, 0.2071380615234375, 0.21958160400390625, 0.232025146484375, 0.24446868896484375, 0.2569122314453125, 0.26935577392578125, 0.28179931640625, 0.29424285888671875, 0.3066864013671875, 0.31912994384765625, 0.331573486328125, 0.34401702880859375, 0.3564605712890625, 0.36890411376953125, 0.38134765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 8.0, 8.0, 16.0, 19.0, 19.0, 38.0, 27.0, 47.0, 64.0, 73.0, 84.0, 79.0, 94.0, 90.0, 58.0, 68.0, 55.0, 38.0, 29.0, 22.0, 12.0, 12.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019443035125732422, -0.00018889643251895905, -0.00018336251378059387, -0.0001778285950422287, -0.00017229467630386353, -0.00016676075756549835, -0.00016122683882713318, -0.000155692920088768, -0.00015015900135040283, -0.00014462508261203766, -0.00013909116387367249, -0.0001335572451353073, -0.00012802332639694214, -0.00012248940765857697, -0.00011695548892021179, -0.00011142157018184662, -0.00010588765144348145, -0.00010035373270511627, -9.48198139667511e-05, -8.928589522838593e-05, -8.375197649002075e-05, -7.821805775165558e-05, -7.26841390132904e-05, -6.715022027492523e-05, -6.161630153656006e-05, -5.6082382798194885e-05, -5.054846405982971e-05, -4.501454532146454e-05, -3.9480626583099365e-05, -3.394670784473419e-05, -2.841278910636902e-05, -2.2878870368003845e-05, -1.7344951629638672e-05, -1.1811032891273499e-05, -6.277114152908325e-06, -7.431954145431519e-07, 4.7907233238220215e-06, 1.0324642062187195e-05, 1.5858560800552368e-05, 2.139247953891754e-05, 2.6926398277282715e-05, 3.246031701564789e-05, 3.799423575401306e-05, 4.3528154492378235e-05, 4.906207323074341e-05, 5.459599196910858e-05, 6.0129910707473755e-05, 6.566382944583893e-05, 7.11977481842041e-05, 7.673166692256927e-05, 8.226558566093445e-05, 8.779950439929962e-05, 9.33334231376648e-05, 9.886734187602997e-05, 0.00010440126061439514, 0.00010993517935276031, 0.00011546909809112549, 0.00012100301682949066, 0.00012653693556785583, 0.000132070854306221, 0.00013760477304458618, 0.00014313869178295135, 0.00014867261052131653, 0.0001542065292596817, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 13.0, 31.0, 25.0, 42.0, 64.0, 77.0, 105.0, 148.0, 203.0, 361.0, 474.0, 686.0, 1104.0, 1820.0, 2984.0, 5049.0, 9232.0, 17438.0, 34470.0, 69575.0, 141133.0, 278618.0, 238383.0, 121779.0, 59923.0, 29633.0, 15254.0, 8159.0, 4469.0, 2657.0, 1638.0, 957.0, 630.0, 414.0, 322.0, 209.0, 141.0, 98.0, 75.0, 37.0, 32.0, 33.0, 18.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.52978515625, -0.5136795043945312, -0.4975738525390625, -0.48146820068359375, -0.465362548828125, -0.44925689697265625, -0.4331512451171875, -0.41704559326171875, -0.40093994140625, -0.38483428955078125, -0.3687286376953125, -0.35262298583984375, -0.336517333984375, -0.32041168212890625, -0.3043060302734375, -0.28820037841796875, -0.2720947265625, -0.25598907470703125, -0.2398834228515625, -0.22377777099609375, -0.207672119140625, -0.19156646728515625, -0.1754608154296875, -0.15935516357421875, -0.14324951171875, -0.12714385986328125, -0.1110382080078125, -0.09493255615234375, -0.078826904296875, -0.06272125244140625, -0.0466156005859375, -0.03050994873046875, -0.014404296875, 0.00170135498046875, 0.0178070068359375, 0.03391265869140625, 0.050018310546875, 0.06612396240234375, 0.0822296142578125, 0.09833526611328125, 0.11444091796875, 0.13054656982421875, 0.1466522216796875, 0.16275787353515625, 0.178863525390625, 0.19496917724609375, 0.2110748291015625, 0.22718048095703125, 0.2432861328125, 0.25939178466796875, 0.2754974365234375, 0.29160308837890625, 0.307708740234375, 0.32381439208984375, 0.3399200439453125, 0.35602569580078125, 0.37213134765625, 0.38823699951171875, 0.4043426513671875, 0.42044830322265625, 0.436553955078125, 0.45265960693359375, 0.4687652587890625, 0.48487091064453125, 0.5009765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 6.0, 6.0, 15.0, 14.0, 29.0, 25.0, 14.0, 30.0, 42.0, 38.0, 60.0, 57.0, 79.0, 78.0, 83.0, 86.0, 52.0, 34.0, 45.0, 36.0, 31.0, 28.0, 16.0, 17.0, 12.0, 7.0, 11.0, 8.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.49462890625, -0.48003387451171875, -0.4654388427734375, -0.45084381103515625, -0.436248779296875, -0.42165374755859375, -0.4070587158203125, -0.39246368408203125, -0.37786865234375, -0.36327362060546875, -0.3486785888671875, -0.33408355712890625, -0.319488525390625, -0.30489349365234375, -0.2902984619140625, -0.27570343017578125, -0.2611083984375, -0.24651336669921875, -0.2319183349609375, -0.21732330322265625, -0.202728271484375, -0.18813323974609375, -0.1735382080078125, -0.15894317626953125, -0.14434814453125, -0.12975311279296875, -0.1151580810546875, -0.10056304931640625, -0.085968017578125, -0.07137298583984375, -0.0567779541015625, -0.04218292236328125, -0.027587890625, -0.01299285888671875, 0.0016021728515625, 0.01619720458984375, 0.030792236328125, 0.04538726806640625, 0.0599822998046875, 0.07457733154296875, 0.08917236328125, 0.10376739501953125, 0.1183624267578125, 0.13295745849609375, 0.147552490234375, 0.16214752197265625, 0.1767425537109375, 0.19133758544921875, 0.2059326171875, 0.22052764892578125, 0.2351226806640625, 0.24971771240234375, 0.264312744140625, 0.27890777587890625, 0.2935028076171875, 0.30809783935546875, 0.32269287109375, 0.33728790283203125, 0.3518829345703125, 0.36647796630859375, 0.381072998046875, 0.39566802978515625, 0.4102630615234375, 0.42485809326171875, 0.439453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 10.0, 26.0, 34.0, 59.0, 79.0, 125.0, 151.0, 108.0, 126.0, 101.0, 61.0, 43.0, 32.0, 21.0, 5.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.081125259399414, -5.7800140380859375, -5.478902816772461, -5.177792072296143, -4.876680850982666, -4.5755696296691895, -4.274458885192871, -3.9733476638793945, -3.672236442565918, -3.3711252212524414, -3.070014238357544, -2.7689032554626465, -2.46779203414917, -2.1666808128356934, -1.865569829940796, -1.5644588470458984, -1.2633476257324219, -0.9622365236282349, -0.6611254215240479, -0.36001431941986084, -0.05890321731567383, 0.24220788478851318, 0.5433189868927002, 0.8444299697875977, 1.1455411911010742, 1.4466522932052612, 1.7477633953094482, 2.0488743782043457, 2.3499855995178223, 2.651096820831299, 2.9522078037261963, 3.2533187866210938, 3.5544309616088867, 3.8555421829223633, 4.15665340423584, 4.457764148712158, 4.758875370025635, 5.059986591339111, 5.36109733581543, 5.662208557128906, 5.963319778442383, 6.264430999755859, 6.565542221069336, 6.866652965545654, 7.167764186859131, 7.468875408172607, 7.769986152648926, 8.071097373962402, 8.372208595275879, 8.673319816589355, 8.974431037902832, 9.275542259216309, 9.576652526855469, 9.877763748168945, 10.178874969482422, 10.479986190795898, 10.781097412109375, 11.082208633422852, 11.383319854736328, 11.684431076049805, 11.985542297363281, 12.286652565002441, 12.587763786315918, 12.888875007629395, 13.189986228942871]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 3.0, 5.0, 14.0, 10.0, 14.0, 13.0, 22.0, 16.0, 19.0, 26.0, 28.0, 34.0, 29.0, 36.0, 31.0, 41.0, 47.0, 46.0, 42.0, 33.0, 52.0, 41.0, 40.0, 39.0, 36.0, 39.0, 33.0, 34.0, 21.0, 31.0, 20.0, 24.0, 11.0, 15.0, 12.0, 9.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.644021034240723, -7.400257110595703, -7.156493186950684, -6.912729263305664, -6.668964862823486, -6.425200939178467, -6.181437015533447, -5.937673091888428, -5.69390869140625, -5.4501447677612305, -5.206380844116211, -4.962616920471191, -4.718852519989014, -4.475088596343994, -4.231324672698975, -3.987560749053955, -3.7437968254089355, -3.500032901763916, -3.2562687397003174, -3.012504816055298, -2.768740653991699, -2.5249767303466797, -2.28121280670166, -2.0374488830566406, -1.793684720993042, -1.549920678138733, -1.3061566352844238, -1.0623927116394043, -0.8186286687850952, -0.5748646259307861, -0.3311007022857666, -0.08733665943145752, 0.15642786026000977, 0.40019187331199646, 0.6439558863639832, 0.8877198696136475, 1.1314839124679565, 1.3752479553222656, 1.6190118789672852, 1.8627759218215942, 2.1065399646759033, 2.350303888320923, 2.5940680503845215, 2.837831974029541, 3.0815958976745605, 3.325360059738159, 3.5691239833831787, 3.8128881454467773, 4.056652069091797, 4.300415992736816, 4.544179916381836, 4.7879438400268555, 5.031708240509033, 5.275472164154053, 5.519236087799072, 5.763000011444092, 6.0067644119262695, 6.250528335571289, 6.494292259216309, 6.738056182861328, 6.981820583343506, 7.225584506988525, 7.469348430633545, 7.7131123542785645, 7.956876277923584]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 18.0, 9.0, 17.0, 22.0, 25.0, 38.0, 51.0, 53.0, 89.0, 112.0, 159.0, 216.0, 309.0, 414.0, 558.0, 785.0, 1176.0, 1706.0, 3094.0, 1034804.0, 2120.0, 1373.0, 917.0, 671.0, 493.0, 356.0, 263.0, 195.0, 140.0, 101.0, 67.0, 68.0, 42.0, 36.0, 22.0, 21.0, 10.0, 15.0, 5.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.278793334960938, -8.005146980285645, -7.731500625610352, -7.457854270935059, -7.184207916259766, -6.910561561584473, -6.6369147300720215, -6.3632683753967285, -6.0896220207214355, -5.815975666046143, -5.54232931137085, -5.268682956695557, -4.9950361251831055, -4.7213897705078125, -4.4477434158325195, -4.174097061157227, -3.9004507064819336, -3.6268043518066406, -3.3531579971313477, -3.0795114040374756, -2.8058650493621826, -2.5322186946868896, -2.2585721015930176, -1.9849257469177246, -1.7112793922424316, -1.4376330375671387, -1.1639865636825562, -0.8903401494026184, -0.6166937351226807, -0.3430473804473877, -0.06940090656280518, 0.20424556732177734, 0.4778909683227539, 0.7515373826026917, 1.0251837968826294, 1.298830270767212, 1.5724766254425049, 1.8461229801177979, 2.11976957321167, 2.393415927886963, 2.667062282562256, 2.940708637237549, 3.214354991912842, 3.488001585006714, 3.761647939682007, 4.035294532775879, 4.308940887451172, 4.582587242126465, 4.856233596801758, 5.129879951477051, 5.403526306152344, 5.677172660827637, 5.95081901550293, 6.224465370178223, 6.498112201690674, 6.771758556365967, 7.04540491104126, 7.319051265716553, 7.592697620391846, 7.866343975067139, 8.13999080657959, 8.413637161254883, 8.687283515930176, 8.960929870605469, 9.234576225280762]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 42.0, 78.0, 130.0, 316.0, 1672.0, 12631.0, 51434052.0, 18995.0, 2572.0, 504.0, 165.0, 58.0, 25.0, 18.0, 7.0, 9.0, 12.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.71875, -32.34563446044922, -30.972518920898438, -29.599403381347656, -28.226289749145508, -26.853174209594727, -25.480058670043945, -24.106945037841797, -22.733829498291016, -21.360713958740234, -19.987598419189453, -18.614482879638672, -17.241369247436523, -15.868253707885742, -14.495138168334961, -13.122023582458496, -11.748907089233398, -10.375791549682617, -9.002676963806152, -7.629561424255371, -6.256446361541748, -4.883331298828125, -3.5102157592773438, -2.137101173400879, -0.7639856338500977, 0.6091295480728149, 1.9822447299957275, 3.3553600311279297, 4.728475093841553, 6.101590156555176, 7.474705696105957, 8.847820281982422, 10.220935821533203, 11.594051361083984, 12.96716594696045, 14.34028148651123, 15.713396072387695, 17.086511611938477, 18.459627151489258, 19.832740783691406, 21.205856323242188, 22.57897186279297, 23.95208740234375, 25.32520294189453, 26.69831657409668, 28.07143211364746, 29.444547653198242, 30.81766128540039, 32.19078063964844, 33.56389617919922, 34.93701171875, 36.31012725830078, 37.68324279785156, 39.056358337402344, 40.429473876953125, 41.80258560180664, 43.17570114135742, 44.5488166809082, 45.921932220458984, 47.295047760009766, 48.66816329956055, 50.04127502441406, 51.414390563964844, 52.787506103515625, 54.160621643066406]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 3.0, 11.0, 8.0, 13.0, 15.0, 27.0, 25.0, 53.0, 71.0, 111.0, 153.0, 230.0, 356.0, 484.0, 757.0, 1270.0, 2343.0, 4923.0, 12286.0, 39192.0, 147367.0, 592249.0, 4509129.0, 723973.0, 183102.0, 47266.0, 14737.0, 5358.0, 2528.0, 1241.0, 764.0, 502.0, 310.0, 186.0, 143.0, 80.0, 52.0, 27.0, 33.0, 15.0, 9.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.63037109375, -0.6144447326660156, -0.5985183715820312, -0.5825920104980469, -0.5666656494140625, -0.5507392883300781, -0.5348129272460938, -0.5188865661621094, -0.502960205078125, -0.4870338439941406, -0.47110748291015625, -0.4551811218261719, -0.4392547607421875, -0.4233283996582031, -0.40740203857421875, -0.3914756774902344, -0.37554931640625, -0.3596229553222656, -0.34369659423828125, -0.3277702331542969, -0.3118438720703125, -0.2959175109863281, -0.27999114990234375, -0.2640647888183594, -0.248138427734375, -0.23221206665039062, -0.21628570556640625, -0.20035934448242188, -0.1844329833984375, -0.16850662231445312, -0.15258026123046875, -0.13665390014648438, -0.1207275390625, -0.10480117797851562, -0.08887481689453125, -0.07294845581054688, -0.0570220947265625, -0.041095733642578125, -0.02516937255859375, -0.009243011474609375, 0.006683349609375, 0.022609710693359375, 0.03853607177734375, 0.054462432861328125, 0.0703887939453125, 0.08631515502929688, 0.10224151611328125, 0.11816787719726562, 0.13409423828125, 0.15002059936523438, 0.16594696044921875, 0.18187332153320312, 0.1977996826171875, 0.21372604370117188, 0.22965240478515625, 0.24557876586914062, 0.261505126953125, 0.2774314880371094, 0.29335784912109375, 0.3092842102050781, 0.3252105712890625, 0.3411369323730469, 0.35706329345703125, 0.3729896545410156, 0.388916015625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 10.0, 16.0, 10.0, 17.0, 22.0, 25.0, 18.0, 34.0, 44.0, 39.0, 55.0, 52.0, 53.0, 105.0, 1006.0, 59.0, 59.0, 54.0, 46.0, 40.0, 38.0, 33.0, 30.0, 27.0, 21.0, 21.0, 18.0, 14.0, 9.0, 4.0, 8.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.15625, -17.552734375, -16.94921875, -16.345703125, -15.7421875, -15.138671875, -14.53515625, -13.931640625, -13.328125, -12.724609375, -12.12109375, -11.517578125, -10.9140625, -10.310546875, -9.70703125, -9.103515625, -8.5, -7.896484375, -7.29296875, -6.689453125, -6.0859375, -5.482421875, -4.87890625, -4.275390625, -3.671875, -3.068359375, -2.46484375, -1.861328125, -1.2578125, -0.654296875, -0.05078125, 0.552734375, 1.15625, 1.759765625, 2.36328125, 2.966796875, 3.5703125, 4.173828125, 4.77734375, 5.380859375, 5.984375, 6.587890625, 7.19140625, 7.794921875, 8.3984375, 9.001953125, 9.60546875, 10.208984375, 10.8125, 11.416015625, 12.01953125, 12.623046875, 13.2265625, 13.830078125, 14.43359375, 15.037109375, 15.640625, 16.244140625, 16.84765625, 17.451171875, 18.0546875, 18.658203125, 19.26171875, 19.865234375, 20.46875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 0.0, 17.0, 20.0, 16.0, 20.0, 30.0, 43.0, 49.0, 40.0, 49.0, 65.0, 80.0, 119.0, 150.0, 198.0, 249.0, 337.0, 394.0, 523.0, 771.0, 1212.0, 1986.0, 3713.0, 7658.0, 17265.0, 46175.0, 138520.0, 445342.0, 4206059.0, 920655.0, 331574.0, 103870.0, 35495.0, 13785.0, 6042.0, 3165.0, 1670.0, 1146.0, 761.0, 516.0, 354.0, 292.0, 214.0, 167.0, 133.0, 106.0, 90.0, 72.0, 74.0, 44.0, 25.0, 21.0, 14.0, 21.0, 15.0, 4.0, 7.0, 3.0, 5.0, 2.0], "bins": [-0.322265625, -0.31246185302734375, -0.3026580810546875, -0.29285430908203125, -0.283050537109375, -0.27324676513671875, -0.2634429931640625, -0.25363922119140625, -0.24383544921875, -0.23403167724609375, -0.2242279052734375, -0.21442413330078125, -0.204620361328125, -0.19481658935546875, -0.1850128173828125, -0.17520904541015625, -0.1654052734375, -0.15560150146484375, -0.1457977294921875, -0.13599395751953125, -0.126190185546875, -0.11638641357421875, -0.1065826416015625, -0.09677886962890625, -0.08697509765625, -0.07717132568359375, -0.0673675537109375, -0.05756378173828125, -0.047760009765625, -0.03795623779296875, -0.0281524658203125, -0.01834869384765625, -0.008544921875, 0.00125885009765625, 0.0110626220703125, 0.02086639404296875, 0.030670166015625, 0.04047393798828125, 0.0502777099609375, 0.06008148193359375, 0.06988525390625, 0.07968902587890625, 0.0894927978515625, 0.09929656982421875, 0.109100341796875, 0.11890411376953125, 0.1287078857421875, 0.13851165771484375, 0.1483154296875, 0.15811920166015625, 0.1679229736328125, 0.17772674560546875, 0.187530517578125, 0.19733428955078125, 0.2071380615234375, 0.21694183349609375, 0.22674560546875, 0.23654937744140625, 0.2463531494140625, 0.25615692138671875, 0.265960693359375, 0.27576446533203125, 0.2855682373046875, 0.29537200927734375, 0.30517578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 8.0, 17.0, 16.0, 14.0, 23.0, 35.0, 28.0, 35.0, 59.0, 49.0, 47.0, 61.0, 56.0, 1076.0, 72.0, 71.0, 61.0, 50.0, 51.0, 38.0, 32.0, 23.0, 17.0, 10.0, 20.0, 14.0, 9.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.1875, -22.515380859375, -21.84326171875, -21.171142578125, -20.4990234375, -19.826904296875, -19.15478515625, -18.482666015625, -17.810546875, -17.138427734375, -16.46630859375, -15.794189453125, -15.1220703125, -14.449951171875, -13.77783203125, -13.105712890625, -12.43359375, -11.761474609375, -11.08935546875, -10.417236328125, -9.7451171875, -9.072998046875, -8.40087890625, -7.728759765625, -7.056640625, -6.384521484375, -5.71240234375, -5.040283203125, -4.3681640625, -3.696044921875, -3.02392578125, -2.351806640625, -1.6796875, -1.007568359375, -0.33544921875, 0.336669921875, 1.0087890625, 1.680908203125, 2.35302734375, 3.025146484375, 3.697265625, 4.369384765625, 5.04150390625, 5.713623046875, 6.3857421875, 7.057861328125, 7.72998046875, 8.402099609375, 9.07421875, 9.746337890625, 10.41845703125, 11.090576171875, 11.7626953125, 12.434814453125, 13.10693359375, 13.779052734375, 14.451171875, 15.123291015625, 15.79541015625, 16.467529296875, 17.1396484375, 17.811767578125, 18.48388671875, 19.156005859375, 19.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 13.0, 11.0, 20.0, 23.0, 43.0, 60.0, 98.0, 228.0, 409.0, 729.0, 1565.0, 3940.0, 23214.0, 6129902.0, 119443.0, 6912.0, 2549.0, 1022.0, 553.0, 243.0, 184.0, 74.0, 55.0, 36.0, 28.0, 23.0, 12.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.4609375, -2.3989410400390625, -2.336944580078125, -2.2749481201171875, -2.21295166015625, -2.1509552001953125, -2.088958740234375, -2.0269622802734375, -1.9649658203125, -1.9029693603515625, -1.840972900390625, -1.7789764404296875, -1.71697998046875, -1.6549835205078125, -1.592987060546875, -1.5309906005859375, -1.468994140625, -1.4069976806640625, -1.345001220703125, -1.2830047607421875, -1.22100830078125, -1.1590118408203125, -1.097015380859375, -1.0350189208984375, -0.9730224609375, -0.9110260009765625, -0.849029541015625, -0.7870330810546875, -0.72503662109375, -0.6630401611328125, -0.601043701171875, -0.5390472412109375, -0.47705078125, -0.4150543212890625, -0.353057861328125, -0.2910614013671875, -0.22906494140625, -0.1670684814453125, -0.105072021484375, -0.0430755615234375, 0.0189208984375, 0.0809173583984375, 0.142913818359375, 0.2049102783203125, 0.26690673828125, 0.3289031982421875, 0.390899658203125, 0.4528961181640625, 0.514892578125, 0.5768890380859375, 0.638885498046875, 0.7008819580078125, 0.76287841796875, 0.8248748779296875, 0.886871337890625, 0.9488677978515625, 1.0108642578125, 1.0728607177734375, 1.134857177734375, 1.1968536376953125, 1.25885009765625, 1.3208465576171875, 1.382843017578125, 1.4448394775390625, 1.5068359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 8.0, 11.0, 15.0, 38.0, 56.0, 83.0, 94.0, 120.0, 1152.0, 106.0, 100.0, 67.0, 71.0, 47.0, 18.0, 15.0, 8.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.40625, -14.3388671875, -13.271484375, -12.2041015625, -11.13671875, -10.0693359375, -9.001953125, -7.9345703125, -6.8671875, -5.7998046875, -4.732421875, -3.6650390625, -2.59765625, -1.5302734375, -0.462890625, 0.6044921875, 1.671875, 2.7392578125, 3.806640625, 4.8740234375, 5.94140625, 7.0087890625, 8.076171875, 9.1435546875, 10.2109375, 11.2783203125, 12.345703125, 13.4130859375, 14.48046875, 15.5478515625, 16.615234375, 17.6826171875, 18.75, 19.8173828125, 20.884765625, 21.9521484375, 23.01953125, 24.0869140625, 25.154296875, 26.2216796875, 27.2890625, 28.3564453125, 29.423828125, 30.4912109375, 31.55859375, 32.6259765625, 33.693359375, 34.7607421875, 35.828125, 36.8955078125, 37.962890625, 39.0302734375, 40.09765625, 41.1650390625, 42.232421875, 43.2998046875, 44.3671875, 45.4345703125, 46.501953125, 47.5693359375, 48.63671875, 49.7041015625, 50.771484375, 51.8388671875, 52.90625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 16.0, 883.0, 107.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.4377670288086, -85.56261444091797, -82.68745422363281, -79.81230163574219, -76.93714904785156, -74.0619888305664, -71.18683624267578, -68.31167602539062, -65.4365234375, -62.56136703491211, -59.68621063232422, -56.811058044433594, -53.9359016418457, -51.06074523925781, -48.18559265136719, -45.3104362487793, -42.435279846191406, -39.560123443603516, -36.684967041015625, -33.809814453125, -30.93465805053711, -28.05950164794922, -25.18434715270996, -22.309192657470703, -19.434036254882812, -16.558879852294922, -13.683725357055664, -10.80856990814209, -7.933414459228516, -5.058259010314941, -2.183103561401367, 0.6920509338378906, 3.56719970703125, 6.442355155944824, 9.317510604858398, 12.192666053771973, 15.067821502685547, 17.942977905273438, 20.818132400512695, 23.693286895751953, 26.568443298339844, 29.443599700927734, 32.318756103515625, 35.19390869140625, 38.06906509399414, 40.94422149658203, 43.819374084472656, 46.69453048706055, 49.56968688964844, 52.44484329223633, 55.31999969482422, 58.195152282714844, 61.070308685302734, 63.945465087890625, 66.82061767578125, 69.69577026367188, 72.57093048095703, 75.44608306884766, 78.32124328613281, 81.19639587402344, 84.07154846191406, 86.94670867919922, 89.82186126708984, 92.697021484375, 95.57217407226562]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 21.0, 56.0, 118.0, 186.0, 207.0, 182.0, 117.0, 58.0, 24.0, 16.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.10977935791016, -93.33302307128906, -90.55626678466797, -87.7795181274414, -85.00276184082031, -82.22600555419922, -79.44924926757812, -76.67250061035156, -73.89574432373047, -71.11898803710938, -68.34223175048828, -65.56548309326172, -62.788726806640625, -60.01197052001953, -57.23521423339844, -54.45846176147461, -51.681705474853516, -48.90494918823242, -46.128196716308594, -43.3514404296875, -40.57468795776367, -37.79793167114258, -35.02117919921875, -32.244422912597656, -29.467668533325195, -26.690914154052734, -23.914159774780273, -21.137405395507812, -18.36064910888672, -15.583895683288574, -12.807140350341797, -10.030385971069336, -7.253631591796875, -4.476877212524414, -1.700122356414795, 1.0766324996948242, 3.853386878967285, 6.630141258239746, 9.406896591186523, 12.183650970458984, 14.960405349731445, 17.737159729003906, 20.513914108276367, 23.290668487548828, 26.067424774169922, 28.84417724609375, 31.620933532714844, 34.39768981933594, 37.174442291259766, 39.95119857788086, 42.72795104980469, 45.50470733642578, 48.28145980834961, 51.0582160949707, 53.83496856689453, 56.611724853515625, 59.38848114013672, 62.16523742675781, 64.9419937133789, 67.71874237060547, 70.49549865722656, 73.27225494384766, 76.04901123046875, 78.82575988769531, 81.6025161743164]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 21.0, 25.0, 3286.0, 6444.0, 134530.0, 4041061.0, 6289.0, 1330.0, 1236.0, 18.0, 8.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1585693359375, -0.15392494201660156, -0.14928054809570312, -0.1446361541748047, -0.13999176025390625, -0.1353473663330078, -0.13070297241210938, -0.12605857849121094, -0.1214141845703125, -0.11676979064941406, -0.11212539672851562, -0.10748100280761719, -0.10283660888671875, -0.09819221496582031, -0.09354782104492188, -0.08890342712402344, -0.084259033203125, -0.07961463928222656, -0.07497024536132812, -0.07032585144042969, -0.06568145751953125, -0.06103706359863281, -0.056392669677734375, -0.05174827575683594, -0.0471038818359375, -0.04245948791503906, -0.037815093994140625, -0.03317070007324219, -0.02852630615234375, -0.023881912231445312, -0.019237518310546875, -0.014593124389648438, -0.00994873046875, -0.0053043365478515625, -0.000659942626953125, 0.0039844512939453125, 0.00862884521484375, 0.013273239135742188, 0.017917633056640625, 0.022562026977539062, 0.0272064208984375, 0.03185081481933594, 0.036495208740234375, 0.04113960266113281, 0.04578399658203125, 0.05042839050292969, 0.055072784423828125, 0.05971717834472656, 0.064361572265625, 0.06900596618652344, 0.07365036010742188, 0.07829475402832031, 0.08293914794921875, 0.08758354187011719, 0.09222793579101562, 0.09687232971191406, 0.1015167236328125, 0.10616111755371094, 0.11080551147460938, 0.11544990539550781, 0.12009429931640625, 0.12473869323730469, 0.12938308715820312, 0.13402748107910156, 0.138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 59.0, 225.0, 579.0, 90.0, 28.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0906982421875, -0.08805465698242188, -0.08541107177734375, -0.08276748657226562, -0.0801239013671875, -0.07748031616210938, -0.07483673095703125, -0.07219314575195312, -0.069549560546875, -0.06690597534179688, -0.06426239013671875, -0.061618804931640625, -0.0589752197265625, -0.056331634521484375, -0.05368804931640625, -0.051044464111328125, -0.04840087890625, -0.045757293701171875, -0.04311370849609375, -0.040470123291015625, -0.0378265380859375, -0.035182952880859375, -0.03253936767578125, -0.029895782470703125, -0.027252197265625, -0.024608612060546875, -0.02196502685546875, -0.019321441650390625, -0.0166778564453125, -0.014034271240234375, -0.01139068603515625, -0.008747100830078125, -0.006103515625, -0.003459930419921875, -0.00081634521484375, 0.001827239990234375, 0.0044708251953125, 0.007114410400390625, 0.00975799560546875, 0.012401580810546875, 0.015045166015625, 0.017688751220703125, 0.02033233642578125, 0.022975921630859375, 0.0256195068359375, 0.028263092041015625, 0.03090667724609375, 0.033550262451171875, 0.03619384765625, 0.038837432861328125, 0.04148101806640625, 0.044124603271484375, 0.0467681884765625, 0.049411773681640625, 0.05205535888671875, 0.054698944091796875, 0.057342529296875, 0.059986114501953125, 0.06262969970703125, 0.06527328491210938, 0.0679168701171875, 0.07056045532226562, 0.07320404052734375, 0.07584762573242188, 0.0784912109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 9.0, 21.0, 31.0, 56.0, 70.0, 160.0, 351.0, 1695.0, 4187705.0, 3402.0, 390.0, 138.0, 65.0, 49.0, 28.0, 23.0, 12.0, 12.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1494140625, -0.1446819305419922, -0.13994979858398438, -0.13521766662597656, -0.13048553466796875, -0.12575340270996094, -0.12102127075195312, -0.11628913879394531, -0.1115570068359375, -0.10682487487792969, -0.10209274291992188, -0.09736061096191406, -0.09262847900390625, -0.08789634704589844, -0.08316421508789062, -0.07843208312988281, -0.073699951171875, -0.06896781921386719, -0.06423568725585938, -0.05950355529785156, -0.05477142333984375, -0.05003929138183594, -0.045307159423828125, -0.04057502746582031, -0.0358428955078125, -0.031110763549804688, -0.026378631591796875, -0.021646499633789062, -0.01691436767578125, -0.012182235717773438, -0.007450103759765625, -0.0027179718017578125, 0.00201416015625, 0.0067462921142578125, 0.011478424072265625, 0.016210556030273438, 0.02094268798828125, 0.025674819946289062, 0.030406951904296875, 0.03513908386230469, 0.0398712158203125, 0.04460334777832031, 0.049335479736328125, 0.05406761169433594, 0.05879974365234375, 0.06353187561035156, 0.06826400756835938, 0.07299613952636719, 0.077728271484375, 0.08246040344238281, 0.08719253540039062, 0.09192466735839844, 0.09665679931640625, 0.10138893127441406, 0.10612106323242188, 0.11085319519042969, 0.1155853271484375, 0.12031745910644531, 0.12504959106445312, 0.12978172302246094, 0.13451385498046875, 0.13924598693847656, 0.14397811889648438, 0.1487102508544922, 0.1534423828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 10.0, 20.0, 30.0, 51.0, 75.0, 154.0, 299.0, 710.0, 1325.0, 740.0, 294.0, 118.0, 67.0, 46.0, 26.0, 21.0, 13.0, 11.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.032379150390625, -0.031352996826171875, -0.03032684326171875, -0.029300689697265625, -0.0282745361328125, -0.027248382568359375, -0.02622222900390625, -0.025196075439453125, -0.024169921875, -0.023143768310546875, -0.02211761474609375, -0.021091461181640625, -0.0200653076171875, -0.019039154052734375, -0.01801300048828125, -0.016986846923828125, -0.015960693359375, -0.014934539794921875, -0.01390838623046875, -0.012882232666015625, -0.0118560791015625, -0.010829925537109375, -0.00980377197265625, -0.008777618408203125, -0.00775146484375, -0.006725311279296875, -0.00569915771484375, -0.004673004150390625, -0.0036468505859375, -0.002620697021484375, -0.00159454345703125, -0.000568389892578125, 0.000457763671875, 0.001483917236328125, 0.00251007080078125, 0.003536224365234375, 0.0045623779296875, 0.005588531494140625, 0.00661468505859375, 0.007640838623046875, 0.0086669921875, 0.009693145751953125, 0.01071929931640625, 0.011745452880859375, 0.0127716064453125, 0.013797760009765625, 0.01482391357421875, 0.015850067138671875, 0.016876220703125, 0.017902374267578125, 0.01892852783203125, 0.019954681396484375, 0.0209808349609375, 0.022006988525390625, 0.02303314208984375, 0.024059295654296875, 0.02508544921875, 0.026111602783203125, 0.02713775634765625, 0.028163909912109375, 0.0291900634765625, 0.030216217041015625, 0.03124237060546875, 0.032268524169921875, 0.033294677734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 957.0, 59.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13312101364135742, -0.12063343077898026, -0.10814584791660309, -0.09565827250480652, -0.08317068964242935, -0.07068310678005219, -0.058195531368255615, -0.04570794850587845, -0.03322036564350128, -0.020732784643769264, -0.008245203644037247, 0.004242375493049622, 0.01672995835542679, 0.029217541217803955, 0.041705116629600525, 0.05419269949197769, 0.06668028235435486, 0.07916786521673203, 0.09165544807910919, 0.10414302349090576, 0.11663060635328293, 0.1291181892156601, 0.14160576462745667, 0.15409335494041443, 0.166580930352211, 0.17906850576400757, 0.19155609607696533, 0.2040436714887619, 0.21653124690055847, 0.22901883721351624, 0.2415064126253128, 0.2539939880371094, 0.26648157835006714, 0.2789691686630249, 0.2914567291736603, 0.30394431948661804, 0.3164319097995758, 0.3289194703102112, 0.34140706062316895, 0.3538946509361267, 0.3663822412490845, 0.37886983156204224, 0.3913573920726776, 0.4038449823856354, 0.41633257269859314, 0.4288201332092285, 0.4413077235221863, 0.45379531383514404, 0.4662828743457794, 0.4787704646587372, 0.49125802516937256, 0.5037456154823303, 0.5162332057952881, 0.5287207961082458, 0.5412083864212036, 0.5536959171295166, 0.5661835074424744, 0.5786710977554321, 0.5911586880683899, 0.6036462783813477, 0.6161338090896606, 0.6286213994026184, 0.6411089897155762, 0.6535965800285339, 0.6660841703414917]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 15.0, 14.0, 9.0, 12.0, 18.0, 17.0, 19.0, 27.0, 28.0, 28.0, 25.0, 23.0, 32.0, 42.0, 34.0, 32.0, 38.0, 40.0, 46.0, 36.0, 43.0, 46.0, 43.0, 25.0, 31.0, 36.0, 37.0, 30.0, 24.0, 24.0, 20.0, 20.0, 16.0, 12.0, 5.0, 12.0, 8.0, 5.0, 2.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.051763057708740234, -0.050176411867141724, -0.048589762300252914, -0.047003112733364105, -0.045416466891765594, -0.043829821050167084, -0.042243171483278275, -0.040656521916389465, -0.039069876074790955, -0.037483230233192444, -0.035896580666303635, -0.034309931099414825, -0.032723285257816315, -0.031136637553572655, -0.029549989849328995, -0.027963342145085335, -0.026376694440841675, -0.024790046736598015, -0.023203399032354355, -0.021616751328110695, -0.020030103623867035, -0.018443455919623375, -0.016856808215379715, -0.015270160511136055, -0.013683512806892395, -0.012096865102648735, -0.010510217398405075, -0.008923569694161415, -0.007336921989917755, -0.005750274285674095, -0.004163626581430435, -0.002576978877186775, -0.0009903311729431152, 0.0005963165313005447, 0.0021829642355442047, 0.0037696119397878647, 0.005356259644031525, 0.006942907348275185, 0.008529555052518845, 0.010116202756762505, 0.011702850461006165, 0.013289498165249825, 0.014876145869493484, 0.016462793573737144, 0.018049441277980804, 0.019636088982224464, 0.021222736686468124, 0.022809384390711784, 0.024396032094955444, 0.025982679799199104, 0.027569327503442764, 0.029155975207686424, 0.030742622911930084, 0.032329268753528595, 0.033915918320417404, 0.03550256788730621, 0.037089213728904724, 0.038675859570503235, 0.040262509137392044, 0.04184915870428085, 0.043435804545879364, 0.045022450387477875, 0.046609099954366684, 0.04819574952125549, 0.049782395362854004]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 6.0, 7.0, 20.0, 30.0, 26.0, 37.0, 76.0, 96.0, 144.0, 251.0, 458.0, 1097.0, 7143.0, 1020429.0, 15718.0, 1636.0, 584.0, 280.0, 162.0, 86.0, 71.0, 38.0, 40.0, 17.0, 17.0, 11.0, 13.0, 12.0, 3.0, 1.0, 7.0, 7.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.21484375, -4.093109130859375, -3.97137451171875, -3.849639892578125, -3.7279052734375, -3.606170654296875, -3.48443603515625, -3.362701416015625, -3.240966796875, -3.119232177734375, -2.99749755859375, -2.875762939453125, -2.7540283203125, -2.632293701171875, -2.51055908203125, -2.388824462890625, -2.26708984375, -2.145355224609375, -2.02362060546875, -1.901885986328125, -1.7801513671875, -1.658416748046875, -1.53668212890625, -1.414947509765625, -1.293212890625, -1.171478271484375, -1.04974365234375, -0.928009033203125, -0.8062744140625, -0.684539794921875, -0.56280517578125, -0.441070556640625, -0.3193359375, -0.197601318359375, -0.07586669921875, 0.045867919921875, 0.1676025390625, 0.289337158203125, 0.41107177734375, 0.532806396484375, 0.654541015625, 0.776275634765625, 0.89801025390625, 1.019744873046875, 1.1414794921875, 1.263214111328125, 1.38494873046875, 1.506683349609375, 1.62841796875, 1.750152587890625, 1.87188720703125, 1.993621826171875, 2.1153564453125, 2.237091064453125, 2.35882568359375, 2.480560302734375, 2.602294921875, 2.724029541015625, 2.84576416015625, 2.967498779296875, 3.0892333984375, 3.210968017578125, 3.33270263671875, 3.454437255859375, 3.576171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 56.0, 203.0, 589.0, 101.0, 29.0, 11.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0897216796875, -0.08711051940917969, -0.08449935913085938, -0.08188819885253906, -0.07927703857421875, -0.07666587829589844, -0.07405471801757812, -0.07144355773925781, -0.0688323974609375, -0.06622123718261719, -0.06361007690429688, -0.06099891662597656, -0.05838775634765625, -0.05577659606933594, -0.053165435791015625, -0.05055427551269531, -0.047943115234375, -0.04533195495605469, -0.042720794677734375, -0.04010963439941406, -0.03749847412109375, -0.03488731384277344, -0.032276153564453125, -0.029664993286132812, -0.0270538330078125, -0.024442672729492188, -0.021831512451171875, -0.019220352172851562, -0.01660919189453125, -0.013998031616210938, -0.011386871337890625, -0.008775711059570312, -0.00616455078125, -0.0035533905029296875, -0.000942230224609375, 0.0016689300537109375, 0.00428009033203125, 0.0068912506103515625, 0.009502410888671875, 0.012113571166992188, 0.0147247314453125, 0.017335891723632812, 0.019947052001953125, 0.022558212280273438, 0.02516937255859375, 0.027780532836914062, 0.030391693115234375, 0.03300285339355469, 0.035614013671875, 0.03822517395019531, 0.040836334228515625, 0.04344749450683594, 0.04605865478515625, 0.04866981506347656, 0.051280975341796875, 0.05389213562011719, 0.0565032958984375, 0.05911445617675781, 0.061725616455078125, 0.06433677673339844, 0.06694793701171875, 0.06955909729003906, 0.07217025756835938, 0.07478141784667969, 0.077392578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 8.0, 4.0, 3.0, 8.0, 13.0, 17.0, 17.0, 21.0, 44.0, 77.0, 103.0, 156.0, 258.0, 567.0, 987.0, 1779.0, 3790.0, 8231.0, 19052.0, 49265.0, 178620.0, 589486.0, 127358.0, 39589.0, 15393.0, 6871.0, 3307.0, 1572.0, 836.0, 432.0, 261.0, 151.0, 85.0, 54.0, 39.0, 31.0, 14.0, 19.0, 11.0, 12.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09325122833251953, -0.09037208557128906, -0.0874929428100586, -0.08461380004882812, -0.08173465728759766, -0.07885551452636719, -0.07597637176513672, -0.07309722900390625, -0.07021808624267578, -0.06733894348144531, -0.06445980072021484, -0.061580657958984375, -0.058701515197753906, -0.05582237243652344, -0.05294322967529297, -0.0500640869140625, -0.04718494415283203, -0.04430580139160156, -0.041426658630371094, -0.038547515869140625, -0.035668373107910156, -0.03278923034667969, -0.02991008758544922, -0.02703094482421875, -0.02415180206298828, -0.021272659301757812, -0.018393516540527344, -0.015514373779296875, -0.012635231018066406, -0.009756088256835938, -0.006876945495605469, -0.003997802734375, -0.0011186599731445312, 0.0017604827880859375, 0.004639625549316406, 0.007518768310546875, 0.010397911071777344, 0.013277053833007812, 0.01615619659423828, 0.01903533935546875, 0.02191448211669922, 0.024793624877929688, 0.027672767639160156, 0.030551910400390625, 0.033431053161621094, 0.03631019592285156, 0.03918933868408203, 0.0420684814453125, 0.04494762420654297, 0.04782676696777344, 0.050705909729003906, 0.053585052490234375, 0.056464195251464844, 0.05934333801269531, 0.06222248077392578, 0.06510162353515625, 0.06798076629638672, 0.07085990905761719, 0.07373905181884766, 0.07661819458007812, 0.0794973373413086, 0.08237648010253906, 0.08525562286376953, 0.088134765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 8.0, 10.0, 24.0, 22.0, 21.0, 31.0, 24.0, 29.0, 36.0, 31.0, 42.0, 42.0, 52.0, 37.0, 43.0, 55.0, 49.0, 46.0, 37.0, 43.0, 41.0, 38.0, 33.0, 24.0, 26.0, 32.0, 14.0, 16.0, 6.0, 8.0, 12.0, 6.0, 7.0, 5.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04718017578125, -0.0456395149230957, -0.044098854064941406, -0.04255819320678711, -0.04101753234863281, -0.039476871490478516, -0.03793621063232422, -0.03639554977416992, -0.034854888916015625, -0.03331422805786133, -0.03177356719970703, -0.030232906341552734, -0.028692245483398438, -0.02715158462524414, -0.025610923767089844, -0.024070262908935547, -0.02252960205078125, -0.020988941192626953, -0.019448280334472656, -0.01790761947631836, -0.016366958618164062, -0.014826297760009766, -0.013285636901855469, -0.011744976043701172, -0.010204315185546875, -0.008663654327392578, -0.007122993469238281, -0.005582332611083984, -0.0040416717529296875, -0.0025010108947753906, -0.0009603500366210938, 0.0005803108215332031, 0.0021209716796875, 0.003661632537841797, 0.005202293395996094, 0.006742954254150391, 0.008283615112304688, 0.009824275970458984, 0.011364936828613281, 0.012905597686767578, 0.014446258544921875, 0.015986919403076172, 0.01752758026123047, 0.019068241119384766, 0.020608901977539062, 0.02214956283569336, 0.023690223693847656, 0.025230884552001953, 0.02677154541015625, 0.028312206268310547, 0.029852867126464844, 0.03139352798461914, 0.03293418884277344, 0.034474849700927734, 0.03601551055908203, 0.03755617141723633, 0.039096832275390625, 0.04063749313354492, 0.04217815399169922, 0.043718814849853516, 0.04525947570800781, 0.04680013656616211, 0.048340797424316406, 0.0498814582824707, 0.051422119140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 7.0, 13.0, 16.0, 28.0, 59.0, 117.0, 224.0, 538.0, 1460.0, 5541.0, 38235.0, 881458.0, 107268.0, 9936.0, 2226.0, 792.0, 303.0, 152.0, 73.0, 45.0, 24.0, 16.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0198211669921875, -0.01912999153137207, -0.01843881607055664, -0.01774764060974121, -0.01705646514892578, -0.01636528968811035, -0.015674114227294922, -0.014982938766479492, -0.014291763305664062, -0.013600587844848633, -0.012909412384033203, -0.012218236923217773, -0.011527061462402344, -0.010835886001586914, -0.010144710540771484, -0.009453535079956055, -0.008762359619140625, -0.008071184158325195, -0.007380008697509766, -0.006688833236694336, -0.005997657775878906, -0.0053064823150634766, -0.004615306854248047, -0.003924131393432617, -0.0032329559326171875, -0.002541780471801758, -0.0018506050109863281, -0.0011594295501708984, -0.00046825408935546875, 0.00022292137145996094, 0.0009140968322753906, 0.0016052722930908203, 0.00229644775390625, 0.0029876232147216797, 0.0036787986755371094, 0.004369974136352539, 0.005061149597167969, 0.0057523250579833984, 0.006443500518798828, 0.007134675979614258, 0.007825851440429688, 0.008517026901245117, 0.009208202362060547, 0.009899377822875977, 0.010590553283691406, 0.011281728744506836, 0.011972904205322266, 0.012664079666137695, 0.013355255126953125, 0.014046430587768555, 0.014737606048583984, 0.015428781509399414, 0.016119956970214844, 0.016811132431030273, 0.017502307891845703, 0.018193483352661133, 0.018884658813476562, 0.019575834274291992, 0.020267009735107422, 0.02095818519592285, 0.02164936065673828, 0.02234053611755371, 0.02303171157836914, 0.02372288703918457, 0.0244140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 17.0, 17.0, 41.0, 77.0, 174.0, 283.0, 190.0, 98.0, 47.0, 24.0, 6.0, 3.0, 0.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-05, -7.27195292711258e-05, -6.735697388648987e-05, -6.199441850185394e-05, -5.663186311721802e-05, -5.126930773258209e-05, -4.590675234794617e-05, -4.054419696331024e-05, -3.5181641578674316e-05, -2.981908619403839e-05, -2.4456530809402466e-05, -1.909397542476654e-05, -1.3731420040130615e-05, -8.36886465549469e-06, -3.0063092708587646e-06, 2.3562461137771606e-06, 7.718801498413086e-06, 1.3081356883049011e-05, 1.8443912267684937e-05, 2.3806467652320862e-05, 2.9169023036956787e-05, 3.453157842159271e-05, 3.989413380622864e-05, 4.525668919086456e-05, 5.061924457550049e-05, 5.5981799960136414e-05, 6.134435534477234e-05, 6.670691072940826e-05, 7.206946611404419e-05, 7.743202149868011e-05, 8.279457688331604e-05, 8.815713226795197e-05, 9.351968765258789e-05, 9.888224303722382e-05, 0.00010424479842185974, 0.00010960735380649567, 0.00011496990919113159, 0.00012033246457576752, 0.00012569501996040344, 0.00013105757534503937, 0.0001364201307296753, 0.00014178268611431122, 0.00014714524149894714, 0.00015250779688358307, 0.000157870352268219, 0.00016323290765285492, 0.00016859546303749084, 0.00017395801842212677, 0.0001793205738067627, 0.00018468312919139862, 0.00019004568457603455, 0.00019540823996067047, 0.0002007707953453064, 0.00020613335072994232, 0.00021149590611457825, 0.00021685846149921417, 0.0002222210168838501, 0.00022758357226848602, 0.00023294612765312195, 0.00023830868303775787, 0.0002436712384223938, 0.0002490337938070297, 0.00025439634919166565, 0.0002597589045763016, 0.0002651214599609375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 13.0, 11.0, 15.0, 24.0, 32.0, 48.0, 78.0, 198.0, 423.0, 994.0, 2920.0, 11055.0, 105368.0, 884654.0, 33311.0, 6210.0, 1903.0, 664.0, 283.0, 127.0, 73.0, 41.0, 26.0, 22.0, 16.0, 16.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0195465087890625, -0.018901348114013672, -0.018256187438964844, -0.017611026763916016, -0.016965866088867188, -0.01632070541381836, -0.01567554473876953, -0.015030384063720703, -0.014385223388671875, -0.013740062713623047, -0.013094902038574219, -0.01244974136352539, -0.011804580688476562, -0.011159420013427734, -0.010514259338378906, -0.009869098663330078, -0.00922393798828125, -0.008578777313232422, -0.007933616638183594, -0.007288455963134766, -0.0066432952880859375, -0.005998134613037109, -0.005352973937988281, -0.004707813262939453, -0.004062652587890625, -0.003417491912841797, -0.0027723312377929688, -0.0021271705627441406, -0.0014820098876953125, -0.0008368492126464844, -0.00019168853759765625, 0.0004534721374511719, 0.0010986328125, 0.0017437934875488281, 0.0023889541625976562, 0.0030341148376464844, 0.0036792755126953125, 0.004324436187744141, 0.004969596862792969, 0.005614757537841797, 0.006259918212890625, 0.006905078887939453, 0.007550239562988281, 0.00819540023803711, 0.008840560913085938, 0.009485721588134766, 0.010130882263183594, 0.010776042938232422, 0.01142120361328125, 0.012066364288330078, 0.012711524963378906, 0.013356685638427734, 0.014001846313476562, 0.01464700698852539, 0.015292167663574219, 0.015937328338623047, 0.016582489013671875, 0.017227649688720703, 0.01787281036376953, 0.01851797103881836, 0.019163131713867188, 0.019808292388916016, 0.020453453063964844, 0.021098613739013672, 0.0217437744140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 8.0, 6.0, 9.0, 8.0, 17.0, 21.0, 24.0, 30.0, 68.0, 91.0, 173.0, 210.0, 101.0, 62.0, 54.0, 27.0, 24.0, 12.0, 7.0, 5.0, 5.0, 3.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.008989214897155762, -0.008632421493530273, -0.008275628089904785, -0.007918834686279297, -0.007562041282653809, -0.00720524787902832, -0.006848454475402832, -0.006491661071777344, -0.0061348676681518555, -0.005778074264526367, -0.005421280860900879, -0.005064487457275391, -0.004707694053649902, -0.004350900650024414, -0.003994107246398926, -0.0036373138427734375, -0.0032805204391479492, -0.002923727035522461, -0.0025669336318969727, -0.0022101402282714844, -0.001853346824645996, -0.0014965534210205078, -0.0011397600173950195, -0.0007829666137695312, -0.00042617321014404297, -6.937980651855469e-05, 0.0002874135971069336, 0.0006442070007324219, 0.0010010004043579102, 0.0013577938079833984, 0.0017145872116088867, 0.002071380615234375, 0.0024281740188598633, 0.0027849674224853516, 0.00314176082611084, 0.003498554229736328, 0.0038553476333618164, 0.004212141036987305, 0.004568934440612793, 0.004925727844238281, 0.0052825212478637695, 0.005639314651489258, 0.005996108055114746, 0.006352901458740234, 0.006709694862365723, 0.007066488265991211, 0.007423281669616699, 0.0077800750732421875, 0.008136868476867676, 0.008493661880493164, 0.008850455284118652, 0.00920724868774414, 0.009564042091369629, 0.009920835494995117, 0.010277628898620605, 0.010634422302246094, 0.010991215705871582, 0.01134800910949707, 0.011704802513122559, 0.012061595916748047, 0.012418389320373535, 0.012775182723999023, 0.013131976127624512, 0.01348876953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 10.0, 17.0, 31.0, 87.0, 304.0, 266.0, 130.0, 50.0, 42.0, 19.0, 20.0, 4.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4709995985031128, -0.453492671251297, -0.4359857439994812, -0.4184788465499878, -0.400971919298172, -0.3834649920463562, -0.3659580647945404, -0.3484511375427246, -0.3309442400932312, -0.3134373128414154, -0.2959303855895996, -0.2784234881401062, -0.2609165608882904, -0.2434096336364746, -0.2259027063846588, -0.20839577913284302, -0.19088885188102722, -0.17338192462921143, -0.15587501227855682, -0.13836808502674103, -0.12086116522550583, -0.10335424542427063, -0.08584731817245483, -0.06834039837121964, -0.050833478569984436, -0.03332655876874924, -0.01581963524222374, 0.0016872882843017578, 0.019194208085536957, 0.036701127886772156, 0.05420805513858795, 0.07171497493982315, 0.08922189474105835, 0.10672881454229355, 0.12423573434352875, 0.14174266159534454, 0.15924957394599915, 0.17675650119781494, 0.19426342844963074, 0.21177035570144653, 0.22927726805210114, 0.24678419530391693, 0.26429110765457153, 0.28179803490638733, 0.2993049621582031, 0.31681185960769653, 0.3343188166618347, 0.3518257141113281, 0.3693326413631439, 0.3868395686149597, 0.4043464958667755, 0.4218534231185913, 0.4393603205680847, 0.4568672478199005, 0.4743741750717163, 0.4918811023235321, 0.5093880295753479, 0.5268949270248413, 0.5444018840789795, 0.5619087815284729, 0.5794157385826111, 0.5969226360321045, 0.6144295930862427, 0.6319364905357361, 0.6494433879852295]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 20.0, 42.0, 62.0, 83.0, 120.0, 108.0, 133.0, 127.0, 84.0, 78.0, 58.0, 28.0, 20.0, 11.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5549145936965942, -0.535903811454773, -0.5168930888175964, -0.49788230657577515, -0.47887152433395386, -0.45986077189445496, -0.44085001945495605, -0.42183923721313477, -0.40282848477363586, -0.38381773233413696, -0.3648069500923157, -0.3457961976528168, -0.32678544521331787, -0.3077746629714966, -0.2887639105319977, -0.2697531580924988, -0.2507423758506775, -0.2317316085100174, -0.2127208411693573, -0.1937100887298584, -0.1746993213891983, -0.1556885540485382, -0.1366778016090393, -0.11766703426837921, -0.09865626692771912, -0.07964549958705902, -0.06063473969697952, -0.041623976081609726, -0.02261321246623993, -0.003602445125579834, 0.015408314764499664, 0.03441907465457916, 0.05342990159988403, 0.07244066894054413, 0.09145142883062363, 0.11046218872070312, 0.12947295606136322, 0.14848372340202332, 0.16749447584152222, 0.1865052431821823, 0.2055160105228424, 0.2245267778635025, 0.2435375452041626, 0.2625482976436615, 0.2815590500831604, 0.3005698323249817, 0.3195805847644806, 0.3385913372039795, 0.3576021194458008, 0.3766128718852997, 0.39562365412712097, 0.4146344065666199, 0.43364518880844116, 0.45265594124794006, 0.47166669368743896, 0.49067747592926025, 0.5096882581710815, 0.5286990404129028, 0.5477097630500793, 0.5667205452919006, 0.5857313275337219, 0.6047420501708984, 0.6237528324127197, 0.642763614654541, 0.6617743372917175]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 11.0, 14.0, 9.0, 19.0, 25.0, 30.0, 47.0, 54.0, 86.0, 102.0, 207.0, 592.0, 4910.0, 4169072.0, 17017.0, 1136.0, 328.0, 152.0, 118.0, 89.0, 67.0, 41.0, 37.0, 29.0, 18.0, 21.0, 10.0, 11.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4951171875, -0.48040771484375, -0.4656982421875, -0.45098876953125, -0.436279296875, -0.42156982421875, -0.4068603515625, -0.39215087890625, -0.37744140625, -0.36273193359375, -0.3480224609375, -0.33331298828125, -0.318603515625, -0.30389404296875, -0.2891845703125, -0.27447509765625, -0.259765625, -0.24505615234375, -0.2303466796875, -0.21563720703125, -0.200927734375, -0.18621826171875, -0.1715087890625, -0.15679931640625, -0.14208984375, -0.12738037109375, -0.1126708984375, -0.09796142578125, -0.083251953125, -0.06854248046875, -0.0538330078125, -0.03912353515625, -0.0244140625, -0.00970458984375, 0.0050048828125, 0.01971435546875, 0.034423828125, 0.04913330078125, 0.0638427734375, 0.07855224609375, 0.09326171875, 0.10797119140625, 0.1226806640625, 0.13739013671875, 0.152099609375, 0.16680908203125, 0.1815185546875, 0.19622802734375, 0.2109375, 0.22564697265625, 0.2403564453125, 0.25506591796875, 0.269775390625, 0.28448486328125, 0.2991943359375, 0.31390380859375, 0.32861328125, 0.34332275390625, 0.3580322265625, 0.37274169921875, 0.387451171875, 0.40216064453125, 0.4168701171875, 0.43157958984375, 0.4462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 18.0, 94.0, 396.0, 395.0, 63.0, 22.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0830078125, -0.0805673599243164, -0.07812690734863281, -0.07568645477294922, -0.07324600219726562, -0.07080554962158203, -0.06836509704589844, -0.06592464447021484, -0.06348419189453125, -0.061043739318847656, -0.05860328674316406, -0.05616283416748047, -0.053722381591796875, -0.05128192901611328, -0.04884147644042969, -0.046401023864746094, -0.0439605712890625, -0.041520118713378906, -0.03907966613769531, -0.03663921356201172, -0.034198760986328125, -0.03175830841064453, -0.029317855834960938, -0.026877403259277344, -0.02443695068359375, -0.021996498107910156, -0.019556045532226562, -0.01711559295654297, -0.014675140380859375, -0.012234687805175781, -0.009794235229492188, -0.007353782653808594, -0.004913330078125, -0.0024728775024414062, -3.24249267578125e-05, 0.0024080276489257812, 0.004848480224609375, 0.007288932800292969, 0.009729385375976562, 0.012169837951660156, 0.01461029052734375, 0.017050743103027344, 0.019491195678710938, 0.02193164825439453, 0.024372100830078125, 0.02681255340576172, 0.029253005981445312, 0.031693458557128906, 0.0341339111328125, 0.036574363708496094, 0.03901481628417969, 0.04145526885986328, 0.043895721435546875, 0.04633617401123047, 0.04877662658691406, 0.051217079162597656, 0.05365753173828125, 0.056097984313964844, 0.05853843688964844, 0.06097888946533203, 0.06341934204101562, 0.06585979461669922, 0.06830024719238281, 0.0707406997680664, 0.07318115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 24.0, 34.0, 56.0, 137.0, 424.0, 2334.0, 114974.0, 4069200.0, 6006.0, 705.0, 210.0, 79.0, 38.0, 26.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28076171875, -0.2739429473876953, -0.2671241760253906, -0.26030540466308594, -0.25348663330078125, -0.24666786193847656, -0.23984909057617188, -0.2330303192138672, -0.2262115478515625, -0.2193927764892578, -0.21257400512695312, -0.20575523376464844, -0.19893646240234375, -0.19211769104003906, -0.18529891967773438, -0.1784801483154297, -0.171661376953125, -0.1648426055908203, -0.15802383422851562, -0.15120506286621094, -0.14438629150390625, -0.13756752014160156, -0.13074874877929688, -0.12392997741699219, -0.1171112060546875, -0.11029243469238281, -0.10347366333007812, -0.09665489196777344, -0.08983612060546875, -0.08301734924316406, -0.07619857788085938, -0.06937980651855469, -0.06256103515625, -0.05574226379394531, -0.048923492431640625, -0.04210472106933594, -0.03528594970703125, -0.028467178344726562, -0.021648406982421875, -0.014829635620117188, -0.0080108642578125, -0.0011920928955078125, 0.005626678466796875, 0.012445449829101562, 0.01926422119140625, 0.026082992553710938, 0.032901763916015625, 0.03972053527832031, 0.046539306640625, 0.05335807800292969, 0.060176849365234375, 0.06699562072753906, 0.07381439208984375, 0.08063316345214844, 0.08745193481445312, 0.09427070617675781, 0.1010894775390625, 0.10790824890136719, 0.11472702026367188, 0.12154579162597656, 0.12836456298828125, 0.13518333435058594, 0.14200210571289062, 0.1488208770751953, 0.1556396484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 9.0, 9.0, 20.0, 31.0, 50.0, 111.0, 260.0, 1941.0, 1222.0, 236.0, 89.0, 41.0, 26.0, 13.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09160423278808594, -0.08951950073242188, -0.08743476867675781, -0.08535003662109375, -0.08326530456542969, -0.08118057250976562, -0.07909584045410156, -0.0770111083984375, -0.07492637634277344, -0.07284164428710938, -0.07075691223144531, -0.06867218017578125, -0.06658744812011719, -0.06450271606445312, -0.06241798400878906, -0.060333251953125, -0.05824851989746094, -0.056163787841796875, -0.05407905578613281, -0.05199432373046875, -0.04990959167480469, -0.047824859619140625, -0.04574012756347656, -0.0436553955078125, -0.04157066345214844, -0.039485931396484375, -0.03740119934082031, -0.03531646728515625, -0.03323173522949219, -0.031147003173828125, -0.029062271118164062, -0.0269775390625, -0.024892807006835938, -0.022808074951171875, -0.020723342895507812, -0.01863861083984375, -0.016553878784179688, -0.014469146728515625, -0.012384414672851562, -0.0102996826171875, -0.008214950561523438, -0.006130218505859375, -0.0040454864501953125, -0.00196075439453125, 0.0001239776611328125, 0.002208709716796875, 0.0042934417724609375, 0.006378173828125, 0.008462905883789062, 0.010547637939453125, 0.012632369995117188, 0.01471710205078125, 0.016801834106445312, 0.018886566162109375, 0.020971298217773438, 0.0230560302734375, 0.025140762329101562, 0.027225494384765625, 0.029310226440429688, 0.03139495849609375, 0.03347969055175781, 0.035564422607421875, 0.03764915466308594, 0.03973388671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 43.0, 657.0, 303.0, 8.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47507214546203613, -0.4534001350402832, -0.4317281246185303, -0.41005611419677734, -0.3883841037750244, -0.3667120933532715, -0.34504005312919617, -0.32336804270744324, -0.3016960322856903, -0.2800240218639374, -0.25835201144218445, -0.23667998611927032, -0.2150079756975174, -0.19333596527576447, -0.17166393995285034, -0.1499919295310974, -0.12831991910934448, -0.10664790868759155, -0.08497589081525803, -0.0633038729429245, -0.04163186252117157, -0.01995985209941864, 0.0017121732234954834, 0.023384183645248413, 0.04505619406700134, 0.06672820448875427, 0.0884002223610878, 0.11007224023342133, 0.13174425065517426, 0.15341626107692719, 0.1750882863998413, 0.19676029682159424, 0.21843230724334717, 0.2401043176651001, 0.261776328086853, 0.28344833850860596, 0.3051203489303589, 0.3267923593521118, 0.34846439957618713, 0.37013640999794006, 0.391808420419693, 0.4134804308414459, 0.43515244126319885, 0.45682448148727417, 0.4784964919090271, 0.50016850233078, 0.521840512752533, 0.5435125231742859, 0.5651845335960388, 0.5868565440177917, 0.6085285544395447, 0.6302005648612976, 0.6518725752830505, 0.6735445857048035, 0.6952166557312012, 0.7168886661529541, 0.738560676574707, 0.76023268699646, 0.7819046974182129, 0.8035767078399658, 0.8252487182617188, 0.8469207286834717, 0.8685927391052246, 0.8902647495269775, 0.9119367599487305]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 13.0, 20.0, 21.0, 22.0, 18.0, 19.0, 32.0, 38.0, 26.0, 30.0, 33.0, 46.0, 25.0, 25.0, 34.0, 37.0, 43.0, 42.0, 41.0, 33.0, 45.0, 38.0, 40.0, 33.0, 23.0, 27.0, 19.0, 16.0, 17.0, 16.0, 17.0, 10.0, 15.0, 13.0, 6.0, 6.0, 5.0, 9.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06899738311767578, -0.06689704954624176, -0.06479671597480774, -0.06269637495279312, -0.0605960413813591, -0.05849570780992508, -0.05639537051320076, -0.05429503321647644, -0.05219469964504242, -0.0500943660736084, -0.04799402877688408, -0.04589369148015976, -0.04379335790872574, -0.04169302433729172, -0.0395926870405674, -0.03749234974384308, -0.03539201617240906, -0.03329168260097504, -0.031191345304250717, -0.029091009870171547, -0.026990674436092377, -0.024890339002013206, -0.022790003567934036, -0.020689668133854866, -0.018589332699775696, -0.016488997265696526, -0.014388661831617355, -0.012288326397538185, -0.010187990963459015, -0.008087655529379845, -0.0059873200953006744, -0.003886984661221504, -0.001786649227142334, 0.00031368620693683624, 0.0024140216410160065, 0.004514357075095177, 0.006614692509174347, 0.008715027943253517, 0.010815363377332687, 0.012915698811411858, 0.015016034245491028, 0.017116369679570198, 0.01921670511364937, 0.02131704054772854, 0.02341737598180771, 0.02551771141588688, 0.02761804684996605, 0.02971838228404522, 0.03181871771812439, 0.03391905128955841, 0.03601938858628273, 0.03811972588300705, 0.04022005945444107, 0.04232039302587509, 0.04442073032259941, 0.04652106761932373, 0.04862140119075775, 0.05072173476219177, 0.05282207205891609, 0.05492240935564041, 0.05702274292707443, 0.05912307649850845, 0.06122341379523277, 0.06332375109195709, 0.06542408466339111]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 7.0, 5.0, 9.0, 7.0, 13.0, 14.0, 18.0, 27.0, 46.0, 41.0, 51.0, 82.0, 106.0, 131.0, 171.0, 270.0, 358.0, 517.0, 967.0, 3441.0, 52973.0, 964744.0, 19763.0, 2274.0, 836.0, 507.0, 293.0, 235.0, 138.0, 126.0, 65.0, 88.0, 52.0, 40.0, 29.0, 28.0, 15.0, 18.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1611328125, -0.15599632263183594, -0.15085983276367188, -0.1457233428955078, -0.14058685302734375, -0.1354503631591797, -0.13031387329101562, -0.12517738342285156, -0.1200408935546875, -0.11490440368652344, -0.10976791381835938, -0.10463142395019531, -0.09949493408203125, -0.09435844421386719, -0.08922195434570312, -0.08408546447753906, -0.078948974609375, -0.07381248474121094, -0.06867599487304688, -0.06353950500488281, -0.05840301513671875, -0.05326652526855469, -0.048130035400390625, -0.04299354553222656, -0.0378570556640625, -0.03272056579589844, -0.027584075927734375, -0.022447586059570312, -0.01731109619140625, -0.012174606323242188, -0.007038116455078125, -0.0019016265869140625, 0.00323486328125, 0.008371353149414062, 0.013507843017578125, 0.018644332885742188, 0.02378082275390625, 0.028917312622070312, 0.034053802490234375, 0.03919029235839844, 0.0443267822265625, 0.04946327209472656, 0.054599761962890625, 0.05973625183105469, 0.06487274169921875, 0.07000923156738281, 0.07514572143554688, 0.08028221130371094, 0.085418701171875, 0.09055519104003906, 0.09569168090820312, 0.10082817077636719, 0.10596466064453125, 0.11110115051269531, 0.11623764038085938, 0.12137413024902344, 0.1265106201171875, 0.13164710998535156, 0.13678359985351562, 0.1419200897216797, 0.14705657958984375, 0.1521930694580078, 0.15732955932617188, 0.16246604919433594, 0.1676025390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 30.0, 129.0, 493.0, 273.0, 48.0, 16.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08514404296875, -0.08269500732421875, -0.0802459716796875, -0.07779693603515625, -0.075347900390625, -0.07289886474609375, -0.0704498291015625, -0.06800079345703125, -0.0655517578125, -0.06310272216796875, -0.0606536865234375, -0.05820465087890625, -0.055755615234375, -0.05330657958984375, -0.0508575439453125, -0.04840850830078125, -0.04595947265625, -0.04351043701171875, -0.0410614013671875, -0.03861236572265625, -0.036163330078125, -0.03371429443359375, -0.0312652587890625, -0.02881622314453125, -0.0263671875, -0.02391815185546875, -0.0214691162109375, -0.01902008056640625, -0.016571044921875, -0.01412200927734375, -0.0116729736328125, -0.00922393798828125, -0.00677490234375, -0.00432586669921875, -0.0018768310546875, 0.00057220458984375, 0.003021240234375, 0.00547027587890625, 0.0079193115234375, 0.01036834716796875, 0.0128173828125, 0.01526641845703125, 0.0177154541015625, 0.02016448974609375, 0.022613525390625, 0.02506256103515625, 0.0275115966796875, 0.02996063232421875, 0.03240966796875, 0.03485870361328125, 0.0373077392578125, 0.03975677490234375, 0.042205810546875, 0.04465484619140625, 0.0471038818359375, 0.04955291748046875, 0.052001953125, 0.05445098876953125, 0.0569000244140625, 0.05934906005859375, 0.061798095703125, 0.06424713134765625, 0.0666961669921875, 0.06914520263671875, 0.07159423828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 7.0, 8.0, 11.0, 16.0, 16.0, 16.0, 21.0, 32.0, 26.0, 41.0, 43.0, 56.0, 91.0, 128.0, 265.0, 651.0, 3801.0, 866813.0, 173457.0, 1763.0, 519.0, 216.0, 129.0, 77.0, 64.0, 59.0, 38.0, 48.0, 20.0, 20.0, 25.0, 16.0, 11.0, 8.0, 9.0, 4.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.24755859375, -0.2402477264404297, -0.23293685913085938, -0.22562599182128906, -0.21831512451171875, -0.21100425720214844, -0.20369338989257812, -0.1963825225830078, -0.1890716552734375, -0.1817607879638672, -0.17444992065429688, -0.16713905334472656, -0.15982818603515625, -0.15251731872558594, -0.14520645141601562, -0.1378955841064453, -0.130584716796875, -0.12327384948730469, -0.11596298217773438, -0.10865211486816406, -0.10134124755859375, -0.09403038024902344, -0.08671951293945312, -0.07940864562988281, -0.0720977783203125, -0.06478691101074219, -0.057476043701171875, -0.05016517639160156, -0.04285430908203125, -0.03554344177246094, -0.028232574462890625, -0.020921707153320312, -0.01361083984375, -0.0062999725341796875, 0.001010894775390625, 0.008321762084960938, 0.01563262939453125, 0.022943496704101562, 0.030254364013671875, 0.03756523132324219, 0.0448760986328125, 0.05218696594238281, 0.059497833251953125, 0.06680870056152344, 0.07411956787109375, 0.08143043518066406, 0.08874130249023438, 0.09605216979980469, 0.103363037109375, 0.11067390441894531, 0.11798477172851562, 0.12529563903808594, 0.13260650634765625, 0.13991737365722656, 0.14722824096679688, 0.1545391082763672, 0.1618499755859375, 0.1691608428955078, 0.17647171020507812, 0.18378257751464844, 0.19109344482421875, 0.19840431213378906, 0.20571517944335938, 0.2130260467529297, 0.2203369140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 13.0, 16.0, 14.0, 14.0, 26.0, 17.0, 21.0, 23.0, 34.0, 33.0, 36.0, 32.0, 40.0, 52.0, 51.0, 54.0, 42.0, 45.0, 57.0, 47.0, 44.0, 45.0, 31.0, 34.0, 27.0, 23.0, 22.0, 20.0, 13.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.040172576904296875, -0.03896331787109375, -0.037754058837890625, -0.0365447998046875, -0.035335540771484375, -0.03412628173828125, -0.032917022705078125, -0.031707763671875, -0.030498504638671875, -0.02928924560546875, -0.028079986572265625, -0.0268707275390625, -0.025661468505859375, -0.02445220947265625, -0.023242950439453125, -0.02203369140625, -0.020824432373046875, -0.01961517333984375, -0.018405914306640625, -0.0171966552734375, -0.015987396240234375, -0.01477813720703125, -0.013568878173828125, -0.012359619140625, -0.011150360107421875, -0.00994110107421875, -0.008731842041015625, -0.0075225830078125, -0.006313323974609375, -0.00510406494140625, -0.003894805908203125, -0.002685546875, -0.001476287841796875, -0.00026702880859375, 0.000942230224609375, 0.0021514892578125, 0.003360748291015625, 0.00457000732421875, 0.005779266357421875, 0.006988525390625, 0.008197784423828125, 0.00940704345703125, 0.010616302490234375, 0.0118255615234375, 0.013034820556640625, 0.01424407958984375, 0.015453338623046875, 0.01666259765625, 0.017871856689453125, 0.01908111572265625, 0.020290374755859375, 0.0214996337890625, 0.022708892822265625, 0.02391815185546875, 0.025127410888671875, 0.026336669921875, 0.027545928955078125, 0.02875518798828125, 0.029964447021484375, 0.0311737060546875, 0.032382965087890625, 0.03359222412109375, 0.034801483154296875, 0.0360107421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 8.0, 10.0, 20.0, 18.0, 27.0, 24.0, 43.0, 75.0, 123.0, 246.0, 488.0, 1234.0, 4017.0, 26051.0, 929898.0, 76278.0, 6837.0, 1821.0, 631.0, 287.0, 146.0, 86.0, 44.0, 23.0, 17.0, 13.0, 14.0, 11.0, 8.0, 4.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0382080078125, -0.03707313537597656, -0.035938262939453125, -0.03480339050292969, -0.03366851806640625, -0.03253364562988281, -0.031398773193359375, -0.030263900756835938, -0.0291290283203125, -0.027994155883789062, -0.026859283447265625, -0.025724411010742188, -0.02458953857421875, -0.023454666137695312, -0.022319793701171875, -0.021184921264648438, -0.020050048828125, -0.018915176391601562, -0.017780303955078125, -0.016645431518554688, -0.01551055908203125, -0.014375686645507812, -0.013240814208984375, -0.012105941772460938, -0.0109710693359375, -0.009836196899414062, -0.008701324462890625, -0.0075664520263671875, -0.00643157958984375, -0.0052967071533203125, -0.004161834716796875, -0.0030269622802734375, -0.00189208984375, -0.0007572174072265625, 0.000377655029296875, 0.0015125274658203125, 0.00264739990234375, 0.0037822723388671875, 0.004917144775390625, 0.0060520172119140625, 0.0071868896484375, 0.008321762084960938, 0.009456634521484375, 0.010591506958007812, 0.01172637939453125, 0.012861251831054688, 0.013996124267578125, 0.015130996704101562, 0.016265869140625, 0.017400741577148438, 0.018535614013671875, 0.019670486450195312, 0.02080535888671875, 0.021940231323242188, 0.023075103759765625, 0.024209976196289062, 0.0253448486328125, 0.026479721069335938, 0.027614593505859375, 0.028749465942382812, 0.02988433837890625, 0.031019210815429688, 0.032154083251953125, 0.03328895568847656, 0.034423828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 2.0, 1.0, 4.0, 10.0, 4.0, 4.0, 12.0, 10.0, 16.0, 17.0, 22.0, 23.0, 34.0, 50.0, 45.0, 73.0, 81.0, 106.0, 108.0, 74.0, 54.0, 43.0, 46.0, 35.0, 21.0, 20.0, 16.0, 10.0, 13.0, 11.0, 9.0, 10.0, 2.0, 4.0, 3.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.086992263793945e-05, -6.801262497901917e-05, -6.515532732009888e-05, -6.229802966117859e-05, -5.94407320022583e-05, -5.658343434333801e-05, -5.3726136684417725e-05, -5.0868839025497437e-05, -4.801154136657715e-05, -4.515424370765686e-05, -4.229694604873657e-05, -3.9439648389816284e-05, -3.6582350730895996e-05, -3.372505307197571e-05, -3.086775541305542e-05, -2.8010457754135132e-05, -2.5153160095214844e-05, -2.2295862436294556e-05, -1.9438564777374268e-05, -1.658126711845398e-05, -1.3723969459533691e-05, -1.0866671800613403e-05, -8.009374141693115e-06, -5.152076482772827e-06, -2.294778823852539e-06, 5.62518835067749e-07, 3.419816493988037e-06, 6.277114152908325e-06, 9.134411811828613e-06, 1.1991709470748901e-05, 1.484900712966919e-05, 1.7706304788589478e-05, 2.0563602447509766e-05, 2.3420900106430054e-05, 2.6278197765350342e-05, 2.913549542427063e-05, 3.199279308319092e-05, 3.4850090742111206e-05, 3.7707388401031494e-05, 4.056468605995178e-05, 4.342198371887207e-05, 4.627928137779236e-05, 4.9136579036712646e-05, 5.1993876695632935e-05, 5.485117435455322e-05, 5.770847201347351e-05, 6.05657696723938e-05, 6.342306733131409e-05, 6.628036499023438e-05, 6.913766264915466e-05, 7.199496030807495e-05, 7.485225796699524e-05, 7.770955562591553e-05, 8.056685328483582e-05, 8.34241509437561e-05, 8.628144860267639e-05, 8.913874626159668e-05, 9.199604392051697e-05, 9.485334157943726e-05, 9.771063923835754e-05, 0.00010056793689727783, 0.00010342523455619812, 0.00010628253221511841, 0.0001091398298740387, 0.00011199712753295898]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 1.0, 7.0, 5.0, 15.0, 14.0, 28.0, 39.0, 51.0, 65.0, 115.0, 548.0, 27765.0, 1016880.0, 2502.0, 226.0, 78.0, 45.0, 37.0, 27.0, 19.0, 25.0, 9.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04498291015625, -0.04363059997558594, -0.042278289794921875, -0.04092597961425781, -0.03957366943359375, -0.03822135925292969, -0.036869049072265625, -0.03551673889160156, -0.0341644287109375, -0.03281211853027344, -0.031459808349609375, -0.030107498168945312, -0.02875518798828125, -0.027402877807617188, -0.026050567626953125, -0.024698257446289062, -0.023345947265625, -0.021993637084960938, -0.020641326904296875, -0.019289016723632812, -0.01793670654296875, -0.016584396362304688, -0.015232086181640625, -0.013879776000976562, -0.0125274658203125, -0.011175155639648438, -0.009822845458984375, -0.008470535278320312, -0.00711822509765625, -0.0057659149169921875, -0.004413604736328125, -0.0030612945556640625, -0.001708984375, -0.0003566741943359375, 0.000995635986328125, 0.0023479461669921875, 0.00370025634765625, 0.0050525665283203125, 0.006404876708984375, 0.0077571868896484375, 0.0091094970703125, 0.010461807250976562, 0.011814117431640625, 0.013166427612304688, 0.01451873779296875, 0.015871047973632812, 0.017223358154296875, 0.018575668334960938, 0.019927978515625, 0.021280288696289062, 0.022632598876953125, 0.023984909057617188, 0.02533721923828125, 0.026689529418945312, 0.028041839599609375, 0.029394149780273438, 0.0307464599609375, 0.03209877014160156, 0.033451080322265625, 0.03480339050292969, 0.03615570068359375, 0.03750801086425781, 0.038860321044921875, 0.04021263122558594, 0.04156494140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 2.0, 6.0, 5.0, 13.0, 15.0, 24.0, 37.0, 51.0, 49.0, 56.0, 77.0, 107.0, 126.0, 96.0, 82.0, 55.0, 41.0, 35.0, 21.0, 21.0, 24.0, 7.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00722503662109375, -0.007008254528045654, -0.006791472434997559, -0.006574690341949463, -0.006357908248901367, -0.0061411261558532715, -0.005924344062805176, -0.00570756196975708, -0.005490779876708984, -0.005273997783660889, -0.005057215690612793, -0.004840433597564697, -0.0046236515045166016, -0.004406869411468506, -0.00419008731842041, -0.0039733052253723145, -0.0037565231323242188, -0.003539741039276123, -0.0033229589462280273, -0.0031061768531799316, -0.002889394760131836, -0.0026726126670837402, -0.0024558305740356445, -0.002239048480987549, -0.002022266387939453, -0.0018054842948913574, -0.0015887022018432617, -0.001371920108795166, -0.0011551380157470703, -0.0009383559226989746, -0.0007215738296508789, -0.0005047917366027832, -0.0002880096435546875, -7.12275505065918e-05, 0.0001455545425415039, 0.0003623366355895996, 0.0005791187286376953, 0.000795900821685791, 0.0010126829147338867, 0.0012294650077819824, 0.0014462471008300781, 0.0016630291938781738, 0.0018798112869262695, 0.0020965933799743652, 0.002313375473022461, 0.0025301575660705566, 0.0027469396591186523, 0.002963721752166748, 0.0031805038452148438, 0.0033972859382629395, 0.003614068031311035, 0.003830850124359131, 0.0040476322174072266, 0.004264414310455322, 0.004481196403503418, 0.004697978496551514, 0.004914760589599609, 0.005131542682647705, 0.005348324775695801, 0.0055651068687438965, 0.005781888961791992, 0.005998671054840088, 0.006215453147888184, 0.006432235240936279, 0.006649017333984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 45.0, 841.0, 106.0, 12.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0873236656188965, -1.0519155263900757, -1.0165073871612549, -0.9810993075370789, -0.9456911683082581, -0.9102830290794373, -0.8748749494552612, -0.8394668102264404, -0.8040586709976196, -0.7686505317687988, -0.733242392539978, -0.697834312915802, -0.6624261736869812, -0.6270180344581604, -0.5916099548339844, -0.5562018156051636, -0.5207936763763428, -0.485385537147522, -0.44997742772102356, -0.41456931829452515, -0.37916117906570435, -0.34375303983688354, -0.30834493041038513, -0.2729368209838867, -0.23752868175506592, -0.2021205574274063, -0.1667124330997467, -0.1313043087720871, -0.09589618444442749, -0.06048806011676788, -0.025079935789108276, 0.01032818853855133, 0.04573643207550049, 0.0811445564031601, 0.1165526807308197, 0.1519608050584793, 0.18736892938613892, 0.22277705371379852, 0.25818517804145813, 0.29359328746795654, 0.32900142669677734, 0.36440956592559814, 0.39981767535209656, 0.43522578477859497, 0.47063392400741577, 0.5060420632362366, 0.5414501428604126, 0.5768582820892334, 0.6122664213180542, 0.647674560546875, 0.6830826997756958, 0.7184907793998718, 0.7538989186286926, 0.7893070578575134, 0.8247151374816895, 0.8601232767105103, 0.895531415939331, 0.9309395551681519, 0.9663476943969727, 1.0017558336257935, 1.0371639728546143, 1.0725719928741455, 1.1079801321029663, 1.143388271331787, 1.178796410560608]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 12.0, 19.0, 23.0, 28.0, 35.0, 55.0, 81.0, 81.0, 104.0, 111.0, 96.0, 89.0, 85.0, 63.0, 51.0, 33.0, 10.0, 10.0, 10.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27862876653671265, -0.2688198685646057, -0.25901100039482117, -0.24920211732387543, -0.2393932342529297, -0.22958433628082275, -0.21977545320987701, -0.20996657013893127, -0.20015768706798553, -0.1903488039970398, -0.18053992092609406, -0.17073103785514832, -0.16092213988304138, -0.15111327171325684, -0.1413043737411499, -0.13149549067020416, -0.12168660759925842, -0.11187772452831268, -0.10206884145736694, -0.0922599509358406, -0.08245106786489487, -0.07264218479394913, -0.06283329427242279, -0.05302441120147705, -0.04321552813053131, -0.03340664505958557, -0.023597758263349533, -0.013788873329758644, -0.003979988396167755, 0.005828894674777985, 0.015637781471014023, 0.02544666826725006, 0.0352555513381958, 0.04506443440914154, 0.05487332120537758, 0.06468220800161362, 0.07449109107255936, 0.0842999741435051, 0.09410886466503143, 0.10391774773597717, 0.11372663080692291, 0.12353551387786865, 0.1333443969488144, 0.14315328001976013, 0.15296217799186707, 0.1627710461616516, 0.17257994413375854, 0.18238882720470428, 0.19219771027565002, 0.20200659334659576, 0.2118154764175415, 0.22162435948848724, 0.23143324255943298, 0.24124214053153992, 0.25105100870132446, 0.2608599066734314, 0.27066880464553833, 0.28047770261764526, 0.2902865707874298, 0.30009546875953674, 0.3099043369293213, 0.3197132349014282, 0.32952210307121277, 0.3393310010433197, 0.34913986921310425]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 7.0, 9.0, 22.0, 38.0, 105.0, 460.0, 92433.0, 4100118.0, 774.0, 181.0, 68.0, 28.0, 14.0, 8.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.43389892578125, -0.4207763671875, -0.40765380859375, -0.39453125, -0.38140869140625, -0.3682861328125, -0.35516357421875, -0.342041015625, -0.32891845703125, -0.3157958984375, -0.30267333984375, -0.28955078125, -0.27642822265625, -0.2633056640625, -0.25018310546875, -0.237060546875, -0.22393798828125, -0.2108154296875, -0.19769287109375, -0.1845703125, -0.17144775390625, -0.1583251953125, -0.14520263671875, -0.132080078125, -0.11895751953125, -0.1058349609375, -0.09271240234375, -0.07958984375, -0.06646728515625, -0.0533447265625, -0.04022216796875, -0.027099609375, -0.01397705078125, -0.0008544921875, 0.01226806640625, 0.025390625, 0.03851318359375, 0.0516357421875, 0.06475830078125, 0.077880859375, 0.09100341796875, 0.1041259765625, 0.11724853515625, 0.13037109375, 0.14349365234375, 0.1566162109375, 0.16973876953125, 0.182861328125, 0.19598388671875, 0.2091064453125, 0.22222900390625, 0.2353515625, 0.24847412109375, 0.2615966796875, 0.27471923828125, 0.287841796875, 0.30096435546875, 0.3140869140625, 0.32720947265625, 0.34033203125, 0.35345458984375, 0.3665771484375, 0.37969970703125, 0.392822265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 66.0, 250.0, 491.0, 140.0, 30.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07952880859375, -0.07721328735351562, -0.07489776611328125, -0.07258224487304688, -0.0702667236328125, -0.06795120239257812, -0.06563568115234375, -0.06332015991210938, -0.061004638671875, -0.058689117431640625, -0.05637359619140625, -0.054058074951171875, -0.0517425537109375, -0.049427032470703125, -0.04711151123046875, -0.044795989990234375, -0.04248046875, -0.040164947509765625, -0.03784942626953125, -0.035533905029296875, -0.0332183837890625, -0.030902862548828125, -0.02858734130859375, -0.026271820068359375, -0.023956298828125, -0.021640777587890625, -0.01932525634765625, -0.017009735107421875, -0.0146942138671875, -0.012378692626953125, -0.01006317138671875, -0.007747650146484375, -0.00543212890625, -0.003116607666015625, -0.00080108642578125, 0.001514434814453125, 0.0038299560546875, 0.006145477294921875, 0.00846099853515625, 0.010776519775390625, 0.013092041015625, 0.015407562255859375, 0.01772308349609375, 0.020038604736328125, 0.0223541259765625, 0.024669647216796875, 0.02698516845703125, 0.029300689697265625, 0.0316162109375, 0.033931732177734375, 0.03624725341796875, 0.038562774658203125, 0.0408782958984375, 0.043193817138671875, 0.04550933837890625, 0.047824859619140625, 0.050140380859375, 0.052455902099609375, 0.05477142333984375, 0.057086944580078125, 0.0594024658203125, 0.061717987060546875, 0.06403350830078125, 0.06634902954101562, 0.06866455078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 9.0, 3.0, 10.0, 10.0, 14.0, 18.0, 28.0, 32.0, 45.0, 78.0, 131.0, 205.0, 341.0, 767.0, 2001.0, 8505.0, 93442.0, 3876830.0, 194966.0, 12529.0, 2470.0, 802.0, 388.0, 230.0, 124.0, 77.0, 73.0, 45.0, 21.0, 15.0, 20.0, 14.0, 5.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.061309814453125, -0.059369564056396484, -0.05742931365966797, -0.05548906326293945, -0.05354881286621094, -0.05160856246948242, -0.049668312072753906, -0.04772806167602539, -0.045787811279296875, -0.04384756088256836, -0.041907310485839844, -0.03996706008911133, -0.03802680969238281, -0.0360865592956543, -0.03414630889892578, -0.032206058502197266, -0.03026580810546875, -0.028325557708740234, -0.02638530731201172, -0.024445056915283203, -0.022504806518554688, -0.020564556121826172, -0.018624305725097656, -0.01668405532836914, -0.014743804931640625, -0.01280355453491211, -0.010863304138183594, -0.008923053741455078, -0.0069828033447265625, -0.005042552947998047, -0.0031023025512695312, -0.0011620521545410156, 0.0007781982421875, 0.0027184486389160156, 0.004658699035644531, 0.006598949432373047, 0.008539199829101562, 0.010479450225830078, 0.012419700622558594, 0.01435995101928711, 0.016300201416015625, 0.01824045181274414, 0.020180702209472656, 0.022120952606201172, 0.024061203002929688, 0.026001453399658203, 0.02794170379638672, 0.029881954193115234, 0.03182220458984375, 0.033762454986572266, 0.03570270538330078, 0.0376429557800293, 0.03958320617675781, 0.04152345657348633, 0.043463706970214844, 0.04540395736694336, 0.047344207763671875, 0.04928445816040039, 0.051224708557128906, 0.05316495895385742, 0.05510520935058594, 0.05704545974731445, 0.05898571014404297, 0.060925960540771484, 0.0628662109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 13.0, 10.0, 11.0, 21.0, 29.0, 48.0, 58.0, 74.0, 118.0, 149.0, 296.0, 420.0, 628.0, 748.0, 470.0, 274.0, 185.0, 110.0, 105.0, 72.0, 46.0, 41.0, 35.0, 19.0, 17.0, 10.0, 14.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0232086181640625, -0.022531509399414062, -0.021854400634765625, -0.021177291870117188, -0.02050018310546875, -0.019823074340820312, -0.019145965576171875, -0.018468856811523438, -0.017791748046875, -0.017114639282226562, -0.016437530517578125, -0.015760421752929688, -0.01508331298828125, -0.014406204223632812, -0.013729095458984375, -0.013051986694335938, -0.0123748779296875, -0.011697769165039062, -0.011020660400390625, -0.010343551635742188, -0.00966644287109375, -0.008989334106445312, -0.008312225341796875, -0.0076351165771484375, -0.0069580078125, -0.0062808990478515625, -0.005603790283203125, -0.0049266815185546875, -0.00424957275390625, -0.0035724639892578125, -0.002895355224609375, -0.0022182464599609375, -0.0015411376953125, -0.0008640289306640625, -0.000186920166015625, 0.0004901885986328125, 0.00116729736328125, 0.0018444061279296875, 0.002521514892578125, 0.0031986236572265625, 0.003875732421875, 0.0045528411865234375, 0.005229949951171875, 0.0059070587158203125, 0.00658416748046875, 0.0072612762451171875, 0.007938385009765625, 0.008615493774414062, 0.0092926025390625, 0.009969711303710938, 0.010646820068359375, 0.011323928833007812, 0.01200103759765625, 0.012678146362304688, 0.013355255126953125, 0.014032363891601562, 0.01470947265625, 0.015386581420898438, 0.016063690185546875, 0.016740798950195312, 0.01741790771484375, 0.018095016479492188, 0.018772125244140625, 0.019449234008789062, 0.0201263427734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 33.0, 909.0, 62.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9128276705741882, -0.8871968388557434, -0.8615660071372986, -0.8359351754188538, -0.8103043437004089, -0.7846734523773193, -0.7590426206588745, -0.7334117889404297, -0.7077809572219849, -0.68215012550354, -0.6565192937850952, -0.6308884620666504, -0.6052576303482056, -0.5796267986297607, -0.5539959669113159, -0.5283650755882263, -0.5027343034744263, -0.47710347175598145, -0.4514726400375366, -0.4258418083190918, -0.4002109467983246, -0.37458011507987976, -0.34894928336143494, -0.3233184218406677, -0.2976875901222229, -0.2720567584037781, -0.24642591178417206, -0.22079508006572723, -0.19516423344612122, -0.1695334017276764, -0.14390257000923157, -0.11827172338962555, -0.09264087677001953, -0.06701003760099411, -0.04137920215725899, -0.015748366713523865, 0.009882472455501556, 0.03551331162452698, 0.0611441433429718, 0.08677498996257782, 0.11240582168102264, 0.13803665339946747, 0.1636675000190735, 0.1892983317375183, 0.21492916345596313, 0.24056001007556915, 0.2661908268928528, 0.29182168841362, 0.3174525201320648, 0.34308335185050964, 0.36871418356895447, 0.3943450450897217, 0.4199758768081665, 0.44560670852661133, 0.47123754024505615, 0.496868371963501, 0.5224992036819458, 0.5481300354003906, 0.5737608671188354, 0.5993916988372803, 0.6250225305557251, 0.6506533622741699, 0.6762841939926147, 0.7019150853157043, 0.7275459170341492]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 15.0, 15.0, 15.0, 29.0, 36.0, 47.0, 67.0, 83.0, 90.0, 63.0, 95.0, 85.0, 70.0, 67.0, 52.0, 44.0, 42.0, 16.0, 19.0, 15.0, 8.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10208785533905029, -0.09830343723297119, -0.09451901912689209, -0.09073460102081299, -0.08695018291473389, -0.08316576480865479, -0.07938135415315628, -0.07559693604707718, -0.07181251794099808, -0.06802809983491898, -0.06424368172883987, -0.06045926734805107, -0.05667484924197197, -0.05289043113589287, -0.049106016755104065, -0.04532159864902496, -0.04153718054294586, -0.03775276243686676, -0.03396834433078766, -0.030183929949998856, -0.026399511843919754, -0.022615093737840652, -0.0188306774944067, -0.015046261250972748, -0.011261843144893646, -0.007477425970137119, -0.0036930087953805923, 9.14083793759346e-05, 0.0038758255541324615, 0.007660243660211563, 0.011444659903645515, 0.015229076147079468, 0.01901349425315857, 0.02279791235923767, 0.026582328602671623, 0.030366744846105576, 0.03415116295218468, 0.03793558105826378, 0.04171999543905258, 0.04550441354513168, 0.049288831651210785, 0.053073249757289886, 0.05685766786336899, 0.06064208224415779, 0.0644264966249466, 0.0682109147310257, 0.0719953328371048, 0.0757797509431839, 0.079564169049263, 0.0833485871553421, 0.0871330052614212, 0.0909174233675003, 0.0947018414735794, 0.09848625957965851, 0.10227067023515701, 0.10605508834123611, 0.10983950644731522, 0.11362392455339432, 0.11740834265947342, 0.12119276076555252, 0.12497717142105103, 0.12876158952713013, 0.13254600763320923, 0.13633042573928833, 0.14011484384536743]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 13.0, 9.0, 17.0, 19.0, 17.0, 21.0, 31.0, 36.0, 47.0, 65.0, 81.0, 116.0, 158.0, 217.0, 338.0, 596.0, 1404.0, 7648.0, 885982.0, 144987.0, 4071.0, 1074.0, 508.0, 282.0, 189.0, 146.0, 109.0, 74.0, 63.0, 48.0, 33.0, 35.0, 18.0, 16.0, 14.0, 15.0, 13.0, 5.0, 7.0, 4.0, 6.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.303955078125, -0.2949790954589844, -0.28600311279296875, -0.2770271301269531, -0.2680511474609375, -0.2590751647949219, -0.25009918212890625, -0.24112319946289062, -0.232147216796875, -0.22317123413085938, -0.21419525146484375, -0.20521926879882812, -0.1962432861328125, -0.18726730346679688, -0.17829132080078125, -0.16931533813476562, -0.16033935546875, -0.15136337280273438, -0.14238739013671875, -0.13341140747070312, -0.1244354248046875, -0.11545944213867188, -0.10648345947265625, -0.09750747680664062, -0.088531494140625, -0.07955551147460938, -0.07057952880859375, -0.061603546142578125, -0.0526275634765625, -0.043651580810546875, -0.03467559814453125, -0.025699615478515625, -0.0167236328125, -0.007747650146484375, 0.00122833251953125, 0.010204315185546875, 0.0191802978515625, 0.028156280517578125, 0.03713226318359375, 0.046108245849609375, 0.055084228515625, 0.06406021118164062, 0.07303619384765625, 0.08201217651367188, 0.0909881591796875, 0.09996414184570312, 0.10894012451171875, 0.11791610717773438, 0.12689208984375, 0.13586807250976562, 0.14484405517578125, 0.15382003784179688, 0.1627960205078125, 0.17177200317382812, 0.18074798583984375, 0.18972396850585938, 0.198699951171875, 0.20767593383789062, 0.21665191650390625, 0.22562789916992188, 0.2346038818359375, 0.24357986450195312, 0.25255584716796875, 0.2615318298339844, 0.2705078125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 61.0, 245.0, 481.0, 164.0, 29.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07940673828125, -0.07709980010986328, -0.07479286193847656, -0.07248592376708984, -0.07017898559570312, -0.0678720474243164, -0.06556510925292969, -0.06325817108154297, -0.06095123291015625, -0.05864429473876953, -0.05633735656738281, -0.054030418395996094, -0.051723480224609375, -0.049416542053222656, -0.04710960388183594, -0.04480266571044922, -0.0424957275390625, -0.04018878936767578, -0.03788185119628906, -0.035574913024902344, -0.033267974853515625, -0.030961036682128906, -0.028654098510742188, -0.02634716033935547, -0.02404022216796875, -0.02173328399658203, -0.019426345825195312, -0.017119407653808594, -0.014812469482421875, -0.012505531311035156, -0.010198593139648438, -0.007891654968261719, -0.005584716796875, -0.0032777786254882812, -0.0009708404541015625, 0.0013360977172851562, 0.003643035888671875, 0.005949974060058594, 0.008256912231445312, 0.010563850402832031, 0.01287078857421875, 0.015177726745605469, 0.017484664916992188, 0.019791603088378906, 0.022098541259765625, 0.024405479431152344, 0.026712417602539062, 0.02901935577392578, 0.0313262939453125, 0.03363323211669922, 0.03594017028808594, 0.038247108459472656, 0.040554046630859375, 0.042860984802246094, 0.04516792297363281, 0.04747486114501953, 0.04978179931640625, 0.05208873748779297, 0.05439567565917969, 0.056702613830566406, 0.059009552001953125, 0.061316490173339844, 0.06362342834472656, 0.06593036651611328, 0.0682373046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 13.0, 9.0, 14.0, 15.0, 24.0, 44.0, 47.0, 64.0, 119.0, 162.0, 242.0, 435.0, 1039.0, 5065.0, 102889.0, 915724.0, 18672.0, 2223.0, 701.0, 363.0, 199.0, 129.0, 88.0, 57.0, 51.0, 36.0, 24.0, 17.0, 11.0, 15.0, 8.0, 4.0, 3.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2166748046875, -0.21035194396972656, -0.20402908325195312, -0.1977062225341797, -0.19138336181640625, -0.1850605010986328, -0.17873764038085938, -0.17241477966308594, -0.1660919189453125, -0.15976905822753906, -0.15344619750976562, -0.1471233367919922, -0.14080047607421875, -0.1344776153564453, -0.12815475463867188, -0.12183189392089844, -0.115509033203125, -0.10918617248535156, -0.10286331176757812, -0.09654045104980469, -0.09021759033203125, -0.08389472961425781, -0.07757186889648438, -0.07124900817871094, -0.0649261474609375, -0.05860328674316406, -0.052280426025390625, -0.04595756530761719, -0.03963470458984375, -0.03331184387207031, -0.026988983154296875, -0.020666122436523438, -0.01434326171875, -0.008020401000976562, -0.001697540283203125, 0.0046253204345703125, 0.01094818115234375, 0.017271041870117188, 0.023593902587890625, 0.029916763305664062, 0.0362396240234375, 0.04256248474121094, 0.048885345458984375, 0.05520820617675781, 0.06153106689453125, 0.06785392761230469, 0.07417678833007812, 0.08049964904785156, 0.086822509765625, 0.09314537048339844, 0.09946823120117188, 0.10579109191894531, 0.11211395263671875, 0.11843681335449219, 0.12475967407226562, 0.13108253479003906, 0.1374053955078125, 0.14372825622558594, 0.15005111694335938, 0.1563739776611328, 0.16269683837890625, 0.1690196990966797, 0.17534255981445312, 0.18166542053222656, 0.18798828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 11.0, 7.0, 9.0, 34.0, 32.0, 40.0, 53.0, 71.0, 82.0, 78.0, 102.0, 82.0, 74.0, 74.0, 49.0, 42.0, 28.0, 25.0, 22.0, 14.0, 12.0, 12.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.055694580078125, -0.053815364837646484, -0.05193614959716797, -0.05005693435668945, -0.04817771911621094, -0.04629850387573242, -0.044419288635253906, -0.04254007339477539, -0.040660858154296875, -0.03878164291381836, -0.036902427673339844, -0.03502321243286133, -0.03314399719238281, -0.0312647819519043, -0.02938556671142578, -0.027506351470947266, -0.02562713623046875, -0.023747920989990234, -0.02186870574951172, -0.019989490509033203, -0.018110275268554688, -0.016231060028076172, -0.014351844787597656, -0.01247262954711914, -0.010593414306640625, -0.00871419906616211, -0.006834983825683594, -0.004955768585205078, -0.0030765533447265625, -0.0011973381042480469, 0.0006818771362304688, 0.0025610923767089844, 0.0044403076171875, 0.006319522857666016, 0.008198738098144531, 0.010077953338623047, 0.011957168579101562, 0.013836383819580078, 0.015715599060058594, 0.01759481430053711, 0.019474029541015625, 0.02135324478149414, 0.023232460021972656, 0.025111675262451172, 0.026990890502929688, 0.028870105743408203, 0.03074932098388672, 0.032628536224365234, 0.03450775146484375, 0.036386966705322266, 0.03826618194580078, 0.0401453971862793, 0.04202461242675781, 0.04390382766723633, 0.045783042907714844, 0.04766225814819336, 0.049541473388671875, 0.05142068862915039, 0.053299903869628906, 0.05517911911010742, 0.05705833435058594, 0.05893754959106445, 0.06081676483154297, 0.06269598007202148, 0.0645751953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 12.0, 17.0, 37.0, 56.0, 114.0, 210.0, 476.0, 1138.0, 3117.0, 11576.0, 881010.0, 138055.0, 8414.0, 2461.0, 935.0, 439.0, 206.0, 121.0, 51.0, 25.0, 26.0, 14.0, 10.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14318466186523438, -0.13805389404296875, -0.13292312622070312, -0.1277923583984375, -0.12266159057617188, -0.11753082275390625, -0.11240005493164062, -0.107269287109375, -0.10213851928710938, -0.09700775146484375, -0.09187698364257812, -0.0867462158203125, -0.08161544799804688, -0.07648468017578125, -0.07135391235351562, -0.06622314453125, -0.061092376708984375, -0.05596160888671875, -0.050830841064453125, -0.0457000732421875, -0.040569305419921875, -0.03543853759765625, -0.030307769775390625, -0.025177001953125, -0.020046234130859375, -0.01491546630859375, -0.009784698486328125, -0.0046539306640625, 0.000476837158203125, 0.00560760498046875, 0.010738372802734375, 0.015869140625, 0.020999908447265625, 0.02613067626953125, 0.031261444091796875, 0.0363922119140625, 0.041522979736328125, 0.04665374755859375, 0.051784515380859375, 0.056915283203125, 0.062046051025390625, 0.06717681884765625, 0.07230758666992188, 0.0774383544921875, 0.08256912231445312, 0.08769989013671875, 0.09283065795898438, 0.09796142578125, 0.10309219360351562, 0.10822296142578125, 0.11335372924804688, 0.1184844970703125, 0.12361526489257812, 0.12874603271484375, 0.13387680053710938, 0.139007568359375, 0.14413833618164062, 0.14926910400390625, 0.15439987182617188, 0.1595306396484375, 0.16466140747070312, 0.16979217529296875, 0.17492294311523438, 0.1800537109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 5.0, 8.0, 5.0, 7.0, 11.0, 17.0, 25.0, 41.0, 67.0, 135.0, 152.0, 183.0, 125.0, 69.0, 31.0, 21.0, 20.0, 13.0, 12.0, 4.0, 4.0, 6.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021266937255859375, -0.00020641088485717773, -0.00020015239715576172, -0.0001938939094543457, -0.0001876354217529297, -0.00018137693405151367, -0.00017511844635009766, -0.00016885995864868164, -0.00016260147094726562, -0.0001563429832458496, -0.0001500844955444336, -0.00014382600784301758, -0.00013756752014160156, -0.00013130903244018555, -0.00012505054473876953, -0.00011879205703735352, -0.0001125335693359375, -0.00010627508163452148, -0.00010001659393310547, -9.375810623168945e-05, -8.749961853027344e-05, -8.124113082885742e-05, -7.49826431274414e-05, -6.872415542602539e-05, -6.246566772460938e-05, -5.620718002319336e-05, -4.9948692321777344e-05, -4.369020462036133e-05, -3.743171691894531e-05, -3.11732292175293e-05, -2.491474151611328e-05, -1.8656253814697266e-05, -1.239776611328125e-05, -6.139278411865234e-06, 1.1920928955078125e-07, 6.377696990966797e-06, 1.2636184692382812e-05, 1.8894672393798828e-05, 2.5153160095214844e-05, 3.141164779663086e-05, 3.7670135498046875e-05, 4.392862319946289e-05, 5.0187110900878906e-05, 5.644559860229492e-05, 6.270408630371094e-05, 6.896257400512695e-05, 7.522106170654297e-05, 8.147954940795898e-05, 8.7738037109375e-05, 9.399652481079102e-05, 0.00010025501251220703, 0.00010651350021362305, 0.00011277198791503906, 0.00011903047561645508, 0.0001252889633178711, 0.0001315474510192871, 0.00013780593872070312, 0.00014406442642211914, 0.00015032291412353516, 0.00015658140182495117, 0.0001628398895263672, 0.0001690983772277832, 0.00017535686492919922, 0.00018161535263061523, 0.00018787384033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 8.0, 9.0, 7.0, 13.0, 17.0, 15.0, 30.0, 35.0, 66.0, 128.0, 355.0, 1164.0, 5463.0, 426027.0, 607688.0, 5639.0, 1138.0, 368.0, 166.0, 66.0, 44.0, 28.0, 21.0, 11.0, 9.0, 7.0, 10.0, 5.0, 1.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.13186931610107422, -0.12787437438964844, -0.12387943267822266, -0.11988449096679688, -0.1158895492553711, -0.11189460754394531, -0.10789966583251953, -0.10390472412109375, -0.09990978240966797, -0.09591484069824219, -0.0919198989868164, -0.08792495727539062, -0.08393001556396484, -0.07993507385253906, -0.07594013214111328, -0.0719451904296875, -0.06795024871826172, -0.06395530700683594, -0.059960365295410156, -0.055965423583984375, -0.051970481872558594, -0.04797554016113281, -0.04398059844970703, -0.03998565673828125, -0.03599071502685547, -0.03199577331542969, -0.028000831604003906, -0.024005889892578125, -0.020010948181152344, -0.016016006469726562, -0.012021064758300781, -0.008026123046875, -0.004031181335449219, -3.62396240234375e-05, 0.003958702087402344, 0.007953643798828125, 0.011948585510253906, 0.015943527221679688, 0.01993846893310547, 0.02393341064453125, 0.02792835235595703, 0.03192329406738281, 0.035918235778808594, 0.039913177490234375, 0.043908119201660156, 0.04790306091308594, 0.05189800262451172, 0.0558929443359375, 0.05988788604736328, 0.06388282775878906, 0.06787776947021484, 0.07187271118164062, 0.0758676528930664, 0.07986259460449219, 0.08385753631591797, 0.08785247802734375, 0.09184741973876953, 0.09584236145019531, 0.0998373031616211, 0.10383224487304688, 0.10782718658447266, 0.11182212829589844, 0.11581707000732422, 0.11981201171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 16.0, 14.0, 32.0, 53.0, 208.0, 400.0, 143.0, 39.0, 23.0, 18.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.04864501953125, -0.04747152328491211, -0.04629802703857422, -0.04512453079223633, -0.04395103454589844, -0.04277753829956055, -0.041604042053222656, -0.040430545806884766, -0.039257049560546875, -0.038083553314208984, -0.036910057067871094, -0.0357365608215332, -0.03456306457519531, -0.03338956832885742, -0.03221607208251953, -0.03104257583618164, -0.02986907958984375, -0.02869558334350586, -0.02752208709716797, -0.026348590850830078, -0.025175094604492188, -0.024001598358154297, -0.022828102111816406, -0.021654605865478516, -0.020481109619140625, -0.019307613372802734, -0.018134117126464844, -0.016960620880126953, -0.015787124633789062, -0.014613628387451172, -0.013440132141113281, -0.01226663589477539, -0.0110931396484375, -0.00991964340209961, -0.008746147155761719, -0.007572650909423828, -0.0063991546630859375, -0.005225658416748047, -0.004052162170410156, -0.0028786659240722656, -0.001705169677734375, -0.0005316734313964844, 0.0006418228149414062, 0.0018153190612792969, 0.0029888153076171875, 0.004162311553955078, 0.005335807800292969, 0.006509304046630859, 0.00768280029296875, 0.00885629653930664, 0.010029792785644531, 0.011203289031982422, 0.012376785278320312, 0.013550281524658203, 0.014723777770996094, 0.015897274017333984, 0.017070770263671875, 0.018244266510009766, 0.019417762756347656, 0.020591259002685547, 0.021764755249023438, 0.022938251495361328, 0.02411174774169922, 0.02528524398803711, 0.026458740234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 35.0, 745.0, 220.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.697610855102539, -1.6559439897537231, -1.6142770051956177, -1.5726101398468018, -1.5309431552886963, -1.4892762899398804, -1.447609305381775, -1.405942440032959, -1.3642754554748535, -1.3226085901260376, -1.2809416055679321, -1.2392747402191162, -1.1976077556610107, -1.1559408903121948, -1.1142739057540894, -1.0726070404052734, -1.030940055847168, -0.9892731308937073, -0.9476062059402466, -0.9059392809867859, -0.8642723560333252, -0.8226054310798645, -0.7809385061264038, -0.7392716407775879, -0.697604775428772, -0.6559378504753113, -0.6142709255218506, -0.5726040005683899, -0.5309370756149292, -0.4892701506614685, -0.4476032555103302, -0.4059363305568695, -0.3642693758010864, -0.32260245084762573, -0.28093552589416504, -0.23926861584186554, -0.19760169088840485, -0.15593476593494415, -0.11426785588264465, -0.07260093092918396, -0.030934005975723267, 0.010732915252447128, 0.05239983648061752, 0.09406675398349762, 0.1357336789369583, 0.177400603890419, 0.2190675139427185, 0.2607344388961792, 0.3024013638496399, 0.3440682888031006, 0.3857352137565613, 0.427402138710022, 0.46906906366348267, 0.5107359886169434, 0.5524028539657593, 0.5940698385238647, 0.6357367038726807, 0.6774036288261414, 0.719070553779602, 0.7607374787330627, 0.8024044036865234, 0.8440713286399841, 0.8857382535934448, 0.9274051189422607, 0.9690721035003662]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 11.0, 6.0, 12.0, 11.0, 9.0, 17.0, 31.0, 19.0, 34.0, 35.0, 31.0, 46.0, 49.0, 40.0, 45.0, 48.0, 40.0, 51.0, 48.0, 59.0, 52.0, 48.0, 50.0, 35.0, 22.0, 32.0, 24.0, 21.0, 20.0, 15.0, 12.0, 13.0, 5.0, 5.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13452327251434326, -0.13065354526042938, -0.1267838180065155, -0.12291409075260162, -0.11904436349868774, -0.11517463624477386, -0.11130491644144058, -0.1074351891875267, -0.10356546193361282, -0.09969573467969894, -0.09582600742578506, -0.09195628017187119, -0.0880865603685379, -0.08421683311462402, -0.08034710586071014, -0.07647737860679626, -0.07260765135288239, -0.0687379240989685, -0.06486819684505463, -0.060998473316431046, -0.057128746062517166, -0.05325901880860329, -0.049389295279979706, -0.045519568026065826, -0.04164984077215195, -0.03778011351823807, -0.03391038626432419, -0.030040662735700607, -0.026170935481786728, -0.02230120822787285, -0.01843148283660412, -0.014561757445335388, -0.010692030191421509, -0.006822303868830204, -0.0029525775462388992, 0.0009171487763524055, 0.00478687509894371, 0.00865660235285759, 0.01252632774412632, 0.01639605313539505, 0.02026578038930893, 0.02413550764322281, 0.02800523303449154, 0.03187495842576027, 0.03574468567967415, 0.03961441293358803, 0.04348413646221161, 0.04735386371612549, 0.05122359097003937, 0.05509331822395325, 0.058963045477867126, 0.062832772731781, 0.06670249998569489, 0.07057222723960876, 0.07444194704294205, 0.07831167429685593, 0.0821814015507698, 0.08605112880468369, 0.08992085605859756, 0.09379058331251144, 0.09766030311584473, 0.1015300303697586, 0.10539975762367249, 0.10926948487758636, 0.11313921213150024]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 6.0, 8.0, 13.0, 28.0, 27.0, 44.0, 85.0, 157.0, 378.0, 2529.0, 11305.0, 4143417.0, 31615.0, 3164.0, 795.0, 300.0, 151.0, 91.0, 65.0, 31.0, 22.0, 15.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10597896575927734, -0.10130119323730469, -0.09662342071533203, -0.09194564819335938, -0.08726787567138672, -0.08259010314941406, -0.0779123306274414, -0.07323455810546875, -0.0685567855834961, -0.06387901306152344, -0.05920124053955078, -0.054523468017578125, -0.04984569549560547, -0.04516792297363281, -0.040490150451660156, -0.0358123779296875, -0.031134605407714844, -0.026456832885742188, -0.02177906036376953, -0.017101287841796875, -0.012423515319824219, -0.0077457427978515625, -0.0030679702758789062, 0.00160980224609375, 0.006287574768066406, 0.010965347290039062, 0.01564311981201172, 0.020320892333984375, 0.02499866485595703, 0.029676437377929688, 0.034354209899902344, 0.039031982421875, 0.043709754943847656, 0.04838752746582031, 0.05306529998779297, 0.057743072509765625, 0.06242084503173828, 0.06709861755371094, 0.0717763900756836, 0.07645416259765625, 0.0811319351196289, 0.08580970764160156, 0.09048748016357422, 0.09516525268554688, 0.09984302520751953, 0.10452079772949219, 0.10919857025146484, 0.1138763427734375, 0.11855411529541016, 0.12323188781738281, 0.12790966033935547, 0.13258743286132812, 0.13726520538330078, 0.14194297790527344, 0.1466207504272461, 0.15129852294921875, 0.1559762954711914, 0.16065406799316406, 0.16533184051513672, 0.17000961303710938, 0.17468738555908203, 0.1793651580810547, 0.18404293060302734, 0.188720703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 21.0, 133.0, 426.0, 314.0, 76.0, 21.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07568359375, -0.07345008850097656, -0.07121658325195312, -0.06898307800292969, -0.06674957275390625, -0.06451606750488281, -0.062282562255859375, -0.06004905700683594, -0.0578155517578125, -0.05558204650878906, -0.053348541259765625, -0.05111503601074219, -0.04888153076171875, -0.04664802551269531, -0.044414520263671875, -0.04218101501464844, -0.039947509765625, -0.03771400451660156, -0.035480499267578125, -0.03324699401855469, -0.03101348876953125, -0.028779983520507812, -0.026546478271484375, -0.024312973022460938, -0.0220794677734375, -0.019845962524414062, -0.017612457275390625, -0.015378952026367188, -0.01314544677734375, -0.010911941528320312, -0.008678436279296875, -0.0064449310302734375, -0.00421142578125, -0.0019779205322265625, 0.000255584716796875, 0.0024890899658203125, 0.00472259521484375, 0.0069561004638671875, 0.009189605712890625, 0.011423110961914062, 0.0136566162109375, 0.015890121459960938, 0.018123626708984375, 0.020357131958007812, 0.02259063720703125, 0.024824142456054688, 0.027057647705078125, 0.029291152954101562, 0.031524658203125, 0.03375816345214844, 0.035991668701171875, 0.03822517395019531, 0.04045867919921875, 0.04269218444824219, 0.044925689697265625, 0.04715919494628906, 0.0493927001953125, 0.05162620544433594, 0.053859710693359375, 0.05609321594238281, 0.05832672119140625, 0.06056022644042969, 0.06279373168945312, 0.06502723693847656, 0.0672607421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 20.0, 42.0, 61.0, 113.0, 174.0, 370.0, 890.0, 2974.0, 42384.0, 4027327.0, 113647.0, 4288.0, 1068.0, 427.0, 215.0, 92.0, 62.0, 35.0, 21.0, 10.0, 13.0, 8.0, 10.0, 3.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06265735626220703, -0.05988502502441406, -0.057112693786621094, -0.054340362548828125, -0.051568031311035156, -0.04879570007324219, -0.04602336883544922, -0.04325103759765625, -0.04047870635986328, -0.03770637512207031, -0.034934043884277344, -0.032161712646484375, -0.029389381408691406, -0.026617050170898438, -0.02384471893310547, -0.0210723876953125, -0.01830005645751953, -0.015527725219726562, -0.012755393981933594, -0.009983062744140625, -0.007210731506347656, -0.0044384002685546875, -0.0016660690307617188, 0.00110626220703125, 0.0038785934448242188, 0.0066509246826171875, 0.009423255920410156, 0.012195587158203125, 0.014967918395996094, 0.017740249633789062, 0.02051258087158203, 0.023284912109375, 0.02605724334716797, 0.028829574584960938, 0.031601905822753906, 0.034374237060546875, 0.037146568298339844, 0.03991889953613281, 0.04269123077392578, 0.04546356201171875, 0.04823589324951172, 0.05100822448730469, 0.053780555725097656, 0.056552886962890625, 0.059325218200683594, 0.06209754943847656, 0.06486988067626953, 0.0676422119140625, 0.07041454315185547, 0.07318687438964844, 0.0759592056274414, 0.07873153686523438, 0.08150386810302734, 0.08427619934082031, 0.08704853057861328, 0.08982086181640625, 0.09259319305419922, 0.09536552429199219, 0.09813785552978516, 0.10091018676757812, 0.1036825180053711, 0.10645484924316406, 0.10922718048095703, 0.11199951171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 14.0, 7.0, 13.0, 29.0, 42.0, 61.0, 93.0, 169.0, 243.0, 360.0, 663.0, 826.0, 529.0, 328.0, 253.0, 142.0, 94.0, 84.0, 33.0, 28.0, 19.0, 12.0, 8.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045318603515625, -0.044165849685668945, -0.04301309585571289, -0.041860342025756836, -0.04070758819580078, -0.03955483436584473, -0.03840208053588867, -0.03724932670593262, -0.03609657287597656, -0.03494381904602051, -0.03379106521606445, -0.0326383113861084, -0.031485557556152344, -0.03033280372619629, -0.029180049896240234, -0.02802729606628418, -0.026874542236328125, -0.02572178840637207, -0.024569034576416016, -0.02341628074645996, -0.022263526916503906, -0.02111077308654785, -0.019958019256591797, -0.018805265426635742, -0.017652511596679688, -0.016499757766723633, -0.015347003936767578, -0.014194250106811523, -0.013041496276855469, -0.011888742446899414, -0.01073598861694336, -0.009583234786987305, -0.00843048095703125, -0.007277727127075195, -0.006124973297119141, -0.004972219467163086, -0.0038194656372070312, -0.0026667118072509766, -0.0015139579772949219, -0.0003612041473388672, 0.0007915496826171875, 0.0019443035125732422, 0.003097057342529297, 0.0042498111724853516, 0.005402565002441406, 0.006555318832397461, 0.007708072662353516, 0.00886082649230957, 0.010013580322265625, 0.01116633415222168, 0.012319087982177734, 0.013471841812133789, 0.014624595642089844, 0.0157773494720459, 0.016930103302001953, 0.018082857131958008, 0.019235610961914062, 0.020388364791870117, 0.021541118621826172, 0.022693872451782227, 0.02384662628173828, 0.024999380111694336, 0.02615213394165039, 0.027304887771606445, 0.0284576416015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 11.0, 52.0, 685.0, 251.0, 11.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6076231598854065, -0.5864946246147156, -0.5653660297393799, -0.544237494468689, -0.523108959197998, -0.5019804239273071, -0.48085182905197144, -0.4597232937812805, -0.4385947287082672, -0.4174661636352539, -0.396337628364563, -0.3752090632915497, -0.3540804982185364, -0.33295196294784546, -0.31182339787483215, -0.29069483280181885, -0.26956629753112793, -0.24843774735927582, -0.2273091971874237, -0.2061806321144104, -0.1850520819425583, -0.16392353177070618, -0.14279496669769287, -0.12166641652584076, -0.10053786635398865, -0.07940931618213654, -0.05828075855970383, -0.03715220093727112, -0.016023650765419006, 0.0051048994064331055, 0.02623346447944641, 0.04736201465129852, 0.06849062442779541, 0.08961917459964752, 0.11074773222208023, 0.13187628984451294, 0.15300484001636505, 0.17413339018821716, 0.19526195526123047, 0.21639050543308258, 0.2375190556049347, 0.258647620677948, 0.2797761559486389, 0.3009047210216522, 0.3220332860946655, 0.34316182136535645, 0.36429038643836975, 0.38541895151138306, 0.406547486782074, 0.4276760518550873, 0.4488045871257782, 0.4699331521987915, 0.4910616874694824, 0.5121902227401733, 0.533318817615509, 0.5544473528862, 0.5755759477615356, 0.5967044830322266, 0.6178330779075623, 0.6389616131782532, 0.6600901484489441, 0.6812187433242798, 0.7023472785949707, 0.7234758138656616, 0.7446043491363525]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 7.0, 13.0, 18.0, 23.0, 40.0, 48.0, 52.0, 80.0, 79.0, 87.0, 81.0, 88.0, 91.0, 62.0, 64.0, 52.0, 31.0, 28.0, 16.0, 19.0, 12.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16862046718597412, -0.16302843391895294, -0.15743640065193176, -0.15184436738491058, -0.1462523341178894, -0.14066031575202942, -0.13506828248500824, -0.12947624921798706, -0.12388421595096588, -0.1182921826839447, -0.11270014941692352, -0.10710812360048294, -0.10151609033346176, -0.09592405706644058, -0.09033203125, -0.08473999798297882, -0.07914796471595764, -0.07355593144893646, -0.06796389818191528, -0.0623718723654747, -0.05677983909845352, -0.05118780583143234, -0.04559577628970146, -0.04000374674797058, -0.0344117134809494, -0.028819682076573372, -0.023227650672197342, -0.017635619267821312, -0.012043587863445282, -0.006451556459069252, -0.000859525054693222, 0.004732504487037659, 0.010324537754058838, 0.015916569158434868, 0.021508600562810898, 0.027100631967186928, 0.03269266337156296, 0.03828469663858414, 0.04387672618031502, 0.0494687557220459, 0.05506078898906708, 0.06065282225608826, 0.06624485552310944, 0.07183688133955002, 0.0774289146065712, 0.08302094787359238, 0.08861297369003296, 0.09420500695705414, 0.09979704022407532, 0.1053890734910965, 0.11098110675811768, 0.11657313257455826, 0.12216516584157944, 0.12775719165802002, 0.1333492249250412, 0.13894125819206238, 0.14453329145908356, 0.15012532472610474, 0.15571735799312592, 0.1613093912601471, 0.16690140962600708, 0.17249344289302826, 0.17808547616004944, 0.18367750942707062, 0.1892695426940918]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 6.0, 7.0, 10.0, 11.0, 12.0, 15.0, 19.0, 26.0, 27.0, 64.0, 58.0, 102.0, 134.0, 178.0, 298.0, 437.0, 810.0, 2454.0, 26684.0, 972716.0, 39185.0, 2867.0, 952.0, 476.0, 252.0, 219.0, 124.0, 108.0, 57.0, 53.0, 34.0, 28.0, 28.0, 22.0, 18.0, 6.0, 12.0, 16.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1678466796875, -0.16298866271972656, -0.15813064575195312, -0.1532726287841797, -0.14841461181640625, -0.1435565948486328, -0.13869857788085938, -0.13384056091308594, -0.1289825439453125, -0.12412452697753906, -0.11926651000976562, -0.11440849304199219, -0.10955047607421875, -0.10469245910644531, -0.09983444213867188, -0.09497642517089844, -0.090118408203125, -0.08526039123535156, -0.08040237426757812, -0.07554435729980469, -0.07068634033203125, -0.06582832336425781, -0.060970306396484375, -0.05611228942871094, -0.0512542724609375, -0.04639625549316406, -0.041538238525390625, -0.03668022155761719, -0.03182220458984375, -0.026964187622070312, -0.022106170654296875, -0.017248153686523438, -0.01239013671875, -0.0075321197509765625, -0.002674102783203125, 0.0021839141845703125, 0.00704193115234375, 0.011899948120117188, 0.016757965087890625, 0.021615982055664062, 0.0264739990234375, 0.03133201599121094, 0.036190032958984375, 0.04104804992675781, 0.04590606689453125, 0.05076408386230469, 0.055622100830078125, 0.06048011779785156, 0.065338134765625, 0.07019615173339844, 0.07505416870117188, 0.07991218566894531, 0.08477020263671875, 0.08962821960449219, 0.09448623657226562, 0.09934425354003906, 0.1042022705078125, 0.10906028747558594, 0.11391830444335938, 0.11877632141113281, 0.12363433837890625, 0.1284923553466797, 0.13335037231445312, 0.13820838928222656, 0.14306640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 34.0, 163.0, 447.0, 283.0, 51.0, 15.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0745849609375, -0.0723714828491211, -0.07015800476074219, -0.06794452667236328, -0.06573104858398438, -0.06351757049560547, -0.06130409240722656, -0.059090614318847656, -0.05687713623046875, -0.054663658142089844, -0.05245018005371094, -0.05023670196533203, -0.048023223876953125, -0.04580974578857422, -0.04359626770019531, -0.041382789611816406, -0.0391693115234375, -0.036955833435058594, -0.03474235534667969, -0.03252887725830078, -0.030315399169921875, -0.02810192108154297, -0.025888442993164062, -0.023674964904785156, -0.02146148681640625, -0.019248008728027344, -0.017034530639648438, -0.014821052551269531, -0.012607574462890625, -0.010394096374511719, -0.008180618286132812, -0.005967140197753906, -0.003753662109375, -0.0015401840209960938, 0.0006732940673828125, 0.0028867721557617188, 0.005100250244140625, 0.007313728332519531, 0.009527206420898438, 0.011740684509277344, 0.01395416259765625, 0.016167640686035156, 0.018381118774414062, 0.02059459686279297, 0.022808074951171875, 0.02502155303955078, 0.027235031127929688, 0.029448509216308594, 0.0316619873046875, 0.033875465393066406, 0.03608894348144531, 0.03830242156982422, 0.040515899658203125, 0.04272937774658203, 0.04494285583496094, 0.047156333923339844, 0.04936981201171875, 0.051583290100097656, 0.05379676818847656, 0.05601024627685547, 0.058223724365234375, 0.06043720245361328, 0.06265068054199219, 0.0648641586303711, 0.06707763671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 11.0, 18.0, 9.0, 13.0, 17.0, 28.0, 39.0, 52.0, 83.0, 148.0, 203.0, 404.0, 771.0, 2583.0, 32257.0, 948247.0, 58399.0, 3232.0, 905.0, 432.0, 228.0, 138.0, 80.0, 56.0, 60.0, 31.0, 31.0, 18.0, 9.0, 13.0, 7.0, 6.0, 2.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1583251953125, -0.1529712677001953, -0.14761734008789062, -0.14226341247558594, -0.13690948486328125, -0.13155555725097656, -0.12620162963867188, -0.12084770202636719, -0.1154937744140625, -0.11013984680175781, -0.10478591918945312, -0.09943199157714844, -0.09407806396484375, -0.08872413635253906, -0.08337020874023438, -0.07801628112792969, -0.072662353515625, -0.06730842590332031, -0.061954498291015625, -0.05660057067871094, -0.05124664306640625, -0.04589271545410156, -0.040538787841796875, -0.03518486022949219, -0.0298309326171875, -0.024477005004882812, -0.019123077392578125, -0.013769149780273438, -0.00841522216796875, -0.0030612945556640625, 0.002292633056640625, 0.0076465606689453125, 0.01300048828125, 0.018354415893554688, 0.023708343505859375, 0.029062271118164062, 0.03441619873046875, 0.03977012634277344, 0.045124053955078125, 0.05047798156738281, 0.0558319091796875, 0.06118583679199219, 0.06653976440429688, 0.07189369201660156, 0.07724761962890625, 0.08260154724121094, 0.08795547485351562, 0.09330940246582031, 0.098663330078125, 0.10401725769042969, 0.10937118530273438, 0.11472511291503906, 0.12007904052734375, 0.12543296813964844, 0.13078689575195312, 0.1361408233642578, 0.1414947509765625, 0.1468486785888672, 0.15220260620117188, 0.15755653381347656, 0.16291046142578125, 0.16826438903808594, 0.17361831665039062, 0.1789722442626953, 0.184326171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 12.0, 24.0, 7.0, 13.0, 18.0, 22.0, 20.0, 22.0, 42.0, 48.0, 53.0, 48.0, 60.0, 70.0, 62.0, 46.0, 64.0, 56.0, 51.0, 45.0, 36.0, 41.0, 29.0, 17.0, 16.0, 11.0, 16.0, 7.0, 9.0, 13.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.048259735107421875, -0.04674530029296875, -0.045230865478515625, -0.0437164306640625, -0.042201995849609375, -0.04068756103515625, -0.039173126220703125, -0.03765869140625, -0.036144256591796875, -0.03462982177734375, -0.033115386962890625, -0.0316009521484375, -0.030086517333984375, -0.02857208251953125, -0.027057647705078125, -0.025543212890625, -0.024028778076171875, -0.02251434326171875, -0.020999908447265625, -0.0194854736328125, -0.017971038818359375, -0.01645660400390625, -0.014942169189453125, -0.013427734375, -0.011913299560546875, -0.01039886474609375, -0.008884429931640625, -0.0073699951171875, -0.005855560302734375, -0.00434112548828125, -0.002826690673828125, -0.001312255859375, 0.000202178955078125, 0.00171661376953125, 0.003231048583984375, 0.0047454833984375, 0.006259918212890625, 0.00777435302734375, 0.009288787841796875, 0.01080322265625, 0.012317657470703125, 0.01383209228515625, 0.015346527099609375, 0.0168609619140625, 0.018375396728515625, 0.01988983154296875, 0.021404266357421875, 0.022918701171875, 0.024433135986328125, 0.02594757080078125, 0.027462005615234375, 0.0289764404296875, 0.030490875244140625, 0.03200531005859375, 0.033519744873046875, 0.0350341796875, 0.036548614501953125, 0.03806304931640625, 0.039577484130859375, 0.0410919189453125, 0.042606353759765625, 0.04412078857421875, 0.045635223388671875, 0.047149658203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 6.0, 6.0, 13.0, 14.0, 31.0, 51.0, 45.0, 71.0, 145.0, 262.0, 493.0, 1082.0, 2448.0, 6817.0, 20758.0, 158628.0, 801286.0, 38751.0, 10810.0, 3821.0, 1462.0, 702.0, 327.0, 154.0, 128.0, 73.0, 42.0, 31.0, 19.0, 15.0, 12.0, 16.0, 2.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054473876953125, -0.052472591400146484, -0.05047130584716797, -0.04847002029418945, -0.04646873474121094, -0.04446744918823242, -0.042466163635253906, -0.04046487808227539, -0.038463592529296875, -0.03646230697631836, -0.034461021423339844, -0.03245973587036133, -0.030458450317382812, -0.028457164764404297, -0.02645587921142578, -0.024454593658447266, -0.02245330810546875, -0.020452022552490234, -0.01845073699951172, -0.016449451446533203, -0.014448165893554688, -0.012446880340576172, -0.010445594787597656, -0.00844430923461914, -0.006443023681640625, -0.004441738128662109, -0.0024404525756835938, -0.0004391670227050781, 0.0015621185302734375, 0.003563404083251953, 0.005564689636230469, 0.007565975189208984, 0.0095672607421875, 0.011568546295166016, 0.013569831848144531, 0.015571117401123047, 0.017572402954101562, 0.019573688507080078, 0.021574974060058594, 0.02357625961303711, 0.025577545166015625, 0.02757883071899414, 0.029580116271972656, 0.03158140182495117, 0.03358268737792969, 0.0355839729309082, 0.03758525848388672, 0.039586544036865234, 0.04158782958984375, 0.043589115142822266, 0.04559040069580078, 0.0475916862487793, 0.04959297180175781, 0.05159425735473633, 0.053595542907714844, 0.05559682846069336, 0.057598114013671875, 0.05959939956665039, 0.061600685119628906, 0.06360197067260742, 0.06560325622558594, 0.06760454177856445, 0.06960582733154297, 0.07160711288452148, 0.0736083984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 8.0, 10.0, 13.0, 14.0, 21.0, 35.0, 40.0, 46.0, 71.0, 100.0, 106.0, 115.0, 117.0, 66.0, 40.0, 41.0, 21.0, 35.0, 21.0, 16.0, 16.0, 11.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.204843521118164e-05, -5.976483225822449e-05, -5.7481229305267334e-05, -5.519762635231018e-05, -5.291402339935303e-05, -5.0630420446395874e-05, -4.834681749343872e-05, -4.606321454048157e-05, -4.3779611587524414e-05, -4.149600863456726e-05, -3.921240568161011e-05, -3.6928802728652954e-05, -3.46451997756958e-05, -3.236159682273865e-05, -3.0077993869781494e-05, -2.779439091682434e-05, -2.5510787963867188e-05, -2.3227185010910034e-05, -2.094358205795288e-05, -1.8659979104995728e-05, -1.6376376152038574e-05, -1.4092773199081421e-05, -1.1809170246124268e-05, -9.525567293167114e-06, -7.241964340209961e-06, -4.958361387252808e-06, -2.6747584342956543e-06, -3.91155481338501e-07, 1.8924474716186523e-06, 4.176050424575806e-06, 6.459653377532959e-06, 8.743256330490112e-06, 1.1026859283447266e-05, 1.3310462236404419e-05, 1.5594065189361572e-05, 1.7877668142318726e-05, 2.016127109527588e-05, 2.2444874048233032e-05, 2.4728477001190186e-05, 2.701207995414734e-05, 2.9295682907104492e-05, 3.1579285860061646e-05, 3.38628888130188e-05, 3.614649176597595e-05, 3.8430094718933105e-05, 4.071369767189026e-05, 4.299730062484741e-05, 4.5280903577804565e-05, 4.756450653076172e-05, 4.984810948371887e-05, 5.2131712436676025e-05, 5.441531538963318e-05, 5.669891834259033e-05, 5.8982521295547485e-05, 6.126612424850464e-05, 6.354972720146179e-05, 6.583333015441895e-05, 6.81169331073761e-05, 7.040053606033325e-05, 7.26841390132904e-05, 7.496774196624756e-05, 7.725134491920471e-05, 7.953494787216187e-05, 8.181855082511902e-05, 8.410215377807617e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 10.0, 13.0, 19.0, 30.0, 34.0, 40.0, 96.0, 186.0, 372.0, 1653.0, 13398.0, 919667.0, 106165.0, 5385.0, 811.0, 277.0, 139.0, 86.0, 59.0, 28.0, 19.0, 17.0, 14.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1241455078125, -0.1207742691040039, -0.11740303039550781, -0.11403179168701172, -0.11066055297851562, -0.10728931427001953, -0.10391807556152344, -0.10054683685302734, -0.09717559814453125, -0.09380435943603516, -0.09043312072753906, -0.08706188201904297, -0.08369064331054688, -0.08031940460205078, -0.07694816589355469, -0.0735769271850586, -0.0702056884765625, -0.0668344497680664, -0.06346321105957031, -0.06009197235107422, -0.056720733642578125, -0.05334949493408203, -0.04997825622558594, -0.046607017517089844, -0.04323577880859375, -0.039864540100097656, -0.03649330139160156, -0.03312206268310547, -0.029750823974609375, -0.02637958526611328, -0.023008346557617188, -0.019637107849121094, -0.016265869140625, -0.012894630432128906, -0.009523391723632812, -0.006152153015136719, -0.002780914306640625, 0.0005903244018554688, 0.0039615631103515625, 0.007332801818847656, 0.01070404052734375, 0.014075279235839844, 0.017446517944335938, 0.02081775665283203, 0.024188995361328125, 0.02756023406982422, 0.030931472778320312, 0.034302711486816406, 0.0376739501953125, 0.041045188903808594, 0.04441642761230469, 0.04778766632080078, 0.051158905029296875, 0.05453014373779297, 0.05790138244628906, 0.061272621154785156, 0.06464385986328125, 0.06801509857177734, 0.07138633728027344, 0.07475757598876953, 0.07812881469726562, 0.08150005340576172, 0.08487129211425781, 0.0882425308227539, 0.09161376953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 9.0, 15.0, 14.0, 14.0, 32.0, 49.0, 100.0, 171.0, 196.0, 140.0, 77.0, 50.0, 23.0, 13.0, 13.0, 13.0, 5.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.026153564453125, -0.025314807891845703, -0.024476051330566406, -0.02363729476928711, -0.022798538208007812, -0.021959781646728516, -0.02112102508544922, -0.020282268524169922, -0.019443511962890625, -0.018604755401611328, -0.01776599884033203, -0.016927242279052734, -0.016088485717773438, -0.01524972915649414, -0.014410972595214844, -0.013572216033935547, -0.01273345947265625, -0.011894702911376953, -0.011055946350097656, -0.01021718978881836, -0.009378433227539062, -0.008539676666259766, -0.007700920104980469, -0.006862163543701172, -0.006023406982421875, -0.005184650421142578, -0.004345893859863281, -0.0035071372985839844, -0.0026683807373046875, -0.0018296241760253906, -0.0009908676147460938, -0.00015211105346679688, 0.0006866455078125, 0.0015254020690917969, 0.0023641586303710938, 0.0032029151916503906, 0.0040416717529296875, 0.004880428314208984, 0.005719184875488281, 0.006557941436767578, 0.007396697998046875, 0.008235454559326172, 0.009074211120605469, 0.009912967681884766, 0.010751724243164062, 0.01159048080444336, 0.012429237365722656, 0.013267993927001953, 0.01410675048828125, 0.014945507049560547, 0.015784263610839844, 0.01662302017211914, 0.017461776733398438, 0.018300533294677734, 0.01913928985595703, 0.019978046417236328, 0.020816802978515625, 0.021655559539794922, 0.02249431610107422, 0.023333072662353516, 0.024171829223632812, 0.02501058578491211, 0.025849342346191406, 0.026688098907470703, 0.02752685546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 13.0, 54.0, 203.0, 425.0, 229.0, 52.0, 16.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5034151077270508, -0.48789334297180176, -0.4723716080188751, -0.4568498432636261, -0.4413280785083771, -0.42580634355545044, -0.4102845788002014, -0.3947628140449524, -0.37924107909202576, -0.36371931433677673, -0.3481975793838501, -0.3326758146286011, -0.31715404987335205, -0.3016323149204254, -0.2861105501651764, -0.27058881521224976, -0.25506705045700073, -0.2395453006029129, -0.22402353584766388, -0.20850178599357605, -0.19298003613948822, -0.1774582862854004, -0.16193652153015137, -0.14641477167606354, -0.13089299201965332, -0.1153712347149849, -0.09984948486089706, -0.08432772755622864, -0.06880597770214081, -0.05328422039747238, -0.037762463092803955, -0.022240713238716125, -0.006718963384628296, 0.008802791126072407, 0.02432454563677311, 0.03984630107879639, 0.055368054658174515, 0.07088980823755264, 0.08641156554222107, 0.1019333153963089, 0.11745507270097733, 0.13297683000564575, 0.14849857985973358, 0.1640203297138214, 0.17954209446907043, 0.19506384432315826, 0.2105855941772461, 0.22610735893249512, 0.24162910878658295, 0.2571508586406708, 0.2726726233959198, 0.28819435834884644, 0.30371612310409546, 0.3192378878593445, 0.3347596526145935, 0.35028138756752014, 0.36580315232276917, 0.3813249170780182, 0.3968466520309448, 0.41236841678619385, 0.42789018154144287, 0.4434119164943695, 0.45893368124961853, 0.47445541620254517, 0.4899771809577942]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 3.0, 10.0, 12.0, 15.0, 16.0, 34.0, 22.0, 31.0, 56.0, 49.0, 60.0, 73.0, 65.0, 75.0, 59.0, 55.0, 55.0, 58.0, 43.0, 47.0, 44.0, 24.0, 22.0, 12.0, 16.0, 13.0, 7.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17116987705230713, -0.16502514481544495, -0.15888041257858276, -0.1527356654405594, -0.1465909332036972, -0.14044620096683502, -0.13430145382881165, -0.12815672159194946, -0.12201198935508728, -0.1158672571182251, -0.10972251743078232, -0.10357777774333954, -0.09743304550647736, -0.09128831326961517, -0.0851435735821724, -0.07899883389472961, -0.07285410165786743, -0.06670936942100525, -0.06056462973356247, -0.05441989377140999, -0.04827515780925751, -0.042130421847105026, -0.035985685884952545, -0.029840949922800064, -0.023696213960647583, -0.017551477998495102, -0.01140674203634262, -0.00526200607419014, 0.0008827298879623413, 0.007027465850114822, 0.013172201812267303, 0.019316937774419785, 0.025461673736572266, 0.03160640969872475, 0.03775114566087723, 0.04389588162302971, 0.05004061758518219, 0.05618535354733467, 0.06233008950948715, 0.06847482919692993, 0.07461956143379211, 0.0807642936706543, 0.08690903335809708, 0.09305377304553986, 0.09919850528240204, 0.10534323751926422, 0.111487977206707, 0.11763271689414978, 0.12377744913101196, 0.12992218136787415, 0.13606691360473633, 0.1422116607427597, 0.1483563929796219, 0.15450112521648407, 0.16064587235450745, 0.16679060459136963, 0.1729353368282318, 0.179080069065094, 0.18522480130195618, 0.19136954843997955, 0.19751428067684174, 0.20365901291370392, 0.2098037600517273, 0.21594849228858948, 0.22209322452545166]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 12.0, 7.0, 9.0, 25.0, 16.0, 40.0, 43.0, 90.0, 132.0, 303.0, 1189.0, 3513.0, 6270.0, 147583.0, 4008577.0, 19415.0, 3939.0, 1581.0, 805.0, 267.0, 150.0, 93.0, 65.0, 44.0, 29.0, 28.0, 14.0, 14.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.06729793548583984, -0.06483268737792969, -0.06236743927001953, -0.059902191162109375, -0.05743694305419922, -0.05497169494628906, -0.052506446838378906, -0.05004119873046875, -0.047575950622558594, -0.04511070251464844, -0.04264545440673828, -0.040180206298828125, -0.03771495819091797, -0.03524971008300781, -0.032784461975097656, -0.0303192138671875, -0.027853965759277344, -0.025388717651367188, -0.02292346954345703, -0.020458221435546875, -0.01799297332763672, -0.015527725219726562, -0.013062477111816406, -0.01059722900390625, -0.008131980895996094, -0.0056667327880859375, -0.0032014846801757812, -0.000736236572265625, 0.0017290115356445312, 0.0041942596435546875, 0.006659507751464844, 0.009124755859375, 0.011590003967285156, 0.014055252075195312, 0.01652050018310547, 0.018985748291015625, 0.02145099639892578, 0.023916244506835938, 0.026381492614746094, 0.02884674072265625, 0.031311988830566406, 0.03377723693847656, 0.03624248504638672, 0.038707733154296875, 0.04117298126220703, 0.04363822937011719, 0.046103477478027344, 0.0485687255859375, 0.051033973693847656, 0.05349922180175781, 0.05596446990966797, 0.058429718017578125, 0.06089496612548828, 0.06336021423339844, 0.0658254623413086, 0.06829071044921875, 0.0707559585571289, 0.07322120666503906, 0.07568645477294922, 0.07815170288085938, 0.08061695098876953, 0.08308219909667969, 0.08554744720458984, 0.0880126953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 36.0, 158.0, 392.0, 302.0, 79.0, 19.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0699462890625, -0.06787872314453125, -0.0658111572265625, -0.06374359130859375, -0.061676025390625, -0.05960845947265625, -0.0575408935546875, -0.05547332763671875, -0.05340576171875, -0.05133819580078125, -0.0492706298828125, -0.04720306396484375, -0.045135498046875, -0.04306793212890625, -0.0410003662109375, -0.03893280029296875, -0.036865234375, -0.03479766845703125, -0.0327301025390625, -0.03066253662109375, -0.028594970703125, -0.02652740478515625, -0.0244598388671875, -0.02239227294921875, -0.02032470703125, -0.01825714111328125, -0.0161895751953125, -0.01412200927734375, -0.012054443359375, -0.00998687744140625, -0.0079193115234375, -0.00585174560546875, -0.0037841796875, -0.00171661376953125, 0.0003509521484375, 0.00241851806640625, 0.004486083984375, 0.00655364990234375, 0.0086212158203125, 0.01068878173828125, 0.01275634765625, 0.01482391357421875, 0.0168914794921875, 0.01895904541015625, 0.021026611328125, 0.02309417724609375, 0.0251617431640625, 0.02722930908203125, 0.029296875, 0.03136444091796875, 0.0334320068359375, 0.03549957275390625, 0.037567138671875, 0.03963470458984375, 0.0417022705078125, 0.04376983642578125, 0.04583740234375, 0.04790496826171875, 0.0499725341796875, 0.05204010009765625, 0.054107666015625, 0.05617523193359375, 0.0582427978515625, 0.06031036376953125, 0.0623779296875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 13.0, 11.0, 21.0, 27.0, 44.0, 77.0, 113.0, 243.0, 413.0, 1055.0, 3805.0, 33861.0, 3652893.0, 487478.0, 10804.0, 2012.0, 688.0, 316.0, 151.0, 87.0, 60.0, 29.0, 22.0, 15.0, 9.0, 9.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06700801849365234, -0.06468009948730469, -0.06235218048095703, -0.060024261474609375, -0.05769634246826172, -0.05536842346191406, -0.053040504455566406, -0.05071258544921875, -0.048384666442871094, -0.04605674743652344, -0.04372882843017578, -0.041400909423828125, -0.03907299041748047, -0.03674507141113281, -0.034417152404785156, -0.0320892333984375, -0.029761314392089844, -0.027433395385742188, -0.02510547637939453, -0.022777557373046875, -0.02044963836669922, -0.018121719360351562, -0.015793800354003906, -0.01346588134765625, -0.011137962341308594, -0.008810043334960938, -0.006482124328613281, -0.004154205322265625, -0.0018262863159179688, 0.0005016326904296875, 0.0028295516967773438, 0.005157470703125, 0.007485389709472656, 0.009813308715820312, 0.012141227722167969, 0.014469146728515625, 0.01679706573486328, 0.019124984741210938, 0.021452903747558594, 0.02378082275390625, 0.026108741760253906, 0.028436660766601562, 0.03076457977294922, 0.033092498779296875, 0.03542041778564453, 0.03774833679199219, 0.040076255798339844, 0.0424041748046875, 0.044732093811035156, 0.04706001281738281, 0.04938793182373047, 0.051715850830078125, 0.05404376983642578, 0.05637168884277344, 0.058699607849121094, 0.06102752685546875, 0.0633554458618164, 0.06568336486816406, 0.06801128387451172, 0.07033920288085938, 0.07266712188720703, 0.07499504089355469, 0.07732295989990234, 0.07965087890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 5.0, 14.0, 18.0, 26.0, 33.0, 48.0, 73.0, 133.0, 179.0, 243.0, 378.0, 508.0, 591.0, 544.0, 376.0, 276.0, 194.0, 138.0, 73.0, 70.0, 42.0, 39.0, 27.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027923583984375, -0.027040958404541016, -0.02615833282470703, -0.025275707244873047, -0.024393081665039062, -0.023510456085205078, -0.022627830505371094, -0.02174520492553711, -0.020862579345703125, -0.01997995376586914, -0.019097328186035156, -0.018214702606201172, -0.017332077026367188, -0.016449451446533203, -0.015566825866699219, -0.014684200286865234, -0.01380157470703125, -0.012918949127197266, -0.012036323547363281, -0.011153697967529297, -0.010271072387695312, -0.009388446807861328, -0.008505821228027344, -0.007623195648193359, -0.006740570068359375, -0.005857944488525391, -0.004975318908691406, -0.004092693328857422, -0.0032100677490234375, -0.002327442169189453, -0.0014448165893554688, -0.0005621910095214844, 0.0003204345703125, 0.0012030601501464844, 0.0020856857299804688, 0.002968311309814453, 0.0038509368896484375, 0.004733562469482422, 0.005616188049316406, 0.006498813629150391, 0.007381439208984375, 0.00826406478881836, 0.009146690368652344, 0.010029315948486328, 0.010911941528320312, 0.011794567108154297, 0.012677192687988281, 0.013559818267822266, 0.01444244384765625, 0.015325069427490234, 0.01620769500732422, 0.017090320587158203, 0.017972946166992188, 0.018855571746826172, 0.019738197326660156, 0.02062082290649414, 0.021503448486328125, 0.02238607406616211, 0.023268699645996094, 0.024151325225830078, 0.025033950805664062, 0.025916576385498047, 0.02679920196533203, 0.027681827545166016, 0.028564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 35.0, 154.0, 408.0, 299.0, 85.0, 14.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29196077585220337, -0.28144949674606323, -0.2709381878376007, -0.2604268789291382, -0.24991559982299805, -0.23940430581569672, -0.22889301180839539, -0.21838171780109406, -0.20787042379379272, -0.1973591297864914, -0.18684783577919006, -0.17633654177188873, -0.1658252477645874, -0.15531395375728607, -0.14480265974998474, -0.1342913657426834, -0.12378007173538208, -0.11326877772808075, -0.10275748372077942, -0.09224618971347809, -0.08173489570617676, -0.07122360169887543, -0.0607123076915741, -0.050201013684272766, -0.039689719676971436, -0.029178425669670105, -0.018667131662368774, -0.008155837655067444, 0.0023554563522338867, 0.012866750359535217, 0.023378044366836548, 0.03388933837413788, 0.04440063238143921, 0.05491192638874054, 0.06542322039604187, 0.0759345144033432, 0.08644580841064453, 0.09695710241794586, 0.10746839642524719, 0.11797969043254852, 0.12849098443984985, 0.13900227844715118, 0.14951357245445251, 0.16002486646175385, 0.17053616046905518, 0.1810474544763565, 0.19155874848365784, 0.20207004249095917, 0.2125813364982605, 0.22309263050556183, 0.23360392451286316, 0.2441152185201645, 0.2546265125274658, 0.26513779163360596, 0.2756491005420685, 0.286160409450531, 0.29667168855667114, 0.3071829676628113, 0.3176942765712738, 0.32820558547973633, 0.33871686458587646, 0.3492281436920166, 0.3597394526004791, 0.37025076150894165, 0.3807620406150818]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 16.0, 12.0, 30.0, 26.0, 31.0, 34.0, 35.0, 47.0, 56.0, 62.0, 49.0, 65.0, 46.0, 55.0, 45.0, 37.0, 62.0, 46.0, 41.0, 34.0, 34.0, 27.0, 21.0, 16.0, 9.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11320865154266357, -0.10996858775615692, -0.10672852396965027, -0.10348846018314362, -0.10024839639663696, -0.09700833261013031, -0.09376827627420425, -0.0905282124876976, -0.08728814870119095, -0.0840480849146843, -0.08080802112817764, -0.07756795734167099, -0.07432790100574493, -0.07108783721923828, -0.06784777343273163, -0.06460770964622498, -0.06136764585971832, -0.05812758207321167, -0.05488751828670502, -0.05164745822548866, -0.04840739443898201, -0.04516733065247536, -0.041927270591259, -0.03868720680475235, -0.0354471430182457, -0.032207079231739044, -0.02896701730787754, -0.025726955384016037, -0.022486891597509384, -0.01924682781100273, -0.016006765887141228, -0.012766703963279724, -0.009526640176773071, -0.006286577321588993, -0.003046514466404915, 0.00019354838877916336, 0.0034336112439632416, 0.006673675030469894, 0.009913736954331398, 0.013153798878192902, 0.016393862664699554, 0.019633926451206207, 0.02287398837506771, 0.026114050298929214, 0.029354114085435867, 0.03259417787194252, 0.035834237933158875, 0.03907430171966553, 0.04231436550617218, 0.04555442929267883, 0.048794493079185486, 0.05203455314040184, 0.05527461692690849, 0.058514680713415146, 0.0617547407746315, 0.06499480456113815, 0.0682348683476448, 0.07147493213415146, 0.07471499592065811, 0.07795505970716476, 0.08119511604309082, 0.08443517982959747, 0.08767524361610413, 0.09091530740261078, 0.09415537118911743]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 10.0, 11.0, 12.0, 17.0, 25.0, 19.0, 26.0, 33.0, 38.0, 45.0, 52.0, 88.0, 111.0, 117.0, 185.0, 258.0, 330.0, 518.0, 873.0, 2107.0, 14428.0, 567752.0, 444861.0, 12059.0, 1932.0, 823.0, 471.0, 326.0, 227.0, 182.0, 126.0, 105.0, 67.0, 62.0, 50.0, 40.0, 34.0, 20.0, 27.0, 22.0, 17.0, 10.0, 9.0, 8.0, 6.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.094970703125, -0.09208965301513672, -0.08920860290527344, -0.08632755279541016, -0.08344650268554688, -0.0805654525756836, -0.07768440246582031, -0.07480335235595703, -0.07192230224609375, -0.06904125213623047, -0.06616020202636719, -0.0632791519165039, -0.060398101806640625, -0.057517051696777344, -0.05463600158691406, -0.05175495147705078, -0.0488739013671875, -0.04599285125732422, -0.04311180114746094, -0.040230751037597656, -0.037349700927734375, -0.034468650817871094, -0.03158760070800781, -0.02870655059814453, -0.02582550048828125, -0.02294445037841797, -0.020063400268554688, -0.017182350158691406, -0.014301300048828125, -0.011420249938964844, -0.008539199829101562, -0.005658149719238281, -0.002777099609375, 0.00010395050048828125, 0.0029850006103515625, 0.005866050720214844, 0.008747100830078125, 0.011628150939941406, 0.014509201049804688, 0.01739025115966797, 0.02027130126953125, 0.02315235137939453, 0.026033401489257812, 0.028914451599121094, 0.031795501708984375, 0.034676551818847656, 0.03755760192871094, 0.04043865203857422, 0.0433197021484375, 0.04620075225830078, 0.04908180236816406, 0.051962852478027344, 0.054843902587890625, 0.057724952697753906, 0.06060600280761719, 0.06348705291748047, 0.06636810302734375, 0.06924915313720703, 0.07213020324707031, 0.0750112533569336, 0.07789230346679688, 0.08077335357666016, 0.08365440368652344, 0.08653545379638672, 0.08941650390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 23.0, 112.0, 355.0, 367.0, 109.0, 27.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0677490234375, -0.06569957733154297, -0.06365013122558594, -0.061600685119628906, -0.059551239013671875, -0.057501792907714844, -0.05545234680175781, -0.05340290069580078, -0.05135345458984375, -0.04930400848388672, -0.04725456237792969, -0.045205116271972656, -0.043155670166015625, -0.041106224060058594, -0.03905677795410156, -0.03700733184814453, -0.0349578857421875, -0.03290843963623047, -0.030858993530273438, -0.028809547424316406, -0.026760101318359375, -0.024710655212402344, -0.022661209106445312, -0.02061176300048828, -0.01856231689453125, -0.01651287078857422, -0.014463424682617188, -0.012413978576660156, -0.010364532470703125, -0.008315086364746094, -0.0062656402587890625, -0.004216194152832031, -0.002166748046875, -0.00011730194091796875, 0.0019321441650390625, 0.003981590270996094, 0.006031036376953125, 0.008080482482910156, 0.010129928588867188, 0.012179374694824219, 0.01422882080078125, 0.01627826690673828, 0.018327713012695312, 0.020377159118652344, 0.022426605224609375, 0.024476051330566406, 0.026525497436523438, 0.02857494354248047, 0.0306243896484375, 0.03267383575439453, 0.03472328186035156, 0.036772727966308594, 0.038822174072265625, 0.040871620178222656, 0.04292106628417969, 0.04497051239013672, 0.04701995849609375, 0.04906940460205078, 0.05111885070800781, 0.053168296813964844, 0.055217742919921875, 0.057267189025878906, 0.05931663513183594, 0.06136608123779297, 0.06341552734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 2.0, 7.0, 9.0, 10.0, 16.0, 15.0, 25.0, 24.0, 44.0, 73.0, 125.0, 177.0, 423.0, 928.0, 3032.0, 69056.0, 957748.0, 13518.0, 1865.0, 676.0, 318.0, 158.0, 82.0, 58.0, 36.0, 20.0, 25.0, 13.0, 15.0, 10.0, 10.0, 6.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1761474609375, -0.17101478576660156, -0.16588211059570312, -0.1607494354248047, -0.15561676025390625, -0.1504840850830078, -0.14535140991210938, -0.14021873474121094, -0.1350860595703125, -0.12995338439941406, -0.12482070922851562, -0.11968803405761719, -0.11455535888671875, -0.10942268371582031, -0.10429000854492188, -0.09915733337402344, -0.094024658203125, -0.08889198303222656, -0.08375930786132812, -0.07862663269042969, -0.07349395751953125, -0.06836128234863281, -0.06322860717773438, -0.05809593200683594, -0.0529632568359375, -0.04783058166503906, -0.042697906494140625, -0.03756523132324219, -0.03243255615234375, -0.027299880981445312, -0.022167205810546875, -0.017034530639648438, -0.01190185546875, -0.0067691802978515625, -0.001636505126953125, 0.0034961700439453125, 0.00862884521484375, 0.013761520385742188, 0.018894195556640625, 0.024026870727539062, 0.0291595458984375, 0.03429222106933594, 0.039424896240234375, 0.04455757141113281, 0.04969024658203125, 0.05482292175292969, 0.059955596923828125, 0.06508827209472656, 0.070220947265625, 0.07535362243652344, 0.08048629760742188, 0.08561897277832031, 0.09075164794921875, 0.09588432312011719, 0.10101699829101562, 0.10614967346191406, 0.1112823486328125, 0.11641502380371094, 0.12154769897460938, 0.1266803741455078, 0.13181304931640625, 0.1369457244873047, 0.14207839965820312, 0.14721107482910156, 0.15234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 9.0, 17.0, 9.0, 14.0, 21.0, 24.0, 25.0, 28.0, 33.0, 34.0, 38.0, 51.0, 49.0, 47.0, 46.0, 57.0, 43.0, 48.0, 52.0, 37.0, 49.0, 37.0, 40.0, 28.0, 25.0, 23.0, 16.0, 18.0, 13.0, 9.0, 11.0, 5.0, 9.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.03936767578125, -0.03816032409667969, -0.036952972412109375, -0.03574562072753906, -0.03453826904296875, -0.03333091735839844, -0.032123565673828125, -0.030916213989257812, -0.0297088623046875, -0.028501510620117188, -0.027294158935546875, -0.026086807250976562, -0.02487945556640625, -0.023672103881835938, -0.022464752197265625, -0.021257400512695312, -0.020050048828125, -0.018842697143554688, -0.017635345458984375, -0.016427993774414062, -0.01522064208984375, -0.014013290405273438, -0.012805938720703125, -0.011598587036132812, -0.0103912353515625, -0.009183883666992188, -0.007976531982421875, -0.0067691802978515625, -0.00556182861328125, -0.0043544769287109375, -0.003147125244140625, -0.0019397735595703125, -0.000732421875, 0.0004749298095703125, 0.001682281494140625, 0.0028896331787109375, 0.00409698486328125, 0.0053043365478515625, 0.006511688232421875, 0.0077190399169921875, 0.0089263916015625, 0.010133743286132812, 0.011341094970703125, 0.012548446655273438, 0.01375579833984375, 0.014963150024414062, 0.016170501708984375, 0.017377853393554688, 0.018585205078125, 0.019792556762695312, 0.020999908447265625, 0.022207260131835938, 0.02341461181640625, 0.024621963500976562, 0.025829315185546875, 0.027036666870117188, 0.0282440185546875, 0.029451370239257812, 0.030658721923828125, 0.03186607360839844, 0.03307342529296875, 0.03428077697753906, 0.035488128662109375, 0.03669548034667969, 0.03790283203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 13.0, 16.0, 16.0, 30.0, 53.0, 57.0, 90.0, 139.0, 241.0, 388.0, 684.0, 1309.0, 3046.0, 9108.0, 45347.0, 528133.0, 409452.0, 36764.0, 8083.0, 2733.0, 1197.0, 637.0, 363.0, 234.0, 139.0, 77.0, 55.0, 41.0, 33.0, 23.0, 14.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0216827392578125, -0.020906925201416016, -0.02013111114501953, -0.019355297088623047, -0.018579483032226562, -0.017803668975830078, -0.017027854919433594, -0.01625204086303711, -0.015476226806640625, -0.01470041275024414, -0.013924598693847656, -0.013148784637451172, -0.012372970581054688, -0.011597156524658203, -0.010821342468261719, -0.010045528411865234, -0.00926971435546875, -0.008493900299072266, -0.007718086242675781, -0.006942272186279297, -0.0061664581298828125, -0.005390644073486328, -0.004614830017089844, -0.0038390159606933594, -0.003063201904296875, -0.0022873878479003906, -0.0015115737915039062, -0.0007357597351074219, 4.00543212890625e-05, 0.0008158683776855469, 0.0015916824340820312, 0.0023674964904785156, 0.003143310546875, 0.003919124603271484, 0.004694938659667969, 0.005470752716064453, 0.0062465667724609375, 0.007022380828857422, 0.007798194885253906, 0.00857400894165039, 0.009349822998046875, 0.01012563705444336, 0.010901451110839844, 0.011677265167236328, 0.012453079223632812, 0.013228893280029297, 0.014004707336425781, 0.014780521392822266, 0.01555633544921875, 0.016332149505615234, 0.01710796356201172, 0.017883777618408203, 0.018659591674804688, 0.019435405731201172, 0.020211219787597656, 0.02098703384399414, 0.021762847900390625, 0.02253866195678711, 0.023314476013183594, 0.024090290069580078, 0.024866104125976562, 0.025641918182373047, 0.02641773223876953, 0.027193546295166016, 0.0279693603515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 4.0, 15.0, 10.0, 12.0, 12.0, 22.0, 28.0, 35.0, 45.0, 71.0, 78.0, 107.0, 113.0, 106.0, 95.0, 63.0, 38.0, 32.0, 25.0, 18.0, 12.0, 7.0, 6.0, 8.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265806198120117e-05, -7.059238851070404e-05, -6.852671504020691e-05, -6.646104156970978e-05, -6.439536809921265e-05, -6.232969462871552e-05, -6.0264021158218384e-05, -5.819834768772125e-05, -5.613267421722412e-05, -5.406700074672699e-05, -5.200132727622986e-05, -4.993565380573273e-05, -4.7869980335235596e-05, -4.5804306864738464e-05, -4.373863339424133e-05, -4.16729599237442e-05, -3.960728645324707e-05, -3.754161298274994e-05, -3.547593951225281e-05, -3.3410266041755676e-05, -3.1344592571258545e-05, -2.9278919100761414e-05, -2.7213245630264282e-05, -2.514757215976715e-05, -2.308189868927002e-05, -2.1016225218772888e-05, -1.8950551748275757e-05, -1.6884878277778625e-05, -1.4819204807281494e-05, -1.2753531336784363e-05, -1.0687857866287231e-05, -8.6221843957901e-06, -6.556510925292969e-06, -4.490837454795837e-06, -2.425163984298706e-06, -3.594905138015747e-07, 1.7061829566955566e-06, 3.771856427192688e-06, 5.837529897689819e-06, 7.90320336818695e-06, 9.968876838684082e-06, 1.2034550309181213e-05, 1.4100223779678345e-05, 1.6165897250175476e-05, 1.8231570720672607e-05, 2.029724419116974e-05, 2.236291766166687e-05, 2.4428591132164e-05, 2.6494264602661133e-05, 2.8559938073158264e-05, 3.0625611543655396e-05, 3.269128501415253e-05, 3.475695848464966e-05, 3.682263195514679e-05, 3.888830542564392e-05, 4.095397889614105e-05, 4.3019652366638184e-05, 4.5085325837135315e-05, 4.7150999307632446e-05, 4.921667277812958e-05, 5.128234624862671e-05, 5.334801971912384e-05, 5.541369318962097e-05, 5.74793666601181e-05, 5.9545040130615234e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 14.0, 11.0, 12.0, 29.0, 30.0, 58.0, 91.0, 174.0, 341.0, 798.0, 2575.0, 23682.0, 886254.0, 126727.0, 5463.0, 1258.0, 431.0, 218.0, 149.0, 67.0, 60.0, 28.0, 19.0, 7.0, 9.0, 9.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050323486328125, -0.048914432525634766, -0.04750537872314453, -0.0460963249206543, -0.04468727111816406, -0.04327821731567383, -0.041869163513183594, -0.04046010971069336, -0.039051055908203125, -0.03764200210571289, -0.036232948303222656, -0.03482389450073242, -0.03341484069824219, -0.03200578689575195, -0.03059673309326172, -0.029187679290771484, -0.02777862548828125, -0.026369571685791016, -0.02496051788330078, -0.023551464080810547, -0.022142410278320312, -0.020733356475830078, -0.019324302673339844, -0.01791524887084961, -0.016506195068359375, -0.01509714126586914, -0.013688087463378906, -0.012279033660888672, -0.010869979858398438, -0.009460926055908203, -0.008051872253417969, -0.006642818450927734, -0.0052337646484375, -0.0038247108459472656, -0.0024156570434570312, -0.0010066032409667969, 0.0004024505615234375, 0.0018115043640136719, 0.0032205581665039062, 0.004629611968994141, 0.006038665771484375, 0.007447719573974609, 0.008856773376464844, 0.010265827178955078, 0.011674880981445312, 0.013083934783935547, 0.014492988586425781, 0.015902042388916016, 0.01731109619140625, 0.018720149993896484, 0.02012920379638672, 0.021538257598876953, 0.022947311401367188, 0.024356365203857422, 0.025765419006347656, 0.02717447280883789, 0.028583526611328125, 0.02999258041381836, 0.031401634216308594, 0.03281068801879883, 0.03421974182128906, 0.0356287956237793, 0.03703784942626953, 0.038446903228759766, 0.03985595703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 6.0, 9.0, 10.0, 19.0, 23.0, 29.0, 41.0, 47.0, 55.0, 79.0, 72.0, 113.0, 107.0, 90.0, 70.0, 51.0, 22.0, 36.0, 26.0, 10.0, 14.0, 15.0, 17.0, 12.0, 11.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01297760009765625, -0.012528538703918457, -0.012079477310180664, -0.011630415916442871, -0.011181354522705078, -0.010732293128967285, -0.010283231735229492, -0.0098341703414917, -0.009385108947753906, -0.008936047554016113, -0.00848698616027832, -0.008037924766540527, -0.007588863372802734, -0.007139801979064941, -0.0066907405853271484, -0.0062416791915893555, -0.0057926177978515625, -0.0053435564041137695, -0.0048944950103759766, -0.004445433616638184, -0.003996372222900391, -0.0035473108291625977, -0.0030982494354248047, -0.0026491880416870117, -0.0022001266479492188, -0.0017510652542114258, -0.0013020038604736328, -0.0008529424667358398, -0.0004038810729980469, 4.5180320739746094e-05, 0.0004942417144775391, 0.000943303108215332, 0.001392364501953125, 0.001841425895690918, 0.002290487289428711, 0.002739548683166504, 0.003188610076904297, 0.00363767147064209, 0.004086732864379883, 0.004535794258117676, 0.004984855651855469, 0.005433917045593262, 0.005882978439331055, 0.006332039833068848, 0.006781101226806641, 0.007230162620544434, 0.0076792240142822266, 0.00812828540802002, 0.008577346801757812, 0.009026408195495605, 0.009475469589233398, 0.009924530982971191, 0.010373592376708984, 0.010822653770446777, 0.01127171516418457, 0.011720776557922363, 0.012169837951660156, 0.01261889934539795, 0.013067960739135742, 0.013517022132873535, 0.013966083526611328, 0.014415144920349121, 0.014864206314086914, 0.015313267707824707, 0.0157623291015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 14.0, 49.0, 158.0, 346.0, 250.0, 132.0, 31.0, 16.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32951870560646057, -0.32184770703315735, -0.3141767382621765, -0.3065057396888733, -0.29883474111557007, -0.29116377234458923, -0.283492773771286, -0.2758217751979828, -0.26815080642700195, -0.26047980785369873, -0.2528088390827179, -0.24513784050941467, -0.23746685683727264, -0.22979587316513062, -0.2221248745918274, -0.21445389091968536, -0.20678289234638214, -0.1991119086742401, -0.1914409101009369, -0.18376992642879486, -0.17609894275665283, -0.1684279441833496, -0.16075696051120758, -0.15308597683906555, -0.14541497826576233, -0.1377439945936203, -0.13007299602031708, -0.12240201234817505, -0.11473102867603302, -0.1070600375533104, -0.09938904643058777, -0.09171806275844574, -0.0840470939874649, -0.07637610286474228, -0.06870511919260025, -0.061034128069877625, -0.0533631406724453, -0.04569215327501297, -0.038021162152290344, -0.030350174754858017, -0.02267918735742569, -0.015008199028670788, -0.007337210699915886, 0.0003337785601615906, 0.008004765957593918, 0.015675753355026245, 0.02334674447774887, 0.031017731875181198, 0.038688719272613525, 0.04635970667004585, 0.05403069406747818, 0.061701685190200806, 0.06937266886234283, 0.07704365998506546, 0.08471465110778809, 0.09238563477993011, 0.10005662590265274, 0.10772761702537537, 0.1153986006975174, 0.12306959182024002, 0.13074058294296265, 0.13841156661510468, 0.1460825502872467, 0.15375354886054993, 0.16142453253269196]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 9.0, 16.0, 11.0, 18.0, 25.0, 28.0, 35.0, 48.0, 44.0, 59.0, 63.0, 65.0, 55.0, 67.0, 57.0, 57.0, 58.0, 57.0, 37.0, 36.0, 34.0, 18.0, 30.0, 25.0, 13.0, 6.0, 9.0, 3.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16439300775527954, -0.15996703505516052, -0.1555410623550415, -0.1511150747537613, -0.14668910205364227, -0.14226312935352325, -0.13783714175224304, -0.13341116905212402, -0.128985196352005, -0.12455922365188599, -0.12013324350118637, -0.11570726335048676, -0.11128129065036774, -0.10685531795024872, -0.1024293377995491, -0.09800335764884949, -0.09357738494873047, -0.08915141224861145, -0.08472543209791183, -0.08029945194721222, -0.0758734792470932, -0.07144750654697418, -0.06702152639627457, -0.06259554624557495, -0.05816957354545593, -0.053743597120046616, -0.0493176206946373, -0.04489164426922798, -0.040465667843818665, -0.03603969141840935, -0.03161371499300003, -0.027187738567590714, -0.022761762142181396, -0.01833578571677208, -0.013909809291362762, -0.009483832865953445, -0.005057856440544128, -0.0006318800151348114, 0.0037940964102745056, 0.008220072835683823, 0.01264604926109314, 0.017072025686502457, 0.021498002111911774, 0.02592397853732109, 0.030349954962730408, 0.034775931388139725, 0.03920190781354904, 0.04362788423895836, 0.048053860664367676, 0.05247983708977699, 0.05690581351518631, 0.06133178994059563, 0.06575776636600494, 0.07018373906612396, 0.07460971921682358, 0.0790356993675232, 0.08346167206764221, 0.08788764476776123, 0.09231362491846085, 0.09673960506916046, 0.10116557776927948, 0.1055915504693985, 0.11001753062009811, 0.11444351077079773, 0.11886948347091675]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 17.0, 15.0, 26.0, 30.0, 50.0, 48.0, 87.0, 152.0, 262.0, 831.0, 2281.0, 4356.0, 7403.0, 64382.0, 3981059.0, 117434.0, 9033.0, 3226.0, 1392.0, 1049.0, 424.0, 207.0, 150.0, 72.0, 57.0, 53.0, 40.0, 28.0, 26.0, 11.0, 15.0, 11.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.055850982666015625, -0.05396270751953125, -0.052074432373046875, -0.0501861572265625, -0.048297882080078125, -0.04640960693359375, -0.044521331787109375, -0.042633056640625, -0.040744781494140625, -0.03885650634765625, -0.036968231201171875, -0.0350799560546875, -0.033191680908203125, -0.03130340576171875, -0.029415130615234375, -0.02752685546875, -0.025638580322265625, -0.02375030517578125, -0.021862030029296875, -0.0199737548828125, -0.018085479736328125, -0.01619720458984375, -0.014308929443359375, -0.012420654296875, -0.010532379150390625, -0.00864410400390625, -0.006755828857421875, -0.0048675537109375, -0.002979278564453125, -0.00109100341796875, 0.000797271728515625, 0.002685546875, 0.004573822021484375, 0.00646209716796875, 0.008350372314453125, 0.0102386474609375, 0.012126922607421875, 0.01401519775390625, 0.015903472900390625, 0.017791748046875, 0.019680023193359375, 0.02156829833984375, 0.023456573486328125, 0.0253448486328125, 0.027233123779296875, 0.02912139892578125, 0.031009674072265625, 0.03289794921875, 0.034786224365234375, 0.03667449951171875, 0.038562774658203125, 0.0404510498046875, 0.042339324951171875, 0.04422760009765625, 0.046115875244140625, 0.048004150390625, 0.049892425537109375, 0.05178070068359375, 0.053668975830078125, 0.0555572509765625, 0.057445526123046875, 0.05933380126953125, 0.061222076416015625, 0.0631103515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 12.0, 99.0, 281.0, 396.0, 172.0, 30.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06506109237670898, -0.06304454803466797, -0.06102800369262695, -0.05901145935058594, -0.05699491500854492, -0.054978370666503906, -0.05296182632446289, -0.050945281982421875, -0.04892873764038086, -0.046912193298339844, -0.04489564895629883, -0.04287910461425781, -0.0408625602722168, -0.03884601593017578, -0.036829471588134766, -0.03481292724609375, -0.032796382904052734, -0.03077983856201172, -0.028763294219970703, -0.026746749877929688, -0.024730205535888672, -0.022713661193847656, -0.02069711685180664, -0.018680572509765625, -0.01666402816772461, -0.014647483825683594, -0.012630939483642578, -0.010614395141601562, -0.008597850799560547, -0.006581306457519531, -0.004564762115478516, -0.0025482177734375, -0.0005316734313964844, 0.0014848709106445312, 0.003501415252685547, 0.0055179595947265625, 0.007534503936767578, 0.009551048278808594, 0.01156759262084961, 0.013584136962890625, 0.01560068130493164, 0.017617225646972656, 0.019633769989013672, 0.021650314331054688, 0.023666858673095703, 0.02568340301513672, 0.027699947357177734, 0.02971649169921875, 0.031733036041259766, 0.03374958038330078, 0.0357661247253418, 0.03778266906738281, 0.03979921340942383, 0.041815757751464844, 0.04383230209350586, 0.045848846435546875, 0.04786539077758789, 0.049881935119628906, 0.05189847946166992, 0.05391502380371094, 0.05593156814575195, 0.05794811248779297, 0.059964656829833984, 0.061981201171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 6.0, 11.0, 17.0, 13.0, 19.0, 47.0, 62.0, 80.0, 130.0, 243.0, 570.0, 2417.0, 71162.0, 4098435.0, 18316.0, 1746.0, 476.0, 217.0, 119.0, 70.0, 29.0, 27.0, 23.0, 14.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06658935546875, -0.06347370147705078, -0.06035804748535156, -0.057242393493652344, -0.054126739501953125, -0.051011085510253906, -0.04789543151855469, -0.04477977752685547, -0.04166412353515625, -0.03854846954345703, -0.03543281555175781, -0.032317161560058594, -0.029201507568359375, -0.026085853576660156, -0.022970199584960938, -0.01985454559326172, -0.0167388916015625, -0.013623237609863281, -0.010507583618164062, -0.007391929626464844, -0.004276275634765625, -0.0011606216430664062, 0.0019550323486328125, 0.005070686340332031, 0.00818634033203125, 0.011301994323730469, 0.014417648315429688, 0.017533302307128906, 0.020648956298828125, 0.023764610290527344, 0.026880264282226562, 0.02999591827392578, 0.033111572265625, 0.03622722625732422, 0.03934288024902344, 0.042458534240722656, 0.045574188232421875, 0.048689842224121094, 0.05180549621582031, 0.05492115020751953, 0.05803680419921875, 0.06115245819091797, 0.06426811218261719, 0.0673837661743164, 0.07049942016601562, 0.07361507415771484, 0.07673072814941406, 0.07984638214111328, 0.0829620361328125, 0.08607769012451172, 0.08919334411621094, 0.09230899810791016, 0.09542465209960938, 0.0985403060913086, 0.10165596008300781, 0.10477161407470703, 0.10788726806640625, 0.11100292205810547, 0.11411857604980469, 0.1172342300415039, 0.12034988403320312, 0.12346553802490234, 0.12658119201660156, 0.12969684600830078, 0.1328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 12.0, 22.0, 24.0, 46.0, 82.0, 114.0, 166.0, 276.0, 508.0, 779.0, 745.0, 487.0, 243.0, 165.0, 100.0, 82.0, 67.0, 38.0, 27.0, 14.0, 16.0, 11.0, 5.0, 8.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036224365234375, -0.035361289978027344, -0.03449821472167969, -0.03363513946533203, -0.032772064208984375, -0.03190898895263672, -0.031045913696289062, -0.030182838439941406, -0.02931976318359375, -0.028456687927246094, -0.027593612670898438, -0.02673053741455078, -0.025867462158203125, -0.02500438690185547, -0.024141311645507812, -0.023278236389160156, -0.0224151611328125, -0.021552085876464844, -0.020689010620117188, -0.01982593536376953, -0.018962860107421875, -0.01809978485107422, -0.017236709594726562, -0.016373634338378906, -0.01551055908203125, -0.014647483825683594, -0.013784408569335938, -0.012921333312988281, -0.012058258056640625, -0.011195182800292969, -0.010332107543945312, -0.009469032287597656, -0.00860595703125, -0.007742881774902344, -0.0068798065185546875, -0.006016731262207031, -0.005153656005859375, -0.004290580749511719, -0.0034275054931640625, -0.0025644302368164062, -0.00170135498046875, -0.0008382797241210938, 2.47955322265625e-05, 0.0008878707885742188, 0.001750946044921875, 0.0026140213012695312, 0.0034770965576171875, 0.004340171813964844, 0.0052032470703125, 0.006066322326660156, 0.0069293975830078125, 0.007792472839355469, 0.008655548095703125, 0.009518623352050781, 0.010381698608398438, 0.011244773864746094, 0.01210784912109375, 0.012970924377441406, 0.013833999633789062, 0.014697074890136719, 0.015560150146484375, 0.01642322540283203, 0.017286300659179688, 0.018149375915527344, 0.019012451171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 35.0, 183.0, 396.0, 271.0, 82.0, 21.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3306017816066742, -0.32248300313949585, -0.3143642246723175, -0.30624544620513916, -0.2981266677379608, -0.29000788927078247, -0.2818891108036041, -0.2737703323364258, -0.26565152406692505, -0.2575327455997467, -0.24941396713256836, -0.24129518866539001, -0.23317641019821167, -0.22505763173103333, -0.2169388383626938, -0.20882005989551544, -0.2007012963294983, -0.19258251786231995, -0.1844637393951416, -0.17634496092796326, -0.1682261824607849, -0.16010740399360657, -0.15198861062526703, -0.14386983215808868, -0.13575105369091034, -0.127632275223732, -0.11951349675655365, -0.11139471083879471, -0.10327593237161636, -0.09515715390443802, -0.08703836798667908, -0.07891958951950073, -0.07080078125, -0.06268200278282166, -0.05456322059035301, -0.04644443839788437, -0.038325659930706024, -0.03020688146352768, -0.022088099271059036, -0.013969317078590393, -0.005850538611412048, 0.0022682417184114456, 0.01038702204823494, 0.018505802378058434, 0.026624582707881927, 0.03474336117506027, 0.042862143367528915, 0.05098092555999756, 0.0590997040271759, 0.06721848249435425, 0.07533726096153259, 0.08345604687929153, 0.09157482534646988, 0.09969360381364822, 0.10781238973140717, 0.11593116819858551, 0.12404994666576385, 0.1321687251329422, 0.14028750360012054, 0.1484062820672989, 0.15652507543563843, 0.16464385390281677, 0.17276263236999512, 0.18088141083717346, 0.1890001893043518]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 20.0, 20.0, 29.0, 28.0, 39.0, 46.0, 49.0, 67.0, 55.0, 58.0, 66.0, 81.0, 54.0, 70.0, 62.0, 51.0, 44.0, 38.0, 34.0, 33.0, 13.0, 14.0, 9.0, 8.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11437290906906128, -0.11101101338863373, -0.10764911770820618, -0.10428722202777863, -0.10092532634735107, -0.09756343066692352, -0.09420154243707657, -0.09083964675664902, -0.08747775107622147, -0.08411585539579391, -0.08075395971536636, -0.07739206403493881, -0.07403017580509186, -0.0706682801246643, -0.06730638444423676, -0.0639444887638092, -0.06058259308338165, -0.0572206974029541, -0.05385880172252655, -0.0504969097673893, -0.047135014086961746, -0.043773118406534195, -0.04041122645139694, -0.03704933077096939, -0.03368743509054184, -0.03032553941011429, -0.026963645592331886, -0.023601751774549484, -0.020239856094121933, -0.01687796041369438, -0.01351606659591198, -0.010154172778129578, -0.006792277097702026, -0.0034303823485970497, -6.848759949207306e-05, 0.0032934071496129036, 0.00665530189871788, 0.010017197579145432, 0.013379091396927834, 0.016740985214710236, 0.020102880895137787, 0.023464776575565338, 0.02682667039334774, 0.030188564211130142, 0.033550459891557693, 0.036912355571985245, 0.0402742475271225, 0.04363614320755005, 0.0469980388879776, 0.05035993456840515, 0.0537218302488327, 0.057083722203969955, 0.06044561788439751, 0.06380751729011536, 0.06716940551996231, 0.07053130120038986, 0.07389319688081741, 0.07725509256124496, 0.08061698824167252, 0.08397888392210007, 0.08734077215194702, 0.09070266783237457, 0.09406456351280212, 0.09742645919322968, 0.10078835487365723]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 5.0, 16.0, 24.0, 14.0, 25.0, 27.0, 37.0, 56.0, 75.0, 99.0, 106.0, 154.0, 246.0, 342.0, 455.0, 861.0, 2063.0, 11319.0, 385453.0, 625560.0, 16362.0, 2405.0, 939.0, 587.0, 319.0, 241.0, 180.0, 145.0, 105.0, 85.0, 54.0, 38.0, 36.0, 31.0, 17.0, 9.0, 11.0, 6.0, 12.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 5.0], "bins": [-0.08221435546875, -0.07993507385253906, -0.07765579223632812, -0.07537651062011719, -0.07309722900390625, -0.07081794738769531, -0.06853866577148438, -0.06625938415527344, -0.0639801025390625, -0.06170082092285156, -0.059421539306640625, -0.05714225769042969, -0.05486297607421875, -0.05258369445800781, -0.050304412841796875, -0.04802513122558594, -0.045745849609375, -0.04346656799316406, -0.041187286376953125, -0.03890800476074219, -0.03662872314453125, -0.03434944152832031, -0.032070159912109375, -0.029790878295898438, -0.0275115966796875, -0.025232315063476562, -0.022953033447265625, -0.020673751831054688, -0.01839447021484375, -0.016115188598632812, -0.013835906982421875, -0.011556625366210938, -0.00927734375, -0.0069980621337890625, -0.004718780517578125, -0.0024394989013671875, -0.00016021728515625, 0.0021190643310546875, 0.004398345947265625, 0.0066776275634765625, 0.0089569091796875, 0.011236190795898438, 0.013515472412109375, 0.015794754028320312, 0.01807403564453125, 0.020353317260742188, 0.022632598876953125, 0.024911880493164062, 0.027191162109375, 0.029470443725585938, 0.031749725341796875, 0.03402900695800781, 0.03630828857421875, 0.03858757019042969, 0.040866851806640625, 0.04314613342285156, 0.0454254150390625, 0.04770469665527344, 0.049983978271484375, 0.05226325988769531, 0.05454254150390625, 0.05682182312011719, 0.059101104736328125, 0.06138038635253906, 0.06365966796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 92.0, 277.0, 403.0, 175.0, 33.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0645751953125, -0.06263542175292969, -0.060695648193359375, -0.05875587463378906, -0.05681610107421875, -0.05487632751464844, -0.052936553955078125, -0.05099678039550781, -0.0490570068359375, -0.04711723327636719, -0.045177459716796875, -0.04323768615722656, -0.04129791259765625, -0.03935813903808594, -0.037418365478515625, -0.03547859191894531, -0.033538818359375, -0.03159904479980469, -0.029659271240234375, -0.027719497680664062, -0.02577972412109375, -0.023839950561523438, -0.021900177001953125, -0.019960403442382812, -0.0180206298828125, -0.016080856323242188, -0.014141082763671875, -0.012201309204101562, -0.01026153564453125, -0.008321762084960938, -0.006381988525390625, -0.0044422149658203125, -0.00250244140625, -0.0005626678466796875, 0.001377105712890625, 0.0033168792724609375, 0.00525665283203125, 0.0071964263916015625, 0.009136199951171875, 0.011075973510742188, 0.0130157470703125, 0.014955520629882812, 0.016895294189453125, 0.018835067749023438, 0.02077484130859375, 0.022714614868164062, 0.024654388427734375, 0.026594161987304688, 0.028533935546875, 0.030473709106445312, 0.032413482666015625, 0.03435325622558594, 0.03629302978515625, 0.03823280334472656, 0.040172576904296875, 0.04211235046386719, 0.0440521240234375, 0.04599189758300781, 0.047931671142578125, 0.04987144470214844, 0.05181121826171875, 0.05375099182128906, 0.055690765380859375, 0.05763053894042969, 0.0595703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 10.0, 16.0, 19.0, 21.0, 25.0, 29.0, 27.0, 36.0, 48.0, 43.0, 71.0, 91.0, 121.0, 227.0, 328.0, 613.0, 1336.0, 4568.0, 26274.0, 294981.0, 637482.0, 68752.0, 9067.0, 2160.0, 855.0, 450.0, 273.0, 160.0, 111.0, 79.0, 68.0, 29.0, 41.0, 28.0, 29.0, 19.0, 16.0, 23.0, 6.0, 2.0, 10.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0455322265625, -0.044161319732666016, -0.04279041290283203, -0.04141950607299805, -0.04004859924316406, -0.03867769241333008, -0.037306785583496094, -0.03593587875366211, -0.034564971923828125, -0.03319406509399414, -0.031823158264160156, -0.030452251434326172, -0.029081344604492188, -0.027710437774658203, -0.02633953094482422, -0.024968624114990234, -0.02359771728515625, -0.022226810455322266, -0.02085590362548828, -0.019484996795654297, -0.018114089965820312, -0.016743183135986328, -0.015372276306152344, -0.01400136947631836, -0.012630462646484375, -0.01125955581665039, -0.009888648986816406, -0.008517742156982422, -0.0071468353271484375, -0.005775928497314453, -0.004405021667480469, -0.0030341148376464844, -0.0016632080078125, -0.0002923011779785156, 0.0010786056518554688, 0.002449512481689453, 0.0038204193115234375, 0.005191326141357422, 0.006562232971191406, 0.00793313980102539, 0.009304046630859375, 0.01067495346069336, 0.012045860290527344, 0.013416767120361328, 0.014787673950195312, 0.016158580780029297, 0.01752948760986328, 0.018900394439697266, 0.02027130126953125, 0.021642208099365234, 0.02301311492919922, 0.024384021759033203, 0.025754928588867188, 0.027125835418701172, 0.028496742248535156, 0.02986764907836914, 0.031238555908203125, 0.03260946273803711, 0.033980369567871094, 0.03535127639770508, 0.03672218322753906, 0.03809309005737305, 0.03946399688720703, 0.040834903717041016, 0.042205810546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 12.0, 7.0, 9.0, 14.0, 12.0, 7.0, 25.0, 24.0, 24.0, 28.0, 30.0, 36.0, 33.0, 41.0, 40.0, 43.0, 32.0, 50.0, 33.0, 43.0, 40.0, 33.0, 38.0, 26.0, 30.0, 43.0, 29.0, 25.0, 27.0, 18.0, 16.0, 19.0, 19.0, 10.0, 10.0, 15.0, 11.0, 7.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0254974365234375, -0.02466559410095215, -0.023833751678466797, -0.023001909255981445, -0.022170066833496094, -0.021338224411010742, -0.02050638198852539, -0.01967453956604004, -0.018842697143554688, -0.018010854721069336, -0.017179012298583984, -0.016347169876098633, -0.015515327453613281, -0.01468348503112793, -0.013851642608642578, -0.013019800186157227, -0.012187957763671875, -0.011356115341186523, -0.010524272918701172, -0.00969243049621582, -0.008860588073730469, -0.008028745651245117, -0.007196903228759766, -0.006365060806274414, -0.0055332183837890625, -0.004701375961303711, -0.0038695335388183594, -0.003037691116333008, -0.0022058486938476562, -0.0013740062713623047, -0.0005421638488769531, 0.00028967857360839844, 0.00112152099609375, 0.0019533634185791016, 0.002785205841064453, 0.0036170482635498047, 0.004448890686035156, 0.005280733108520508, 0.006112575531005859, 0.006944417953491211, 0.0077762603759765625, 0.008608102798461914, 0.009439945220947266, 0.010271787643432617, 0.011103630065917969, 0.01193547248840332, 0.012767314910888672, 0.013599157333374023, 0.014430999755859375, 0.015262842178344727, 0.016094684600830078, 0.01692652702331543, 0.01775836944580078, 0.018590211868286133, 0.019422054290771484, 0.020253896713256836, 0.021085739135742188, 0.02191758155822754, 0.02274942398071289, 0.023581266403198242, 0.024413108825683594, 0.025244951248168945, 0.026076793670654297, 0.02690863609313965, 0.027740478515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 7.0, 9.0, 14.0, 13.0, 19.0, 30.0, 50.0, 62.0, 94.0, 173.0, 236.0, 288.0, 458.0, 723.0, 1119.0, 1737.0, 3087.0, 6507.0, 17019.0, 88354.0, 752327.0, 138333.0, 21427.0, 7471.0, 3592.0, 1973.0, 1119.0, 728.0, 508.0, 333.0, 218.0, 164.0, 97.0, 87.0, 58.0, 34.0, 23.0, 19.0, 14.0, 10.0, 9.0, 8.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019012451171875, -0.01836991310119629, -0.017727375030517578, -0.017084836959838867, -0.016442298889160156, -0.015799760818481445, -0.015157222747802734, -0.014514684677124023, -0.013872146606445312, -0.013229608535766602, -0.01258707046508789, -0.01194453239440918, -0.011301994323730469, -0.010659456253051758, -0.010016918182373047, -0.009374380111694336, -0.008731842041015625, -0.008089303970336914, -0.007446765899658203, -0.006804227828979492, -0.006161689758300781, -0.00551915168762207, -0.004876613616943359, -0.0042340755462646484, -0.0035915374755859375, -0.0029489994049072266, -0.0023064613342285156, -0.0016639232635498047, -0.0010213851928710938, -0.0003788471221923828, 0.0002636909484863281, 0.0009062290191650391, 0.00154876708984375, 0.002191305160522461, 0.002833843231201172, 0.003476381301879883, 0.004118919372558594, 0.004761457443237305, 0.005403995513916016, 0.0060465335845947266, 0.0066890716552734375, 0.0073316097259521484, 0.00797414779663086, 0.00861668586730957, 0.009259223937988281, 0.009901762008666992, 0.010544300079345703, 0.011186838150024414, 0.011829376220703125, 0.012471914291381836, 0.013114452362060547, 0.013756990432739258, 0.014399528503417969, 0.01504206657409668, 0.01568460464477539, 0.0163271427154541, 0.016969680786132812, 0.017612218856811523, 0.018254756927490234, 0.018897294998168945, 0.019539833068847656, 0.020182371139526367, 0.020824909210205078, 0.02146744728088379, 0.0221099853515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 7.0, 9.0, 19.0, 17.0, 18.0, 23.0, 29.0, 29.0, 66.0, 60.0, 138.0, 154.0, 107.0, 74.0, 56.0, 31.0, 23.0, 18.0, 16.0, 14.0, 15.0, 9.0, 9.0, 5.0, 11.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.395578384399414e-05, -6.152968853712082e-05, -5.91035932302475e-05, -5.6677497923374176e-05, -5.4251402616500854e-05, -5.182530730962753e-05, -4.939921200275421e-05, -4.697311669588089e-05, -4.454702138900757e-05, -4.212092608213425e-05, -3.9694830775260925e-05, -3.7268735468387604e-05, -3.484264016151428e-05, -3.241654485464096e-05, -2.999044954776764e-05, -2.7564354240894318e-05, -2.5138258934020996e-05, -2.2712163627147675e-05, -2.0286068320274353e-05, -1.785997301340103e-05, -1.543387770652771e-05, -1.3007782399654388e-05, -1.0581687092781067e-05, -8.155591785907745e-06, -5.729496479034424e-06, -3.3034011721611023e-06, -8.773058652877808e-07, 1.5487894415855408e-06, 3.974884748458862e-06, 6.400980055332184e-06, 8.827075362205505e-06, 1.1253170669078827e-05, 1.3679265975952148e-05, 1.610536128282547e-05, 1.853145658969879e-05, 2.0957551896572113e-05, 2.3383647203445435e-05, 2.5809742510318756e-05, 2.8235837817192078e-05, 3.06619331240654e-05, 3.308802843093872e-05, 3.551412373781204e-05, 3.7940219044685364e-05, 4.0366314351558685e-05, 4.279240965843201e-05, 4.521850496530533e-05, 4.764460027217865e-05, 5.007069557905197e-05, 5.249679088592529e-05, 5.4922886192798615e-05, 5.7348981499671936e-05, 5.977507680654526e-05, 6.220117211341858e-05, 6.46272674202919e-05, 6.705336272716522e-05, 6.947945803403854e-05, 7.190555334091187e-05, 7.433164864778519e-05, 7.675774395465851e-05, 7.918383926153183e-05, 8.160993456840515e-05, 8.403602987527847e-05, 8.64621251821518e-05, 8.888822048902512e-05, 9.131431579589844e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 11.0, 25.0, 27.0, 26.0, 58.0, 79.0, 147.0, 238.0, 473.0, 961.0, 2164.0, 5702.0, 22963.0, 236618.0, 707359.0, 55458.0, 10180.0, 3337.0, 1326.0, 578.0, 329.0, 166.0, 110.0, 60.0, 39.0, 21.0, 19.0, 12.0, 8.0, 10.0, 3.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.018902063369750977, -0.018181324005126953, -0.01746058464050293, -0.016739845275878906, -0.016019105911254883, -0.01529836654663086, -0.014577627182006836, -0.013856887817382812, -0.013136148452758789, -0.012415409088134766, -0.011694669723510742, -0.010973930358886719, -0.010253190994262695, -0.009532451629638672, -0.008811712265014648, -0.008090972900390625, -0.0073702335357666016, -0.006649494171142578, -0.005928754806518555, -0.005208015441894531, -0.004487276077270508, -0.0037665367126464844, -0.003045797348022461, -0.0023250579833984375, -0.001604318618774414, -0.0008835792541503906, -0.0001628398895263672, 0.0005578994750976562, 0.0012786388397216797, 0.001999378204345703, 0.0027201175689697266, 0.00344085693359375, 0.0041615962982177734, 0.004882335662841797, 0.00560307502746582, 0.006323814392089844, 0.007044553756713867, 0.007765293121337891, 0.008486032485961914, 0.009206771850585938, 0.009927511215209961, 0.010648250579833984, 0.011368989944458008, 0.012089729309082031, 0.012810468673706055, 0.013531208038330078, 0.014251947402954102, 0.014972686767578125, 0.01569342613220215, 0.016414165496826172, 0.017134904861450195, 0.01785564422607422, 0.018576383590698242, 0.019297122955322266, 0.02001786231994629, 0.020738601684570312, 0.021459341049194336, 0.02218008041381836, 0.022900819778442383, 0.023621559143066406, 0.02434229850769043, 0.025063037872314453, 0.025783777236938477, 0.0265045166015625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 8.0, 9.0, 7.0, 27.0, 26.0, 40.0, 68.0, 118.0, 157.0, 169.0, 103.0, 93.0, 53.0, 38.0, 18.0, 16.0, 11.0, 3.0, 10.0, 6.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0193328857421875, -0.018838882446289062, -0.018344879150390625, -0.017850875854492188, -0.01735687255859375, -0.016862869262695312, -0.016368865966796875, -0.015874862670898438, -0.015380859375, -0.014886856079101562, -0.014392852783203125, -0.013898849487304688, -0.01340484619140625, -0.012910842895507812, -0.012416839599609375, -0.011922836303710938, -0.0114288330078125, -0.010934829711914062, -0.010440826416015625, -0.009946823120117188, -0.00945281982421875, -0.008958816528320312, -0.008464813232421875, -0.007970809936523438, -0.007476806640625, -0.0069828033447265625, -0.006488800048828125, -0.0059947967529296875, -0.00550079345703125, -0.0050067901611328125, -0.004512786865234375, -0.0040187835693359375, -0.0035247802734375, -0.0030307769775390625, -0.002536773681640625, -0.0020427703857421875, -0.00154876708984375, -0.0010547637939453125, -0.000560760498046875, -6.67572021484375e-05, 0.00042724609375, 0.0009212493896484375, 0.001415252685546875, 0.0019092559814453125, 0.00240325927734375, 0.0028972625732421875, 0.003391265869140625, 0.0038852691650390625, 0.0043792724609375, 0.0048732757568359375, 0.005367279052734375, 0.0058612823486328125, 0.00635528564453125, 0.0068492889404296875, 0.007343292236328125, 0.007837295532226562, 0.008331298828125, 0.008825302124023438, 0.009319305419921875, 0.009813308715820312, 0.01030731201171875, 0.010801315307617188, 0.011295318603515625, 0.011789321899414062, 0.0122833251953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 18.0, 303.0, 621.0, 55.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7951155304908752, -0.7753276228904724, -0.7555397152900696, -0.735751748085022, -0.7159638404846191, -0.6961759328842163, -0.6763880252838135, -0.6566001176834106, -0.636812150478363, -0.6170242428779602, -0.5972363352775574, -0.5774483680725098, -0.5576604604721069, -0.5378725528717041, -0.5180846452713013, -0.49829670786857605, -0.4785088002681732, -0.4587208926677704, -0.43893295526504517, -0.41914504766464233, -0.3993571102619171, -0.3795692026615143, -0.35978126525878906, -0.33999335765838623, -0.3202054500579834, -0.30041754245758057, -0.28062960505485535, -0.2608416974544525, -0.2410537600517273, -0.22126585245132446, -0.20147792994976044, -0.1816900074481964, -0.1619020402431488, -0.14211411774158478, -0.12232619524002075, -0.10253828018903732, -0.0827503576874733, -0.06296243518590927, -0.04317452013492584, -0.023386597633361816, -0.0035986751317977905, 0.016189245507121086, 0.03597716614603996, 0.05576508492231369, 0.07555300742387772, 0.09534092992544174, 0.11512884497642517, 0.1349167674779892, 0.15470468997955322, 0.17449261248111725, 0.19428053498268127, 0.2140684425830841, 0.23385637998580933, 0.25364428758621216, 0.273432195186615, 0.2932201325893402, 0.31300806999206543, 0.33279597759246826, 0.3525839149951935, 0.3723718225955963, 0.39215975999832153, 0.41194766759872437, 0.4317355751991272, 0.4515235126018524, 0.47131142020225525]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 5.0, 10.0, 6.0, 15.0, 17.0, 26.0, 19.0, 35.0, 31.0, 38.0, 56.0, 44.0, 46.0, 55.0, 80.0, 67.0, 69.0, 54.0, 51.0, 46.0, 47.0, 32.0, 39.0, 22.0, 32.0, 22.0, 12.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.16861772537231445, -0.16424690186977386, -0.15987607836723328, -0.1555052548646927, -0.1511344313621521, -0.1467636078596115, -0.14239278435707092, -0.13802196085453033, -0.13365113735198975, -0.12928031384944916, -0.12490949034690857, -0.12053866684436798, -0.11616784334182739, -0.1117970198392868, -0.10742619633674622, -0.10305537283420563, -0.09868454933166504, -0.09431372582912445, -0.08994290232658386, -0.08557207882404327, -0.08120125532150269, -0.0768304318189621, -0.07245960831642151, -0.06808878481388092, -0.06371796131134033, -0.059347137808799744, -0.054976314306259155, -0.05060549080371857, -0.04623466730117798, -0.04186384379863739, -0.0374930202960968, -0.03312219679355621, -0.028751373291015625, -0.024380549788475037, -0.020009726285934448, -0.01563890278339386, -0.011268079280853271, -0.006897255778312683, -0.0025264322757720947, 0.0018443912267684937, 0.006215214729309082, 0.01058603823184967, 0.014956861734390259, 0.019327685236930847, 0.023698508739471436, 0.028069332242012024, 0.03244015574455261, 0.0368109792470932, 0.04118180274963379, 0.04555262625217438, 0.049923449754714966, 0.054294273257255554, 0.05866509675979614, 0.06303592026233673, 0.06740674376487732, 0.07177756726741791, 0.0761483907699585, 0.08051921427249908, 0.08489003777503967, 0.08926086127758026, 0.09363168478012085, 0.09800250828266144, 0.10237333178520203, 0.10674415528774261, 0.1111149787902832]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 13.0, 11.0, 28.0, 54.0, 100.0, 150.0, 470.0, 2084.0, 5914.0, 20152.0, 3985124.0, 168290.0, 8094.0, 1905.0, 1134.0, 312.0, 171.0, 88.0, 65.0, 38.0, 25.0, 15.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08563232421875, -0.08301639556884766, -0.08040046691894531, -0.07778453826904297, -0.07516860961914062, -0.07255268096923828, -0.06993675231933594, -0.0673208236694336, -0.06470489501953125, -0.062088966369628906, -0.05947303771972656, -0.05685710906982422, -0.054241180419921875, -0.05162525177001953, -0.04900932312011719, -0.046393394470214844, -0.0437774658203125, -0.041161537170410156, -0.03854560852050781, -0.03592967987060547, -0.033313751220703125, -0.03069782257080078, -0.028081893920898438, -0.025465965270996094, -0.02285003662109375, -0.020234107971191406, -0.017618179321289062, -0.015002250671386719, -0.012386322021484375, -0.009770393371582031, -0.0071544647216796875, -0.004538536071777344, -0.001922607421875, 0.0006933212280273438, 0.0033092498779296875, 0.005925178527832031, 0.008541107177734375, 0.011157035827636719, 0.013772964477539062, 0.016388893127441406, 0.01900482177734375, 0.021620750427246094, 0.024236679077148438, 0.02685260772705078, 0.029468536376953125, 0.03208446502685547, 0.03470039367675781, 0.037316322326660156, 0.0399322509765625, 0.042548179626464844, 0.04516410827636719, 0.04778003692626953, 0.050395965576171875, 0.05301189422607422, 0.05562782287597656, 0.058243751525878906, 0.06085968017578125, 0.0634756088256836, 0.06609153747558594, 0.06870746612548828, 0.07132339477539062, 0.07393932342529297, 0.07655525207519531, 0.07917118072509766, 0.081787109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 12.0, 83.0, 283.0, 387.0, 195.0, 27.0, 11.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.06530046463012695, -0.0632791519165039, -0.06125783920288086, -0.05923652648925781, -0.057215213775634766, -0.05519390106201172, -0.05317258834838867, -0.051151275634765625, -0.04912996292114258, -0.04710865020751953, -0.045087337493896484, -0.04306602478027344, -0.04104471206665039, -0.039023399353027344, -0.0370020866394043, -0.03498077392578125, -0.0329594612121582, -0.030938148498535156, -0.02891683578491211, -0.026895523071289062, -0.024874210357666016, -0.02285289764404297, -0.020831584930419922, -0.018810272216796875, -0.016788959503173828, -0.014767646789550781, -0.012746334075927734, -0.010725021362304688, -0.00870370864868164, -0.006682395935058594, -0.004661083221435547, -0.0026397705078125, -0.0006184577941894531, 0.0014028549194335938, 0.0034241676330566406, 0.0054454803466796875, 0.007466793060302734, 0.009488105773925781, 0.011509418487548828, 0.013530731201171875, 0.015552043914794922, 0.01757335662841797, 0.019594669342041016, 0.021615982055664062, 0.02363729476928711, 0.025658607482910156, 0.027679920196533203, 0.02970123291015625, 0.0317225456237793, 0.033743858337402344, 0.03576517105102539, 0.03778648376464844, 0.039807796478271484, 0.04182910919189453, 0.04385042190551758, 0.045871734619140625, 0.04789304733276367, 0.04991436004638672, 0.051935672760009766, 0.05395698547363281, 0.05597829818725586, 0.057999610900878906, 0.06002092361450195, 0.062042236328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 11.0, 21.0, 14.0, 29.0, 52.0, 104.0, 233.0, 771.0, 9480.0, 4152151.0, 29621.0, 1286.0, 272.0, 111.0, 51.0, 22.0, 16.0, 9.0, 11.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11166858673095703, -0.10730934143066406, -0.1029500961303711, -0.09859085083007812, -0.09423160552978516, -0.08987236022949219, -0.08551311492919922, -0.08115386962890625, -0.07679462432861328, -0.07243537902832031, -0.06807613372802734, -0.06371688842773438, -0.059357643127441406, -0.05499839782714844, -0.05063915252685547, -0.0462799072265625, -0.04192066192626953, -0.03756141662597656, -0.033202171325683594, -0.028842926025390625, -0.024483680725097656, -0.020124435424804688, -0.01576519012451172, -0.01140594482421875, -0.007046699523925781, -0.0026874542236328125, 0.0016717910766601562, 0.006031036376953125, 0.010390281677246094, 0.014749526977539062, 0.01910877227783203, 0.023468017578125, 0.02782726287841797, 0.03218650817871094, 0.036545753479003906, 0.040904998779296875, 0.045264244079589844, 0.04962348937988281, 0.05398273468017578, 0.05834197998046875, 0.06270122528076172, 0.06706047058105469, 0.07141971588134766, 0.07577896118164062, 0.0801382064819336, 0.08449745178222656, 0.08885669708251953, 0.0932159423828125, 0.09757518768310547, 0.10193443298339844, 0.1062936782836914, 0.11065292358398438, 0.11501216888427734, 0.11937141418457031, 0.12373065948486328, 0.12808990478515625, 0.13244915008544922, 0.1368083953857422, 0.14116764068603516, 0.14552688598632812, 0.1498861312866211, 0.15424537658691406, 0.15860462188720703, 0.1629638671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 2.0, 9.0, 19.0, 28.0, 46.0, 107.0, 182.0, 453.0, 1002.0, 1158.0, 500.0, 240.0, 129.0, 72.0, 49.0, 23.0, 20.0, 11.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.045379638671875, -0.04418826103210449, -0.042996883392333984, -0.04180550575256348, -0.04061412811279297, -0.03942275047302246, -0.03823137283325195, -0.037039995193481445, -0.03584861755371094, -0.03465723991394043, -0.03346586227416992, -0.032274484634399414, -0.031083106994628906, -0.0298917293548584, -0.02870035171508789, -0.027508974075317383, -0.026317596435546875, -0.025126218795776367, -0.02393484115600586, -0.02274346351623535, -0.021552085876464844, -0.020360708236694336, -0.019169330596923828, -0.01797795295715332, -0.016786575317382812, -0.015595197677612305, -0.014403820037841797, -0.013212442398071289, -0.012021064758300781, -0.010829687118530273, -0.009638309478759766, -0.008446931838989258, -0.00725555419921875, -0.006064176559448242, -0.004872798919677734, -0.0036814212799072266, -0.0024900436401367188, -0.001298666000366211, -0.00010728836059570312, 0.0010840892791748047, 0.0022754669189453125, 0.0034668445587158203, 0.004658222198486328, 0.005849599838256836, 0.007040977478027344, 0.008232355117797852, 0.00942373275756836, 0.010615110397338867, 0.011806488037109375, 0.012997865676879883, 0.01418924331665039, 0.015380620956420898, 0.016571998596191406, 0.017763376235961914, 0.018954753875732422, 0.02014613151550293, 0.021337509155273438, 0.022528886795043945, 0.023720264434814453, 0.02491164207458496, 0.02610301971435547, 0.027294397354125977, 0.028485774993896484, 0.029677152633666992, 0.0308685302734375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 73.0, 430.0, 402.0, 71.0, 16.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5248697400093079, -0.5129035115242004, -0.5009373426437378, -0.48897111415863037, -0.47700491547584534, -0.4650387167930603, -0.4530724883079529, -0.44110628962516785, -0.4291400909423828, -0.4171738922595978, -0.40520766377449036, -0.3932414650917053, -0.3812752664089203, -0.36930906772613525, -0.35734283924102783, -0.3453766405582428, -0.3334104120731354, -0.32144421339035034, -0.3094779849052429, -0.2975117862224579, -0.28554558753967285, -0.27357935905456543, -0.2616131603717804, -0.24964696168899536, -0.23768074810504913, -0.2257145345211029, -0.21374833583831787, -0.20178212225437164, -0.18981590867042542, -0.17784970998764038, -0.16588349640369415, -0.15391728281974792, -0.14195111393928528, -0.12998490035533905, -0.11801870167255402, -0.10605248808860779, -0.09408628195524216, -0.08212007582187653, -0.0701538622379303, -0.05818765610456467, -0.046221449971199036, -0.034255243837833405, -0.022289033979177475, -0.010322824120521545, 0.0016433820128440857, 0.013609588146209717, 0.025575801730155945, 0.037542007863521576, 0.04950821399688721, 0.06147442013025284, 0.07344062626361847, 0.0854068398475647, 0.09737304598093033, 0.10933925211429596, 0.12130546569824219, 0.13327166438102722, 0.14523787796497345, 0.15720409154891968, 0.1691702902317047, 0.18113650381565094, 0.19310271739959717, 0.2050689160823822, 0.21703512966632843, 0.22900134325027466, 0.2409675419330597]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 8.0, 8.0, 17.0, 29.0, 22.0, 19.0, 29.0, 40.0, 32.0, 45.0, 23.0, 37.0, 41.0, 37.0, 40.0, 47.0, 45.0, 40.0, 39.0, 37.0, 48.0, 45.0, 34.0, 21.0, 33.0, 27.0, 21.0, 24.0, 17.0, 13.0, 11.0, 9.0, 11.0, 4.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07431608438491821, -0.0722103863954544, -0.0701046958565712, -0.06799899786710739, -0.06589330732822418, -0.06378760933876038, -0.06168191134929657, -0.05957621708512306, -0.057470522820949554, -0.05536482855677605, -0.05325913429260254, -0.05115343630313873, -0.049047742038965225, -0.04694204777479172, -0.04483634978532791, -0.042730655521154404, -0.040624961256980896, -0.03851926699280739, -0.03641357272863388, -0.034307874739170074, -0.03220218047499657, -0.03009648621082306, -0.027990790084004402, -0.025885093957185745, -0.023779399693012238, -0.02167370542883873, -0.019568009302020073, -0.017462313175201416, -0.015356618911027908, -0.013250923715531826, -0.011145228520035744, -0.009039533324539661, -0.006933838129043579, -0.004828142933547497, -0.0027224477380514145, -0.0006167525425553322, 0.0014889426529407501, 0.0035946378484368324, 0.005700333043932915, 0.007806028239428997, 0.00991172343492508, 0.012017418630421162, 0.014123113825917244, 0.0162288099527359, 0.01833450421690941, 0.020440198481082916, 0.022545894607901573, 0.02465159073472023, 0.026757284998893738, 0.028862979263067245, 0.030968675389885902, 0.03307437151670456, 0.03518006578087807, 0.037285760045051575, 0.03939145803451538, 0.04149715229868889, 0.043602846562862396, 0.045708540827035904, 0.04781423509120941, 0.04991993308067322, 0.052025627344846725, 0.05413132160902023, 0.05623701959848404, 0.05834271386265755, 0.060448408126831055]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 7.0, 8.0, 9.0, 16.0, 18.0, 23.0, 34.0, 45.0, 59.0, 71.0, 104.0, 155.0, 215.0, 321.0, 550.0, 955.0, 2365.0, 17855.0, 763281.0, 251188.0, 7543.0, 1560.0, 787.0, 455.0, 291.0, 171.0, 127.0, 99.0, 64.0, 57.0, 39.0, 16.0, 17.0, 15.0, 10.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0982666015625, -0.09485816955566406, -0.09144973754882812, -0.08804130554199219, -0.08463287353515625, -0.08122444152832031, -0.07781600952148438, -0.07440757751464844, -0.0709991455078125, -0.06759071350097656, -0.06418228149414062, -0.06077384948730469, -0.05736541748046875, -0.05395698547363281, -0.050548553466796875, -0.04714012145996094, -0.043731689453125, -0.04032325744628906, -0.036914825439453125, -0.03350639343261719, -0.03009796142578125, -0.026689529418945312, -0.023281097412109375, -0.019872665405273438, -0.0164642333984375, -0.013055801391601562, -0.009647369384765625, -0.0062389373779296875, -0.00283050537109375, 0.0005779266357421875, 0.003986358642578125, 0.0073947906494140625, 0.01080322265625, 0.014211654663085938, 0.017620086669921875, 0.021028518676757812, 0.02443695068359375, 0.027845382690429688, 0.031253814697265625, 0.03466224670410156, 0.0380706787109375, 0.04147911071777344, 0.044887542724609375, 0.04829597473144531, 0.05170440673828125, 0.05511283874511719, 0.058521270751953125, 0.06192970275878906, 0.065338134765625, 0.06874656677246094, 0.07215499877929688, 0.07556343078613281, 0.07897186279296875, 0.08238029479980469, 0.08578872680664062, 0.08919715881347656, 0.0926055908203125, 0.09601402282714844, 0.09942245483398438, 0.10283088684082031, 0.10623931884765625, 0.10964775085449219, 0.11305618286132812, 0.11646461486816406, 0.119873046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 67.0, 249.0, 407.0, 222.0, 31.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.0642404556274414, -0.06225776672363281, -0.06027507781982422, -0.058292388916015625, -0.05630970001220703, -0.05432701110839844, -0.052344322204589844, -0.05036163330078125, -0.048378944396972656, -0.04639625549316406, -0.04441356658935547, -0.042430877685546875, -0.04044818878173828, -0.03846549987792969, -0.036482810974121094, -0.0345001220703125, -0.032517433166503906, -0.030534744262695312, -0.02855205535888672, -0.026569366455078125, -0.02458667755126953, -0.022603988647460938, -0.020621299743652344, -0.01863861083984375, -0.016655921936035156, -0.014673233032226562, -0.012690544128417969, -0.010707855224609375, -0.008725166320800781, -0.0067424774169921875, -0.004759788513183594, -0.002777099609375, -0.0007944107055664062, 0.0011882781982421875, 0.0031709671020507812, 0.005153656005859375, 0.007136344909667969, 0.009119033813476562, 0.011101722717285156, 0.01308441162109375, 0.015067100524902344, 0.017049789428710938, 0.01903247833251953, 0.021015167236328125, 0.02299785614013672, 0.024980545043945312, 0.026963233947753906, 0.0289459228515625, 0.030928611755371094, 0.03291130065917969, 0.03489398956298828, 0.036876678466796875, 0.03885936737060547, 0.04084205627441406, 0.042824745178222656, 0.04480743408203125, 0.046790122985839844, 0.04877281188964844, 0.05075550079345703, 0.052738189697265625, 0.05472087860107422, 0.05670356750488281, 0.058686256408691406, 0.0606689453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 10.0, 10.0, 9.0, 22.0, 31.0, 36.0, 42.0, 102.0, 152.0, 230.0, 392.0, 769.0, 1880.0, 11754.0, 458502.0, 556445.0, 14299.0, 2026.0, 771.0, 420.0, 199.0, 150.0, 103.0, 60.0, 33.0, 28.0, 22.0, 9.0, 17.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07078075408935547, -0.06795310974121094, -0.0651254653930664, -0.062297821044921875, -0.059470176696777344, -0.05664253234863281, -0.05381488800048828, -0.05098724365234375, -0.04815959930419922, -0.04533195495605469, -0.042504310607910156, -0.039676666259765625, -0.036849021911621094, -0.03402137756347656, -0.03119373321533203, -0.0283660888671875, -0.02553844451904297, -0.022710800170898438, -0.019883155822753906, -0.017055511474609375, -0.014227867126464844, -0.011400222778320312, -0.008572578430175781, -0.00574493408203125, -0.0029172897338867188, -8.96453857421875e-05, 0.0027379989624023438, 0.005565643310546875, 0.008393287658691406, 0.011220932006835938, 0.014048576354980469, 0.016876220703125, 0.01970386505126953, 0.022531509399414062, 0.025359153747558594, 0.028186798095703125, 0.031014442443847656, 0.03384208679199219, 0.03666973114013672, 0.03949737548828125, 0.04232501983642578, 0.04515266418457031, 0.047980308532714844, 0.050807952880859375, 0.053635597229003906, 0.05646324157714844, 0.05929088592529297, 0.0621185302734375, 0.06494617462158203, 0.06777381896972656, 0.0706014633178711, 0.07342910766601562, 0.07625675201416016, 0.07908439636230469, 0.08191204071044922, 0.08473968505859375, 0.08756732940673828, 0.09039497375488281, 0.09322261810302734, 0.09605026245117188, 0.0988779067993164, 0.10170555114746094, 0.10453319549560547, 0.10736083984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 3.0, 14.0, 12.0, 12.0, 18.0, 16.0, 23.0, 32.0, 36.0, 46.0, 40.0, 47.0, 44.0, 53.0, 59.0, 49.0, 54.0, 54.0, 50.0, 57.0, 54.0, 35.0, 40.0, 33.0, 22.0, 17.0, 21.0, 9.0, 14.0, 5.0, 5.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.04265475273132324, -0.041486263275146484, -0.04031777381896973, -0.03914928436279297, -0.03798079490661621, -0.03681230545043945, -0.035643815994262695, -0.03447532653808594, -0.03330683708190918, -0.03213834762573242, -0.030969858169555664, -0.029801368713378906, -0.02863287925720215, -0.02746438980102539, -0.026295900344848633, -0.025127410888671875, -0.023958921432495117, -0.02279043197631836, -0.0216219425201416, -0.020453453063964844, -0.019284963607788086, -0.018116474151611328, -0.01694798469543457, -0.015779495239257812, -0.014611005783081055, -0.013442516326904297, -0.012274026870727539, -0.011105537414550781, -0.009937047958374023, -0.008768558502197266, -0.007600069046020508, -0.00643157958984375, -0.005263090133666992, -0.004094600677490234, -0.0029261112213134766, -0.0017576217651367188, -0.0005891323089599609, 0.0005793571472167969, 0.0017478466033935547, 0.0029163360595703125, 0.00408482551574707, 0.005253314971923828, 0.006421804428100586, 0.007590293884277344, 0.008758783340454102, 0.00992727279663086, 0.011095762252807617, 0.012264251708984375, 0.013432741165161133, 0.01460123062133789, 0.01576972007751465, 0.016938209533691406, 0.018106698989868164, 0.019275188446044922, 0.02044367790222168, 0.021612167358398438, 0.022780656814575195, 0.023949146270751953, 0.02511763572692871, 0.02628612518310547, 0.027454614639282227, 0.028623104095458984, 0.029791593551635742, 0.0309600830078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 1.0, 8.0, 8.0, 16.0, 19.0, 18.0, 34.0, 61.0, 70.0, 105.0, 157.0, 262.0, 491.0, 1066.0, 2303.0, 6208.0, 21194.0, 114599.0, 693563.0, 167753.0, 27657.0, 7586.0, 2747.0, 1235.0, 573.0, 301.0, 183.0, 119.0, 61.0, 46.0, 32.0, 20.0, 13.0, 13.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0293426513671875, -0.02849435806274414, -0.02764606475830078, -0.026797771453857422, -0.025949478149414062, -0.025101184844970703, -0.024252891540527344, -0.023404598236083984, -0.022556304931640625, -0.021708011627197266, -0.020859718322753906, -0.020011425018310547, -0.019163131713867188, -0.018314838409423828, -0.01746654510498047, -0.01661825180053711, -0.01576995849609375, -0.01492166519165039, -0.014073371887207031, -0.013225078582763672, -0.012376785278320312, -0.011528491973876953, -0.010680198669433594, -0.009831905364990234, -0.008983612060546875, -0.008135318756103516, -0.007287025451660156, -0.006438732147216797, -0.0055904388427734375, -0.004742145538330078, -0.0038938522338867188, -0.0030455589294433594, -0.002197265625, -0.0013489723205566406, -0.0005006790161132812, 0.0003476142883300781, 0.0011959075927734375, 0.002044200897216797, 0.0028924942016601562, 0.0037407875061035156, 0.004589080810546875, 0.005437374114990234, 0.006285667419433594, 0.007133960723876953, 0.007982254028320312, 0.008830547332763672, 0.009678840637207031, 0.01052713394165039, 0.01137542724609375, 0.01222372055053711, 0.013072013854980469, 0.013920307159423828, 0.014768600463867188, 0.015616893768310547, 0.016465187072753906, 0.017313480377197266, 0.018161773681640625, 0.019010066986083984, 0.019858360290527344, 0.020706653594970703, 0.021554946899414062, 0.022403240203857422, 0.02325153350830078, 0.02409982681274414, 0.0249481201171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 19.0, 12.0, 26.0, 39.0, 52.0, 89.0, 157.0, 214.0, 128.0, 76.0, 44.0, 36.0, 27.0, 10.0, 9.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016164779663085938, -0.0001577325165271759, -0.00015381723642349243, -0.00014990195631980896, -0.0001459866762161255, -0.00014207139611244202, -0.00013815611600875854, -0.00013424083590507507, -0.0001303255558013916, -0.00012641027569770813, -0.00012249499559402466, -0.00011857971549034119, -0.00011466443538665771, -0.00011074915528297424, -0.00010683387517929077, -0.0001029185950756073, -9.900331497192383e-05, -9.508803486824036e-05, -9.117275476455688e-05, -8.725747466087341e-05, -8.334219455718994e-05, -7.942691445350647e-05, -7.5511634349823e-05, -7.159635424613953e-05, -6.768107414245605e-05, -6.376579403877258e-05, -5.985051393508911e-05, -5.593523383140564e-05, -5.201995372772217e-05, -4.8104673624038696e-05, -4.4189393520355225e-05, -4.027411341667175e-05, -3.635883331298828e-05, -3.244355320930481e-05, -2.8528273105621338e-05, -2.4612993001937866e-05, -2.0697712898254395e-05, -1.6782432794570923e-05, -1.2867152690887451e-05, -8.95187258720398e-06, -5.036592483520508e-06, -1.1213123798370361e-06, 2.7939677238464355e-06, 6.709247827529907e-06, 1.0624527931213379e-05, 1.453980803489685e-05, 1.8455088138580322e-05, 2.2370368242263794e-05, 2.6285648345947266e-05, 3.0200928449630737e-05, 3.411620855331421e-05, 3.803148865699768e-05, 4.194676876068115e-05, 4.5862048864364624e-05, 4.9777328968048096e-05, 5.369260907173157e-05, 5.760788917541504e-05, 6.152316927909851e-05, 6.543844938278198e-05, 6.935372948646545e-05, 7.326900959014893e-05, 7.71842896938324e-05, 8.109956979751587e-05, 8.501484990119934e-05, 8.893013000488281e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 9.0, 14.0, 19.0, 28.0, 41.0, 37.0, 60.0, 71.0, 109.0, 200.0, 324.0, 549.0, 1232.0, 3243.0, 12490.0, 84662.0, 766053.0, 153276.0, 18482.0, 4315.0, 1482.0, 746.0, 371.0, 241.0, 134.0, 106.0, 64.0, 45.0, 31.0, 24.0, 18.0, 10.0, 12.0, 3.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029815673828125, -0.028809070587158203, -0.027802467346191406, -0.02679586410522461, -0.025789260864257812, -0.024782657623291016, -0.02377605438232422, -0.022769451141357422, -0.021762847900390625, -0.020756244659423828, -0.01974964141845703, -0.018743038177490234, -0.017736434936523438, -0.01672983169555664, -0.015723228454589844, -0.014716625213623047, -0.01371002197265625, -0.012703418731689453, -0.011696815490722656, -0.01069021224975586, -0.009683609008789062, -0.008677005767822266, -0.007670402526855469, -0.006663799285888672, -0.005657196044921875, -0.004650592803955078, -0.0036439895629882812, -0.0026373863220214844, -0.0016307830810546875, -0.0006241798400878906, 0.00038242340087890625, 0.0013890266418457031, 0.0023956298828125, 0.003402233123779297, 0.004408836364746094, 0.005415439605712891, 0.0064220428466796875, 0.007428646087646484, 0.008435249328613281, 0.009441852569580078, 0.010448455810546875, 0.011455059051513672, 0.012461662292480469, 0.013468265533447266, 0.014474868774414062, 0.01548147201538086, 0.016488075256347656, 0.017494678497314453, 0.01850128173828125, 0.019507884979248047, 0.020514488220214844, 0.02152109146118164, 0.022527694702148438, 0.023534297943115234, 0.02454090118408203, 0.025547504425048828, 0.026554107666015625, 0.027560710906982422, 0.02856731414794922, 0.029573917388916016, 0.030580520629882812, 0.03158712387084961, 0.032593727111816406, 0.0336003303527832, 0.03460693359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 6.0, 18.0, 13.0, 23.0, 22.0, 20.0, 36.0, 36.0, 66.0, 91.0, 122.0, 128.0, 84.0, 81.0, 49.0, 27.0, 31.0, 17.0, 23.0, 18.0, 7.0, 13.0, 12.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147705078125, -0.014266252517700195, -0.01376199722290039, -0.013257741928100586, -0.012753486633300781, -0.012249231338500977, -0.011744976043701172, -0.011240720748901367, -0.010736465454101562, -0.010232210159301758, -0.009727954864501953, -0.009223699569702148, -0.008719444274902344, -0.008215188980102539, -0.007710933685302734, -0.00720667839050293, -0.006702423095703125, -0.00619816780090332, -0.005693912506103516, -0.005189657211303711, -0.004685401916503906, -0.0041811466217041016, -0.003676891326904297, -0.003172636032104492, -0.0026683807373046875, -0.002164125442504883, -0.0016598701477050781, -0.0011556148529052734, -0.0006513595581054688, -0.00014710426330566406, 0.0003571510314941406, 0.0008614063262939453, 0.00136566162109375, 0.0018699169158935547, 0.0023741722106933594, 0.002878427505493164, 0.0033826828002929688, 0.0038869380950927734, 0.004391193389892578, 0.004895448684692383, 0.0053997039794921875, 0.005903959274291992, 0.006408214569091797, 0.0069124698638916016, 0.007416725158691406, 0.007920980453491211, 0.008425235748291016, 0.00892949104309082, 0.009433746337890625, 0.00993800163269043, 0.010442256927490234, 0.010946512222290039, 0.011450767517089844, 0.011955022811889648, 0.012459278106689453, 0.012963533401489258, 0.013467788696289062, 0.013972043991088867, 0.014476299285888672, 0.014980554580688477, 0.015484809875488281, 0.015989065170288086, 0.01649332046508789, 0.016997575759887695, 0.0175018310546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 322.0, 632.0, 45.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41871970891952515, -0.3891350328922272, -0.3595503568649292, -0.32996565103530884, -0.30038100481033325, -0.2707962989807129, -0.24121162295341492, -0.21162694692611694, -0.18204227089881897, -0.152457594871521, -0.12287291139364243, -0.09328822791576385, -0.06370355188846588, -0.03411887586116791, -0.00453418493270874, 0.025050491094589233, 0.05463516712188721, 0.08421984314918518, 0.11380452662706375, 0.14338921010494232, 0.1729738861322403, 0.20255856215953827, 0.23214325308799744, 0.2617279291152954, 0.2913126051425934, 0.32089728116989136, 0.35048195719718933, 0.3800666332244873, 0.40965133905410767, 0.43923598527908325, 0.4688206911087036, 0.4984053671360016, 0.5279901027679443, 0.5575748085975647, 0.5871594548225403, 0.6167441606521606, 0.6463288068771362, 0.6759135127067566, 0.705498218536377, 0.7350828647613525, 0.7646675109863281, 0.7942522168159485, 0.8238368630409241, 0.8534215688705444, 0.88300621509552, 0.9125909209251404, 0.9421756267547607, 0.9717602729797363, 1.001344919204712, 1.0309295654296875, 1.0605143308639526, 1.0900989770889282, 1.1196836233139038, 1.1492682695388794, 1.1788530349731445, 1.2084376811981201, 1.2380224466323853, 1.2676070928573608, 1.297191858291626, 1.3267765045166016, 1.3563611507415771, 1.3859457969665527, 1.4155305624008179, 1.4451152086257935, 1.474699854850769]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 6.0, 5.0, 14.0, 21.0, 27.0, 39.0, 46.0, 65.0, 66.0, 84.0, 64.0, 99.0, 69.0, 85.0, 71.0, 40.0, 48.0, 41.0, 32.0, 26.0, 13.0, 12.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22911089658737183, -0.22271935641765594, -0.21632781624794006, -0.20993627607822418, -0.2035447359085083, -0.19715319573879242, -0.19076165556907654, -0.18437010049819946, -0.17797857522964478, -0.1715870350599289, -0.165195494890213, -0.15880395472049713, -0.15241241455078125, -0.14602087438106537, -0.1396293342113495, -0.1332377791404724, -0.12684623897075653, -0.12045469880104065, -0.11406315863132477, -0.10767161846160889, -0.101280078291893, -0.09488853812217712, -0.08849699050188065, -0.08210545033216476, -0.07571391016244888, -0.069322369992733, -0.06293082982301712, -0.05653928592801094, -0.05014774575829506, -0.04375620558857918, -0.037364661693573, -0.030973121523857117, -0.024581581354141235, -0.018190041184425354, -0.011798499152064323, -0.005406957119703293, 0.0009845830500125885, 0.00737612321972847, 0.01376766711473465, 0.02015920728445053, 0.026550747454166412, 0.032942287623882294, 0.039333827793598175, 0.045725371688604355, 0.052116911858320236, 0.05850845202803612, 0.0648999959230423, 0.07129153609275818, 0.07768307626247406, 0.08407461643218994, 0.09046615660190582, 0.0968576967716217, 0.10324923694133759, 0.10964077711105347, 0.11603232473134995, 0.12242386490106583, 0.1288154125213623, 0.13520695269107819, 0.14159849286079407, 0.14799003303050995, 0.15438157320022583, 0.1607731133699417, 0.1671646535396576, 0.17355620861053467, 0.17994773387908936]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 15.0, 20.0, 34.0, 46.0, 86.0, 172.0, 733.0, 2365.0, 4818.0, 13080.0, 2224695.0, 1929919.0, 11970.0, 3779.0, 1183.0, 824.0, 239.0, 101.0, 60.0, 37.0, 28.0, 12.0, 12.0, 13.0, 11.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06900978088378906, -0.06685256958007812, -0.06469535827636719, -0.06253814697265625, -0.06038093566894531, -0.058223724365234375, -0.05606651306152344, -0.0539093017578125, -0.05175209045410156, -0.049594879150390625, -0.04743766784667969, -0.04528045654296875, -0.04312324523925781, -0.040966033935546875, -0.03880882263183594, -0.036651611328125, -0.03449440002441406, -0.032337188720703125, -0.030179977416992188, -0.02802276611328125, -0.025865554809570312, -0.023708343505859375, -0.021551132202148438, -0.0193939208984375, -0.017236709594726562, -0.015079498291015625, -0.012922286987304688, -0.01076507568359375, -0.008607864379882812, -0.006450653076171875, -0.0042934417724609375, -0.00213623046875, 2.09808349609375e-05, 0.002178192138671875, 0.0043354034423828125, 0.00649261474609375, 0.008649826049804688, 0.010807037353515625, 0.012964248657226562, 0.0151214599609375, 0.017278671264648438, 0.019435882568359375, 0.021593093872070312, 0.02375030517578125, 0.025907516479492188, 0.028064727783203125, 0.030221939086914062, 0.032379150390625, 0.03453636169433594, 0.036693572998046875, 0.03885078430175781, 0.04100799560546875, 0.04316520690917969, 0.045322418212890625, 0.04747962951660156, 0.0496368408203125, 0.05179405212402344, 0.053951263427734375, 0.05610847473144531, 0.05826568603515625, 0.06042289733886719, 0.06258010864257812, 0.06473731994628906, 0.06689453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 23.0, 106.0, 303.0, 363.0, 166.0, 24.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06793212890625, -0.06588459014892578, -0.06383705139160156, -0.061789512634277344, -0.059741973876953125, -0.057694435119628906, -0.05564689636230469, -0.05359935760498047, -0.05155181884765625, -0.04950428009033203, -0.04745674133300781, -0.045409202575683594, -0.043361663818359375, -0.041314125061035156, -0.03926658630371094, -0.03721904754638672, -0.0351715087890625, -0.03312397003173828, -0.031076431274414062, -0.029028892517089844, -0.026981353759765625, -0.024933815002441406, -0.022886276245117188, -0.02083873748779297, -0.01879119873046875, -0.01674365997314453, -0.014696121215820312, -0.012648582458496094, -0.010601043701171875, -0.008553504943847656, -0.0065059661865234375, -0.004458427429199219, -0.002410888671875, -0.00036334991455078125, 0.0016841888427734375, 0.0037317276000976562, 0.005779266357421875, 0.007826805114746094, 0.009874343872070312, 0.011921882629394531, 0.01396942138671875, 0.01601696014404297, 0.018064498901367188, 0.020112037658691406, 0.022159576416015625, 0.024207115173339844, 0.026254653930664062, 0.02830219268798828, 0.0303497314453125, 0.03239727020263672, 0.03444480895996094, 0.036492347717285156, 0.038539886474609375, 0.040587425231933594, 0.04263496398925781, 0.04468250274658203, 0.04673004150390625, 0.04877758026123047, 0.05082511901855469, 0.052872657775878906, 0.054920196533203125, 0.056967735290527344, 0.05901527404785156, 0.06106281280517578, 0.0631103515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 9.0, 8.0, 12.0, 13.0, 31.0, 43.0, 47.0, 139.0, 421.0, 1859.0, 36526.0, 4105475.0, 46853.0, 2120.0, 437.0, 147.0, 57.0, 26.0, 24.0, 12.0, 7.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.07347393035888672, -0.07089805603027344, -0.06832218170166016, -0.06574630737304688, -0.0631704330444336, -0.06059455871582031, -0.05801868438720703, -0.05544281005859375, -0.05286693572998047, -0.05029106140136719, -0.047715187072753906, -0.045139312744140625, -0.042563438415527344, -0.03998756408691406, -0.03741168975830078, -0.0348358154296875, -0.03225994110107422, -0.029684066772460938, -0.027108192443847656, -0.024532318115234375, -0.021956443786621094, -0.019380569458007812, -0.01680469512939453, -0.01422882080078125, -0.011652946472167969, -0.009077072143554688, -0.006501197814941406, -0.003925323486328125, -0.0013494491577148438, 0.0012264251708984375, 0.0038022994995117188, 0.006378173828125, 0.008954048156738281, 0.011529922485351562, 0.014105796813964844, 0.016681671142578125, 0.019257545471191406, 0.021833419799804688, 0.02440929412841797, 0.02698516845703125, 0.02956104278564453, 0.03213691711425781, 0.034712791442871094, 0.037288665771484375, 0.039864540100097656, 0.04244041442871094, 0.04501628875732422, 0.0475921630859375, 0.05016803741455078, 0.05274391174316406, 0.055319786071777344, 0.057895660400390625, 0.060471534729003906, 0.06304740905761719, 0.06562328338623047, 0.06819915771484375, 0.07077503204345703, 0.07335090637207031, 0.0759267807006836, 0.07850265502929688, 0.08107852935791016, 0.08365440368652344, 0.08623027801513672, 0.08880615234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 12.0, 19.0, 23.0, 62.0, 92.0, 143.0, 327.0, 745.0, 1167.0, 740.0, 301.0, 169.0, 93.0, 55.0, 39.0, 24.0, 15.0, 11.0, 5.0, 3.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035369873046875, -0.03445100784301758, -0.033532142639160156, -0.032613277435302734, -0.03169441223144531, -0.03077554702758789, -0.02985668182373047, -0.028937816619873047, -0.028018951416015625, -0.027100086212158203, -0.02618122100830078, -0.02526235580444336, -0.024343490600585938, -0.023424625396728516, -0.022505760192871094, -0.021586894989013672, -0.02066802978515625, -0.019749164581298828, -0.018830299377441406, -0.017911434173583984, -0.016992568969726562, -0.01607370376586914, -0.015154838562011719, -0.014235973358154297, -0.013317108154296875, -0.012398242950439453, -0.011479377746582031, -0.01056051254272461, -0.009641647338867188, -0.008722782135009766, -0.007803916931152344, -0.006885051727294922, -0.0059661865234375, -0.005047321319580078, -0.004128456115722656, -0.0032095909118652344, -0.0022907257080078125, -0.0013718605041503906, -0.00045299530029296875, 0.0004658699035644531, 0.001384735107421875, 0.002303600311279297, 0.0032224655151367188, 0.004141330718994141, 0.0050601959228515625, 0.005979061126708984, 0.006897926330566406, 0.007816791534423828, 0.00873565673828125, 0.009654521942138672, 0.010573387145996094, 0.011492252349853516, 0.012411117553710938, 0.01332998275756836, 0.014248847961425781, 0.015167713165283203, 0.016086578369140625, 0.017005443572998047, 0.01792430877685547, 0.01884317398071289, 0.019762039184570312, 0.020680904388427734, 0.021599769592285156, 0.022518634796142578, 0.0234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 155.0, 718.0, 108.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6978673934936523, -0.6817833185195923, -0.665699303150177, -0.6496152281761169, -0.6335312128067017, -0.6174471378326416, -0.6013630628585815, -0.5852790474891663, -0.5691949725151062, -0.5531108975410461, -0.5370268821716309, -0.5209428071975708, -0.5048587918281555, -0.48877471685409546, -0.4726906716823578, -0.4566066265106201, -0.44052258133888245, -0.4244385361671448, -0.4083544909954071, -0.39227044582366943, -0.3761863708496094, -0.3601023256778717, -0.34401828050613403, -0.32793423533439636, -0.3118501901626587, -0.295766144990921, -0.27968209981918335, -0.2635980248451233, -0.24751397967338562, -0.23142993450164795, -0.21534588932991028, -0.1992618441581726, -0.18317779898643494, -0.16709375381469727, -0.1510096937417984, -0.13492564857006073, -0.11884159594774246, -0.1027575433254242, -0.08667349815368652, -0.07058944553136826, -0.05450539290904999, -0.03842134028673172, -0.02233729138970375, -0.006253242492675781, 0.009830810129642487, 0.025914862751960754, 0.041998907923698425, 0.05808296054601669, 0.07416701316833496, 0.09025106579065323, 0.1063351184129715, 0.12241916358470917, 0.13850322365760803, 0.1545872688293457, 0.17067131400108337, 0.18675535917282104, 0.2028394192457199, 0.21892346441745758, 0.23500752449035645, 0.2510915696620941, 0.2671756148338318, 0.28325968980789185, 0.29934370517730713, 0.3154277801513672, 0.33151182532310486]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 10.0, 10.0, 15.0, 18.0, 29.0, 43.0, 42.0, 58.0, 63.0, 76.0, 82.0, 66.0, 74.0, 73.0, 62.0, 67.0, 48.0, 40.0, 37.0, 26.0, 24.0, 17.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11094796657562256, -0.10793082416057587, -0.10491368174552917, -0.10189653187990189, -0.0988793894648552, -0.0958622470498085, -0.09284509718418121, -0.08982795476913452, -0.08681081235408783, -0.08379366993904114, -0.08077652752399445, -0.07775937765836716, -0.07474223524332047, -0.07172509282827377, -0.06870794296264648, -0.06569080054759979, -0.0626736581325531, -0.05965651571750641, -0.05663936957716942, -0.05362222343683243, -0.050605081021785736, -0.047587938606739044, -0.044570792466402054, -0.041553646326065063, -0.03853650391101837, -0.03551936149597168, -0.03250221535563469, -0.029485071077942848, -0.026467926800251007, -0.023450782522559166, -0.020433638244867325, -0.017416493967175484, -0.014399349689483643, -0.011382205411791801, -0.00836506113409996, -0.005347916856408119, -0.002330772578716278, 0.000686371698975563, 0.003703515976667404, 0.006720660254359245, 0.009737804532051086, 0.012754948809742928, 0.01577209308743477, 0.01878923736512661, 0.02180638164281845, 0.024823525920510292, 0.027840670198202133, 0.030857814475893974, 0.033874958753585815, 0.03689210116863251, 0.0399092473089695, 0.04292639344930649, 0.04594353586435318, 0.04896067827939987, 0.05197782441973686, 0.05499497056007385, 0.058012112975120544, 0.061029255390167236, 0.06404639780521393, 0.06706354767084122, 0.07008069008588791, 0.0730978325009346, 0.07611498236656189, 0.07913212478160858, 0.08214926719665527]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 10.0, 10.0, 17.0, 17.0, 24.0, 33.0, 52.0, 84.0, 128.0, 144.0, 280.0, 435.0, 852.0, 2335.0, 32368.0, 953041.0, 53686.0, 2731.0, 899.0, 471.0, 301.0, 215.0, 151.0, 86.0, 54.0, 35.0, 28.0, 17.0, 17.0, 10.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.089111328125, -0.0862874984741211, -0.08346366882324219, -0.08063983917236328, -0.07781600952148438, -0.07499217987060547, -0.07216835021972656, -0.06934452056884766, -0.06652069091796875, -0.06369686126708984, -0.06087303161621094, -0.05804920196533203, -0.055225372314453125, -0.05240154266357422, -0.04957771301269531, -0.046753883361816406, -0.0439300537109375, -0.041106224060058594, -0.03828239440917969, -0.03545856475830078, -0.032634735107421875, -0.02981090545654297, -0.026987075805664062, -0.024163246154785156, -0.02133941650390625, -0.018515586853027344, -0.015691757202148438, -0.012867927551269531, -0.010044097900390625, -0.007220268249511719, -0.0043964385986328125, -0.0015726089477539062, 0.001251220703125, 0.004075050354003906, 0.0068988800048828125, 0.009722709655761719, 0.012546539306640625, 0.015370368957519531, 0.018194198608398438, 0.021018028259277344, 0.02384185791015625, 0.026665687561035156, 0.029489517211914062, 0.03231334686279297, 0.035137176513671875, 0.03796100616455078, 0.04078483581542969, 0.043608665466308594, 0.0464324951171875, 0.049256324768066406, 0.05208015441894531, 0.05490398406982422, 0.057727813720703125, 0.06055164337158203, 0.06337547302246094, 0.06619930267333984, 0.06902313232421875, 0.07184696197509766, 0.07467079162597656, 0.07749462127685547, 0.08031845092773438, 0.08314228057861328, 0.08596611022949219, 0.0887899398803711, 0.09161376953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 20.0, 65.0, 248.0, 378.0, 224.0, 50.0, 9.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.06388711929321289, -0.06191730499267578, -0.05994749069213867, -0.05797767639160156, -0.05600786209106445, -0.054038047790527344, -0.052068233489990234, -0.050098419189453125, -0.048128604888916016, -0.046158790588378906, -0.0441889762878418, -0.04221916198730469, -0.04024934768676758, -0.03827953338623047, -0.03630971908569336, -0.03433990478515625, -0.03237009048461914, -0.03040027618408203, -0.028430461883544922, -0.026460647583007812, -0.024490833282470703, -0.022521018981933594, -0.020551204681396484, -0.018581390380859375, -0.016611576080322266, -0.014641761779785156, -0.012671947479248047, -0.010702133178710938, -0.008732318878173828, -0.006762504577636719, -0.004792690277099609, -0.0028228759765625, -0.0008530616760253906, 0.0011167526245117188, 0.003086566925048828, 0.0050563812255859375, 0.007026195526123047, 0.008996009826660156, 0.010965824127197266, 0.012935638427734375, 0.014905452728271484, 0.016875267028808594, 0.018845081329345703, 0.020814895629882812, 0.022784709930419922, 0.02475452423095703, 0.02672433853149414, 0.02869415283203125, 0.03066396713256836, 0.03263378143310547, 0.03460359573364258, 0.03657341003417969, 0.0385432243347168, 0.040513038635253906, 0.042482852935791016, 0.044452667236328125, 0.046422481536865234, 0.048392295837402344, 0.05036211013793945, 0.05233192443847656, 0.05430173873901367, 0.05627155303955078, 0.05824136734008789, 0.060211181640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 9.0, 8.0, 9.0, 13.0, 11.0, 24.0, 12.0, 23.0, 33.0, 45.0, 78.0, 119.0, 167.0, 349.0, 699.0, 2239.0, 27655.0, 895745.0, 115222.0, 3950.0, 1003.0, 418.0, 236.0, 125.0, 82.0, 65.0, 41.0, 29.0, 30.0, 12.0, 15.0, 19.0, 16.0, 14.0, 6.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07220458984375, -0.06992435455322266, -0.06764411926269531, -0.06536388397216797, -0.06308364868164062, -0.06080341339111328, -0.05852317810058594, -0.056242942810058594, -0.05396270751953125, -0.051682472229003906, -0.04940223693847656, -0.04712200164794922, -0.044841766357421875, -0.04256153106689453, -0.04028129577636719, -0.038001060485839844, -0.0357208251953125, -0.033440589904785156, -0.031160354614257812, -0.02888011932373047, -0.026599884033203125, -0.02431964874267578, -0.022039413452148438, -0.019759178161621094, -0.01747894287109375, -0.015198707580566406, -0.012918472290039062, -0.010638236999511719, -0.008358001708984375, -0.006077766418457031, -0.0037975311279296875, -0.0015172958374023438, 0.000762939453125, 0.0030431747436523438, 0.0053234100341796875, 0.007603645324707031, 0.009883880615234375, 0.012164115905761719, 0.014444351196289062, 0.016724586486816406, 0.01900482177734375, 0.021285057067871094, 0.023565292358398438, 0.02584552764892578, 0.028125762939453125, 0.03040599822998047, 0.03268623352050781, 0.034966468811035156, 0.0372467041015625, 0.039526939392089844, 0.04180717468261719, 0.04408740997314453, 0.046367645263671875, 0.04864788055419922, 0.05092811584472656, 0.053208351135253906, 0.05548858642578125, 0.057768821716308594, 0.06004905700683594, 0.06232929229736328, 0.06460952758789062, 0.06688976287841797, 0.06916999816894531, 0.07145023345947266, 0.07373046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 10.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 9.0, 16.0, 15.0, 25.0, 30.0, 31.0, 24.0, 35.0, 47.0, 37.0, 40.0, 45.0, 37.0, 43.0, 40.0, 50.0, 38.0, 44.0, 47.0, 31.0, 32.0, 31.0, 22.0, 35.0, 25.0, 20.0, 16.0, 15.0, 7.0, 12.0, 13.0, 10.0, 9.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.025805950164794922, -0.024939537048339844, -0.024073123931884766, -0.023206710815429688, -0.02234029769897461, -0.02147388458251953, -0.020607471466064453, -0.019741058349609375, -0.018874645233154297, -0.01800823211669922, -0.01714181900024414, -0.016275405883789062, -0.015408992767333984, -0.014542579650878906, -0.013676166534423828, -0.01280975341796875, -0.011943340301513672, -0.011076927185058594, -0.010210514068603516, -0.009344100952148438, -0.00847768783569336, -0.007611274719238281, -0.006744861602783203, -0.005878448486328125, -0.005012035369873047, -0.004145622253417969, -0.0032792091369628906, -0.0024127960205078125, -0.0015463829040527344, -0.0006799697875976562, 0.00018644332885742188, 0.0010528564453125, 0.0019192695617675781, 0.0027856826782226562, 0.0036520957946777344, 0.0045185089111328125, 0.005384922027587891, 0.006251335144042969, 0.007117748260498047, 0.007984161376953125, 0.008850574493408203, 0.009716987609863281, 0.01058340072631836, 0.011449813842773438, 0.012316226959228516, 0.013182640075683594, 0.014049053192138672, 0.01491546630859375, 0.015781879425048828, 0.016648292541503906, 0.017514705657958984, 0.018381118774414062, 0.01924753189086914, 0.02011394500732422, 0.020980358123779297, 0.021846771240234375, 0.022713184356689453, 0.02357959747314453, 0.02444601058959961, 0.025312423706054688, 0.026178836822509766, 0.027045249938964844, 0.027911663055419922, 0.028778076171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 6.0, 10.0, 18.0, 24.0, 54.0, 99.0, 155.0, 327.0, 737.0, 1976.0, 6289.0, 26062.0, 215041.0, 692552.0, 84184.0, 14567.0, 4059.0, 1317.0, 525.0, 238.0, 112.0, 53.0, 43.0, 28.0, 18.0, 17.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.02099609375, -0.02043330669403076, -0.019870519638061523, -0.019307732582092285, -0.018744945526123047, -0.01818215847015381, -0.01761937141418457, -0.017056584358215332, -0.016493797302246094, -0.015931010246276855, -0.015368223190307617, -0.014805436134338379, -0.01424264907836914, -0.013679862022399902, -0.013117074966430664, -0.012554287910461426, -0.011991500854492188, -0.01142871379852295, -0.010865926742553711, -0.010303139686584473, -0.009740352630615234, -0.009177565574645996, -0.008614778518676758, -0.00805199146270752, -0.007489204406738281, -0.006926417350769043, -0.006363630294799805, -0.005800843238830566, -0.005238056182861328, -0.00467526912689209, -0.0041124820709228516, -0.0035496950149536133, -0.002986907958984375, -0.0024241209030151367, -0.0018613338470458984, -0.0012985467910766602, -0.0007357597351074219, -0.0001729726791381836, 0.0003898143768310547, 0.000952601432800293, 0.0015153884887695312, 0.0020781755447387695, 0.002640962600708008, 0.003203749656677246, 0.0037665367126464844, 0.004329323768615723, 0.004892110824584961, 0.005454897880554199, 0.0060176849365234375, 0.006580471992492676, 0.007143259048461914, 0.007706046104431152, 0.00826883316040039, 0.008831620216369629, 0.009394407272338867, 0.009957194328308105, 0.010519981384277344, 0.011082768440246582, 0.01164555549621582, 0.012208342552185059, 0.012771129608154297, 0.013333916664123535, 0.013896703720092773, 0.014459490776062012, 0.01502227783203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 22.0, 27.0, 35.0, 53.0, 61.0, 76.0, 109.0, 122.0, 100.0, 72.0, 75.0, 59.0, 28.0, 19.0, 19.0, 12.0, 14.0, 8.0, 5.0, 12.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.702278137207031e-05, -8.457992225885391e-05, -8.213706314563751e-05, -7.969420403242111e-05, -7.725134491920471e-05, -7.480848580598831e-05, -7.236562669277191e-05, -6.992276757955551e-05, -6.747990846633911e-05, -6.503704935312271e-05, -6.259419023990631e-05, -6.015133112668991e-05, -5.770847201347351e-05, -5.526561290025711e-05, -5.282275378704071e-05, -5.037989467382431e-05, -4.793703556060791e-05, -4.549417644739151e-05, -4.305131733417511e-05, -4.060845822095871e-05, -3.816559910774231e-05, -3.572273999452591e-05, -3.327988088130951e-05, -3.083702176809311e-05, -2.839416265487671e-05, -2.595130354166031e-05, -2.350844442844391e-05, -2.106558531522751e-05, -1.862272620201111e-05, -1.6179867088794708e-05, -1.3737007975578308e-05, -1.1294148862361908e-05, -8.851289749145508e-06, -6.408430635929108e-06, -3.9655715227127075e-06, -1.5227124094963074e-06, 9.201467037200928e-07, 3.363005816936493e-06, 5.805864930152893e-06, 8.248724043369293e-06, 1.0691583156585693e-05, 1.3134442269802094e-05, 1.5577301383018494e-05, 1.8020160496234894e-05, 2.0463019609451294e-05, 2.2905878722667694e-05, 2.5348737835884094e-05, 2.7791596949100494e-05, 3.0234456062316895e-05, 3.2677315175533295e-05, 3.5120174288749695e-05, 3.7563033401966095e-05, 4.0005892515182495e-05, 4.2448751628398895e-05, 4.4891610741615295e-05, 4.7334469854831696e-05, 4.9777328968048096e-05, 5.2220188081264496e-05, 5.4663047194480896e-05, 5.7105906307697296e-05, 5.9548765420913696e-05, 6.19916245341301e-05, 6.44344836473465e-05, 6.68773427605629e-05, 6.93202018737793e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 15.0, 16.0, 23.0, 30.0, 44.0, 67.0, 93.0, 156.0, 245.0, 516.0, 1011.0, 2311.0, 5744.0, 15550.0, 55009.0, 467893.0, 424148.0, 50959.0, 15030.0, 5339.0, 2209.0, 947.0, 451.0, 268.0, 150.0, 91.0, 68.0, 36.0, 35.0, 18.0, 11.0, 10.0, 12.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0149078369140625, -0.014374971389770508, -0.013842105865478516, -0.013309240341186523, -0.012776374816894531, -0.012243509292602539, -0.011710643768310547, -0.011177778244018555, -0.010644912719726562, -0.01011204719543457, -0.009579181671142578, -0.009046316146850586, -0.008513450622558594, -0.007980585098266602, -0.007447719573974609, -0.006914854049682617, -0.006381988525390625, -0.005849123001098633, -0.005316257476806641, -0.0047833919525146484, -0.004250526428222656, -0.003717660903930664, -0.003184795379638672, -0.0026519298553466797, -0.0021190643310546875, -0.0015861988067626953, -0.0010533332824707031, -0.0005204677581787109, 1.239776611328125e-05, 0.0005452632904052734, 0.0010781288146972656, 0.0016109943389892578, 0.00214385986328125, 0.002676725387573242, 0.0032095909118652344, 0.0037424564361572266, 0.004275321960449219, 0.004808187484741211, 0.005341053009033203, 0.005873918533325195, 0.0064067840576171875, 0.00693964958190918, 0.007472515106201172, 0.008005380630493164, 0.008538246154785156, 0.009071111679077148, 0.00960397720336914, 0.010136842727661133, 0.010669708251953125, 0.011202573776245117, 0.01173543930053711, 0.012268304824829102, 0.012801170349121094, 0.013334035873413086, 0.013866901397705078, 0.01439976692199707, 0.014932632446289062, 0.015465497970581055, 0.015998363494873047, 0.01653122901916504, 0.01706409454345703, 0.017596960067749023, 0.018129825592041016, 0.018662691116333008, 0.019195556640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 7.0, 7.0, 7.0, 30.0, 30.0, 29.0, 47.0, 45.0, 66.0, 67.0, 98.0, 91.0, 88.0, 75.0, 48.0, 43.0, 39.0, 18.0, 22.0, 17.0, 14.0, 16.0, 11.0, 10.0, 11.0, 8.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008575439453125, -0.008283019065856934, -0.007990598678588867, -0.007698178291320801, -0.007405757904052734, -0.007113337516784668, -0.0068209171295166016, -0.006528496742248535, -0.006236076354980469, -0.005943655967712402, -0.005651235580444336, -0.0053588151931762695, -0.005066394805908203, -0.004773974418640137, -0.00448155403137207, -0.004189133644104004, -0.0038967132568359375, -0.003604292869567871, -0.0033118724822998047, -0.0030194520950317383, -0.002727031707763672, -0.0024346113204956055, -0.002142190933227539, -0.0018497705459594727, -0.0015573501586914062, -0.0012649297714233398, -0.0009725093841552734, -0.000680088996887207, -0.0003876686096191406, -9.524822235107422e-05, 0.0001971721649169922, 0.0004895925521850586, 0.000782012939453125, 0.0010744333267211914, 0.0013668537139892578, 0.0016592741012573242, 0.0019516944885253906, 0.002244114875793457, 0.0025365352630615234, 0.00282895565032959, 0.0031213760375976562, 0.0034137964248657227, 0.003706216812133789, 0.0039986371994018555, 0.004291057586669922, 0.004583477973937988, 0.004875898361206055, 0.005168318748474121, 0.0054607391357421875, 0.005753159523010254, 0.00604557991027832, 0.006338000297546387, 0.006630420684814453, 0.0069228410720825195, 0.007215261459350586, 0.007507681846618652, 0.007800102233886719, 0.008092522621154785, 0.008384943008422852, 0.008677363395690918, 0.008969783782958984, 0.00926220417022705, 0.009554624557495117, 0.009847044944763184, 0.01013946533203125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 11.0, 19.0, 294.0, 635.0, 48.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12614059448242188, -0.10892495512962341, -0.09170930832624435, -0.0744936615228653, -0.057278022170066833, -0.04006238281726837, -0.022846736013889313, -0.005631089210510254, 0.011584550142288208, 0.02880019322037697, 0.04601583629846573, 0.06323148310184479, 0.08044712245464325, 0.09766276180744171, 0.11487840861082077, 0.13209405541419983, 0.1493096947669983, 0.16652533411979675, 0.18374097347259521, 0.20095662772655487, 0.21817226707935333, 0.2353879064321518, 0.25260356068611145, 0.2698192000389099, 0.2870348393917084, 0.30425047874450684, 0.3214661180973053, 0.33868175745010376, 0.3558974266052246, 0.3731130361557007, 0.39032870531082153, 0.40754434466362, 0.42475998401641846, 0.4419756233692169, 0.4591912627220154, 0.47640690207481384, 0.4936225414276123, 0.5108382105827332, 0.5280538201332092, 0.5452694892883301, 0.5624850988388062, 0.579700767993927, 0.5969163775444031, 0.6141320466995239, 0.63134765625, 0.6485633254051208, 0.6657789349555969, 0.6829946041107178, 0.7002102732658386, 0.7174259424209595, 0.7346415519714355, 0.7518572211265564, 0.7690728306770325, 0.7862884998321533, 0.8035041093826294, 0.8207197785377502, 0.8379354476928711, 0.8551511168479919, 0.872366726398468, 0.8895823955535889, 0.9067980051040649, 0.9240136742591858, 0.9412292838096619, 0.9584449529647827, 0.9756605625152588]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 5.0, 12.0, 7.0, 8.0, 14.0, 17.0, 11.0, 15.0, 21.0, 20.0, 20.0, 26.0, 38.0, 33.0, 34.0, 35.0, 38.0, 33.0, 50.0, 36.0, 37.0, 50.0, 41.0, 35.0, 40.0, 43.0, 34.0, 34.0, 32.0, 29.0, 20.0, 18.0, 30.0, 15.0, 11.0, 6.0, 11.0, 10.0, 8.0, 11.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08181983232498169, -0.07927834987640381, -0.07673685997724533, -0.07419537752866745, -0.07165388762950897, -0.06911240518093109, -0.06657092273235321, -0.06402944028377533, -0.06148795038461685, -0.05894646421074867, -0.05640497803688049, -0.05386349558830261, -0.05132200941443443, -0.048780523240566254, -0.04623904079198837, -0.043697554618120193, -0.041156068444252014, -0.038614582270383835, -0.036073096096515656, -0.033531613647937775, -0.030990127474069595, -0.028448641300201416, -0.025907156988978386, -0.023365672677755356, -0.020824186503887177, -0.018282700330018997, -0.015741216018795967, -0.013199730776250362, -0.010658245533704758, -0.008116760291159153, -0.005575275048613548, -0.003033790737390518, -0.0004923045635223389, 0.002049180679023266, 0.0045906659215688705, 0.007132151164114475, 0.00967363640666008, 0.012215121649205685, 0.01475660689175129, 0.01729809120297432, 0.0198395773768425, 0.022381063550710678, 0.024922547861933708, 0.02746403217315674, 0.030005518347024918, 0.0325470045208931, 0.03508848696947098, 0.03762997314333916, 0.040171459317207336, 0.042712945491075516, 0.045254431664943695, 0.047795914113521576, 0.050337400287389755, 0.052878886461257935, 0.055420368909835815, 0.057961855083703995, 0.060503341257572174, 0.06304482370615005, 0.06558631360530853, 0.06812779605388641, 0.0706692785024643, 0.07321076840162277, 0.07575225085020065, 0.07829374074935913, 0.08083522319793701]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 11.0, 19.0, 42.0, 72.0, 129.0, 464.0, 1304.0, 3211.0, 6013.0, 29229.0, 3872487.0, 265261.0, 10142.0, 3340.0, 1143.0, 787.0, 273.0, 134.0, 58.0, 45.0, 21.0, 22.0, 16.0, 8.0, 11.0, 2.0, 10.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06610107421875, -0.06414270401000977, -0.06218433380126953, -0.0602259635925293, -0.05826759338378906, -0.05630922317504883, -0.054350852966308594, -0.05239248275756836, -0.050434112548828125, -0.04847574234008789, -0.046517372131347656, -0.04455900192260742, -0.04260063171386719, -0.04064226150512695, -0.03868389129638672, -0.036725521087646484, -0.03476715087890625, -0.032808780670166016, -0.03085041046142578, -0.028892040252685547, -0.026933670043945312, -0.024975299835205078, -0.023016929626464844, -0.02105855941772461, -0.019100189208984375, -0.01714181900024414, -0.015183448791503906, -0.013225078582763672, -0.011266708374023438, -0.009308338165283203, -0.007349967956542969, -0.005391597747802734, -0.0034332275390625, -0.0014748573303222656, 0.00048351287841796875, 0.002441883087158203, 0.0044002532958984375, 0.006358623504638672, 0.008316993713378906, 0.01027536392211914, 0.012233734130859375, 0.01419210433959961, 0.016150474548339844, 0.018108844757080078, 0.020067214965820312, 0.022025585174560547, 0.02398395538330078, 0.025942325592041016, 0.02790069580078125, 0.029859066009521484, 0.03181743621826172, 0.03377580642700195, 0.03573417663574219, 0.03769254684448242, 0.039650917053222656, 0.04160928726196289, 0.043567657470703125, 0.04552602767944336, 0.047484397888183594, 0.04944276809692383, 0.05140113830566406, 0.0533595085144043, 0.05531787872314453, 0.057276248931884766, 0.059234619140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 13.0, 47.0, 213.0, 406.0, 245.0, 62.0, 12.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06490135192871094, -0.06284713745117188, -0.06079292297363281, -0.05873870849609375, -0.05668449401855469, -0.054630279541015625, -0.05257606506347656, -0.0505218505859375, -0.04846763610839844, -0.046413421630859375, -0.04435920715332031, -0.04230499267578125, -0.04025077819824219, -0.038196563720703125, -0.03614234924316406, -0.034088134765625, -0.03203392028808594, -0.029979705810546875, -0.027925491333007812, -0.02587127685546875, -0.023817062377929688, -0.021762847900390625, -0.019708633422851562, -0.0176544189453125, -0.015600204467773438, -0.013545989990234375, -0.011491775512695312, -0.00943756103515625, -0.0073833465576171875, -0.005329132080078125, -0.0032749176025390625, -0.001220703125, 0.0008335113525390625, 0.002887725830078125, 0.0049419403076171875, 0.00699615478515625, 0.009050369262695312, 0.011104583740234375, 0.013158798217773438, 0.0152130126953125, 0.017267227172851562, 0.019321441650390625, 0.021375656127929688, 0.02342987060546875, 0.025484085083007812, 0.027538299560546875, 0.029592514038085938, 0.031646728515625, 0.03370094299316406, 0.035755157470703125, 0.03780937194824219, 0.03986358642578125, 0.04191780090332031, 0.043972015380859375, 0.04602622985839844, 0.0480804443359375, 0.05013465881347656, 0.052188873291015625, 0.05424308776855469, 0.05629730224609375, 0.05835151672363281, 0.060405731201171875, 0.06245994567871094, 0.06451416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 26.0, 46.0, 74.0, 202.0, 581.0, 2281.0, 23919.0, 3407433.0, 745327.0, 12177.0, 1522.0, 413.0, 160.0, 58.0, 28.0, 14.0, 9.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046905517578125, -0.045223236083984375, -0.04354095458984375, -0.041858673095703125, -0.0401763916015625, -0.038494110107421875, -0.03681182861328125, -0.035129547119140625, -0.033447265625, -0.031764984130859375, -0.03008270263671875, -0.028400421142578125, -0.0267181396484375, -0.025035858154296875, -0.02335357666015625, -0.021671295166015625, -0.019989013671875, -0.018306732177734375, -0.01662445068359375, -0.014942169189453125, -0.0132598876953125, -0.011577606201171875, -0.00989532470703125, -0.008213043212890625, -0.00653076171875, -0.004848480224609375, -0.00316619873046875, -0.001483917236328125, 0.0001983642578125, 0.001880645751953125, 0.00356292724609375, 0.005245208740234375, 0.006927490234375, 0.008609771728515625, 0.01029205322265625, 0.011974334716796875, 0.0136566162109375, 0.015338897705078125, 0.01702117919921875, 0.018703460693359375, 0.0203857421875, 0.022068023681640625, 0.02375030517578125, 0.025432586669921875, 0.0271148681640625, 0.028797149658203125, 0.03047943115234375, 0.032161712646484375, 0.033843994140625, 0.035526275634765625, 0.03720855712890625, 0.038890838623046875, 0.0405731201171875, 0.042255401611328125, 0.04393768310546875, 0.045619964599609375, 0.04730224609375, 0.048984527587890625, 0.05066680908203125, 0.052349090576171875, 0.0540313720703125, 0.055713653564453125, 0.05739593505859375, 0.059078216552734375, 0.060760498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 12.0, 25.0, 61.0, 131.0, 338.0, 1127.0, 1467.0, 514.0, 204.0, 89.0, 52.0, 23.0, 13.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.04829120635986328, -0.04699134826660156, -0.045691490173339844, -0.044391632080078125, -0.043091773986816406, -0.04179191589355469, -0.04049205780029297, -0.03919219970703125, -0.03789234161376953, -0.03659248352050781, -0.035292625427246094, -0.033992767333984375, -0.032692909240722656, -0.03139305114746094, -0.03009319305419922, -0.0287933349609375, -0.02749347686767578, -0.026193618774414062, -0.024893760681152344, -0.023593902587890625, -0.022294044494628906, -0.020994186401367188, -0.01969432830810547, -0.01839447021484375, -0.01709461212158203, -0.015794754028320312, -0.014494895935058594, -0.013195037841796875, -0.011895179748535156, -0.010595321655273438, -0.009295463562011719, -0.00799560546875, -0.006695747375488281, -0.0053958892822265625, -0.004096031188964844, -0.002796173095703125, -0.0014963150024414062, -0.0001964569091796875, 0.0011034011840820312, 0.00240325927734375, 0.0037031173706054688, 0.0050029754638671875, 0.006302833557128906, 0.007602691650390625, 0.008902549743652344, 0.010202407836914062, 0.011502265930175781, 0.0128021240234375, 0.014101982116699219, 0.015401840209960938, 0.016701698303222656, 0.018001556396484375, 0.019301414489746094, 0.020601272583007812, 0.02190113067626953, 0.02320098876953125, 0.02450084686279297, 0.025800704956054688, 0.027100563049316406, 0.028400421142578125, 0.029700279235839844, 0.031000137329101562, 0.03229999542236328, 0.033599853515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 13.0, 184.0, 698.0, 102.0, 9.0, 2.0, 2.0, 2.0], "bins": [-0.8547520041465759, -0.840095043182373, -0.8254380226135254, -0.8107810616493225, -0.7961240410804749, -0.781467080116272, -0.7668100595474243, -0.7521530985832214, -0.7374961376190186, -0.7228391766548157, -0.708182156085968, -0.6935251951217651, -0.6788681745529175, -0.6642112135887146, -0.6495541930198669, -0.6348972320556641, -0.6202402114868164, -0.6055832505226135, -0.5909262299537659, -0.576269268989563, -0.5616122484207153, -0.5469552874565125, -0.5322982668876648, -0.5176413059234619, -0.5029842853546143, -0.488327294588089, -0.4736703038215637, -0.45901331305503845, -0.4443563222885132, -0.4296993613243103, -0.41504237055778503, -0.40038537979125977, -0.3857284486293793, -0.371071457862854, -0.35641446709632874, -0.34175747632980347, -0.3271005153656006, -0.31244349479675293, -0.29778653383255005, -0.2831295430660248, -0.2684725522994995, -0.25381556153297424, -0.23915857076644897, -0.2245015949010849, -0.20984460413455963, -0.19518761336803436, -0.1805306375026703, -0.16587364673614502, -0.15121665596961975, -0.13655966520309448, -0.12190268188714981, -0.10724569857120514, -0.09258870780467987, -0.0779317170381546, -0.06327473372220993, -0.04861775040626526, -0.03396075963973999, -0.01930377259850502, -0.00464678555727005, 0.01001020148396492, 0.02466718852519989, 0.03932417929172516, 0.05398116260766983, 0.0686381459236145, 0.08329513669013977]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 5.0, 8.0, 15.0, 22.0, 21.0, 28.0, 30.0, 18.0, 35.0, 43.0, 52.0, 58.0, 46.0, 49.0, 59.0, 65.0, 52.0, 42.0, 41.0, 53.0, 42.0, 36.0, 33.0, 35.0, 19.0, 25.0, 11.0, 13.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06521707773208618, -0.06319104135036469, -0.06116500496864319, -0.05913896486163139, -0.0571129284799099, -0.0550868920981884, -0.053060851991176605, -0.05103481560945511, -0.04900877922773361, -0.046982742846012115, -0.04495670646429062, -0.042930666357278824, -0.04090462997555733, -0.03887859359383583, -0.036852553486824036, -0.03482651710510254, -0.03280048072338104, -0.030774444341659546, -0.0287484060972929, -0.026722367852926254, -0.024696331471204758, -0.02267029508948326, -0.020644256845116615, -0.01861821860074997, -0.016592182219028473, -0.014566144905984402, -0.01254010759294033, -0.01051407027989626, -0.008488032966852188, -0.006461995653808117, -0.004435958340764046, -0.0024099210277199745, -0.0003838837146759033, 0.0016421535983681679, 0.003668190911412239, 0.00569422822445631, 0.0077202655375003815, 0.009746302850544453, 0.011772340163588524, 0.013798377476632595, 0.015824414789676666, 0.017850451171398163, 0.01987648941576481, 0.021902527660131454, 0.02392856404185295, 0.025954600423574448, 0.027980638667941093, 0.03000667691230774, 0.032032713294029236, 0.03405874967575073, 0.03608478605747223, 0.038110826164484024, 0.04013686254620552, 0.04216289892792702, 0.04418893903493881, 0.04621497541666031, 0.048241011798381805, 0.0502670481801033, 0.0522930845618248, 0.054319124668836594, 0.05634516105055809, 0.05837119743227959, 0.06039723753929138, 0.06242327392101288, 0.06444931030273438]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 11.0, 13.0, 16.0, 15.0, 23.0, 33.0, 47.0, 62.0, 62.0, 87.0, 141.0, 179.0, 265.0, 394.0, 588.0, 1060.0, 2630.0, 20877.0, 507024.0, 489384.0, 19998.0, 2688.0, 1035.0, 564.0, 364.0, 248.0, 174.0, 121.0, 114.0, 75.0, 72.0, 51.0, 43.0, 30.0, 14.0, 11.0, 14.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06298828125, -0.061135292053222656, -0.05928230285644531, -0.05742931365966797, -0.055576324462890625, -0.05372333526611328, -0.05187034606933594, -0.050017356872558594, -0.04816436767578125, -0.046311378479003906, -0.04445838928222656, -0.04260540008544922, -0.040752410888671875, -0.03889942169189453, -0.03704643249511719, -0.035193443298339844, -0.0333404541015625, -0.031487464904785156, -0.029634475708007812, -0.02778148651123047, -0.025928497314453125, -0.02407550811767578, -0.022222518920898438, -0.020369529724121094, -0.01851654052734375, -0.016663551330566406, -0.014810562133789062, -0.012957572937011719, -0.011104583740234375, -0.009251594543457031, -0.0073986053466796875, -0.005545616149902344, -0.003692626953125, -0.0018396377563476562, 1.33514404296875e-05, 0.0018663406372070312, 0.003719329833984375, 0.005572319030761719, 0.0074253082275390625, 0.009278297424316406, 0.01113128662109375, 0.012984275817871094, 0.014837265014648438, 0.01669025421142578, 0.018543243408203125, 0.02039623260498047, 0.022249221801757812, 0.024102210998535156, 0.0259552001953125, 0.027808189392089844, 0.029661178588867188, 0.03151416778564453, 0.033367156982421875, 0.03522014617919922, 0.03707313537597656, 0.038926124572753906, 0.04077911376953125, 0.042632102966308594, 0.04448509216308594, 0.04633808135986328, 0.048191070556640625, 0.05004405975341797, 0.05189704895019531, 0.053750038146972656, 0.05560302734375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 36.0, 138.0, 356.0, 326.0, 117.0, 15.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.0637974739074707, -0.061799049377441406, -0.05980062484741211, -0.05780220031738281, -0.055803775787353516, -0.05380535125732422, -0.05180692672729492, -0.049808502197265625, -0.04781007766723633, -0.04581165313720703, -0.043813228607177734, -0.04181480407714844, -0.03981637954711914, -0.037817955017089844, -0.03581953048706055, -0.03382110595703125, -0.03182268142700195, -0.029824256896972656, -0.02782583236694336, -0.025827407836914062, -0.023828983306884766, -0.02183055877685547, -0.019832134246826172, -0.017833709716796875, -0.015835285186767578, -0.013836860656738281, -0.011838436126708984, -0.009840011596679688, -0.00784158706665039, -0.005843162536621094, -0.003844738006591797, -0.0018463134765625, 0.00015211105346679688, 0.0021505355834960938, 0.004148960113525391, 0.0061473846435546875, 0.008145809173583984, 0.010144233703613281, 0.012142658233642578, 0.014141082763671875, 0.016139507293701172, 0.01813793182373047, 0.020136356353759766, 0.022134780883789062, 0.02413320541381836, 0.026131629943847656, 0.028130054473876953, 0.03012847900390625, 0.03212690353393555, 0.034125328063964844, 0.03612375259399414, 0.03812217712402344, 0.040120601654052734, 0.04211902618408203, 0.04411745071411133, 0.046115875244140625, 0.04811429977416992, 0.05011272430419922, 0.052111148834228516, 0.05410957336425781, 0.05610799789428711, 0.058106422424316406, 0.0601048469543457, 0.062103271484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 8.0, 10.0, 9.0, 35.0, 25.0, 44.0, 35.0, 72.0, 81.0, 106.0, 160.0, 322.0, 699.0, 2612.0, 21797.0, 308368.0, 642027.0, 64184.0, 5609.0, 1144.0, 422.0, 252.0, 124.0, 97.0, 74.0, 37.0, 37.0, 39.0, 23.0, 15.0, 19.0, 18.0, 7.0, 8.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.03753042221069336, -0.03615093231201172, -0.03477144241333008, -0.03339195251464844, -0.0320124626159668, -0.030632972717285156, -0.029253482818603516, -0.027873992919921875, -0.026494503021240234, -0.025115013122558594, -0.023735523223876953, -0.022356033325195312, -0.020976543426513672, -0.01959705352783203, -0.01821756362915039, -0.01683807373046875, -0.01545858383178711, -0.014079093933105469, -0.012699604034423828, -0.011320114135742188, -0.009940624237060547, -0.008561134338378906, -0.007181644439697266, -0.005802154541015625, -0.004422664642333984, -0.0030431747436523438, -0.0016636848449707031, -0.0002841949462890625, 0.0010952949523925781, 0.0024747848510742188, 0.0038542747497558594, 0.0052337646484375, 0.006613254547119141, 0.007992744445800781, 0.009372234344482422, 0.010751724243164062, 0.012131214141845703, 0.013510704040527344, 0.014890193939208984, 0.016269683837890625, 0.017649173736572266, 0.019028663635253906, 0.020408153533935547, 0.021787643432617188, 0.023167133331298828, 0.02454662322998047, 0.02592611312866211, 0.02730560302734375, 0.02868509292602539, 0.03006458282470703, 0.03144407272338867, 0.03282356262207031, 0.03420305252075195, 0.035582542419433594, 0.036962032318115234, 0.038341522216796875, 0.039721012115478516, 0.041100502014160156, 0.0424799919128418, 0.04385948181152344, 0.04523897171020508, 0.04661846160888672, 0.04799795150756836, 0.04937744140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 8.0, 10.0, 6.0, 13.0, 14.0, 12.0, 24.0, 25.0, 25.0, 38.0, 43.0, 42.0, 45.0, 40.0, 42.0, 59.0, 54.0, 59.0, 45.0, 46.0, 49.0, 46.0, 34.0, 37.0, 34.0, 32.0, 21.0, 15.0, 23.0, 11.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.033660888671875, -0.03272652626037598, -0.03179216384887695, -0.03085780143737793, -0.029923439025878906, -0.028989076614379883, -0.02805471420288086, -0.027120351791381836, -0.026185989379882812, -0.02525162696838379, -0.024317264556884766, -0.023382902145385742, -0.02244853973388672, -0.021514177322387695, -0.020579814910888672, -0.01964545249938965, -0.018711090087890625, -0.0177767276763916, -0.016842365264892578, -0.015908002853393555, -0.014973640441894531, -0.014039278030395508, -0.013104915618896484, -0.012170553207397461, -0.011236190795898438, -0.010301828384399414, -0.00936746597290039, -0.008433103561401367, -0.007498741149902344, -0.00656437873840332, -0.005630016326904297, -0.0046956539154052734, -0.00376129150390625, -0.0028269290924072266, -0.0018925666809082031, -0.0009582042694091797, -2.384185791015625e-05, 0.0009105205535888672, 0.0018448829650878906, 0.002779245376586914, 0.0037136077880859375, 0.004647970199584961, 0.005582332611083984, 0.006516695022583008, 0.007451057434082031, 0.008385419845581055, 0.009319782257080078, 0.010254144668579102, 0.011188507080078125, 0.012122869491577148, 0.013057231903076172, 0.013991594314575195, 0.014925956726074219, 0.015860319137573242, 0.016794681549072266, 0.01772904396057129, 0.018663406372070312, 0.019597768783569336, 0.02053213119506836, 0.021466493606567383, 0.022400856018066406, 0.02333521842956543, 0.024269580841064453, 0.025203943252563477, 0.0261383056640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 19.0, 22.0, 42.0, 78.0, 161.0, 310.0, 702.0, 1620.0, 4639.0, 14851.0, 74813.0, 653321.0, 252636.0, 32245.0, 8290.0, 2733.0, 1079.0, 470.0, 224.0, 132.0, 64.0, 33.0, 15.0, 10.0, 12.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0175323486328125, -0.017013072967529297, -0.016493797302246094, -0.01597452163696289, -0.015455245971679688, -0.014935970306396484, -0.014416694641113281, -0.013897418975830078, -0.013378143310546875, -0.012858867645263672, -0.012339591979980469, -0.011820316314697266, -0.011301040649414062, -0.01078176498413086, -0.010262489318847656, -0.009743213653564453, -0.00922393798828125, -0.008704662322998047, -0.008185386657714844, -0.007666110992431641, -0.0071468353271484375, -0.006627559661865234, -0.006108283996582031, -0.005589008331298828, -0.005069732666015625, -0.004550457000732422, -0.004031181335449219, -0.0035119056701660156, -0.0029926300048828125, -0.0024733543395996094, -0.0019540786743164062, -0.0014348030090332031, -0.00091552734375, -0.0003962516784667969, 0.00012302398681640625, 0.0006422996520996094, 0.0011615753173828125, 0.0016808509826660156, 0.0022001266479492188, 0.002719402313232422, 0.003238677978515625, 0.003757953643798828, 0.004277229309082031, 0.004796504974365234, 0.0053157806396484375, 0.005835056304931641, 0.006354331970214844, 0.006873607635498047, 0.00739288330078125, 0.007912158966064453, 0.008431434631347656, 0.00895071029663086, 0.009469985961914062, 0.009989261627197266, 0.010508537292480469, 0.011027812957763672, 0.011547088623046875, 0.012066364288330078, 0.012585639953613281, 0.013104915618896484, 0.013624191284179688, 0.01414346694946289, 0.014662742614746094, 0.015182018280029297, 0.0157012939453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 4.0, 8.0, 8.0, 13.0, 18.0, 24.0, 30.0, 41.0, 32.0, 61.0, 80.0, 80.0, 79.0, 79.0, 77.0, 77.0, 53.0, 47.0, 47.0, 38.0, 23.0, 18.0, 12.0, 15.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4836273193359375e-05, -5.3009018301963806e-05, -5.118176341056824e-05, -4.935450851917267e-05, -4.75272536277771e-05, -4.569999873638153e-05, -4.387274384498596e-05, -4.204548895359039e-05, -4.0218234062194824e-05, -3.8390979170799255e-05, -3.6563724279403687e-05, -3.473646938800812e-05, -3.290921449661255e-05, -3.108195960521698e-05, -2.925470471382141e-05, -2.7427449822425842e-05, -2.5600194931030273e-05, -2.3772940039634705e-05, -2.1945685148239136e-05, -2.0118430256843567e-05, -1.8291175365447998e-05, -1.646392047405243e-05, -1.463666558265686e-05, -1.2809410691261292e-05, -1.0982155799865723e-05, -9.154900908470154e-06, -7.327646017074585e-06, -5.500391125679016e-06, -3.6731362342834473e-06, -1.8458813428878784e-06, -1.862645149230957e-08, 1.8086284399032593e-06, 3.635883331298828e-06, 5.463138222694397e-06, 7.290393114089966e-06, 9.117648005485535e-06, 1.0944902896881104e-05, 1.2772157788276672e-05, 1.4599412679672241e-05, 1.642666757106781e-05, 1.825392246246338e-05, 2.0081177353858948e-05, 2.1908432245254517e-05, 2.3735687136650085e-05, 2.5562942028045654e-05, 2.7390196919441223e-05, 2.9217451810836792e-05, 3.104470670223236e-05, 3.287196159362793e-05, 3.46992164850235e-05, 3.652647137641907e-05, 3.8353726267814636e-05, 4.0180981159210205e-05, 4.2008236050605774e-05, 4.383549094200134e-05, 4.566274583339691e-05, 4.749000072479248e-05, 4.931725561618805e-05, 5.114451050758362e-05, 5.297176539897919e-05, 5.4799020290374756e-05, 5.6626275181770325e-05, 5.8453530073165894e-05, 6.028078496456146e-05, 6.210803985595703e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 9.0, 8.0, 14.0, 25.0, 31.0, 41.0, 74.0, 138.0, 251.0, 733.0, 1864.0, 5236.0, 18493.0, 132331.0, 768799.0, 97500.0, 15409.0, 4660.0, 1642.0, 673.0, 283.0, 138.0, 78.0, 44.0, 22.0, 10.0, 15.0, 5.0, 6.0, 1.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185089111328125, -0.01788020133972168, -0.01725149154663086, -0.01662278175354004, -0.01599407196044922, -0.015365362167358398, -0.014736652374267578, -0.014107942581176758, -0.013479232788085938, -0.012850522994995117, -0.012221813201904297, -0.011593103408813477, -0.010964393615722656, -0.010335683822631836, -0.009706974029541016, -0.009078264236450195, -0.008449554443359375, -0.007820844650268555, -0.007192134857177734, -0.006563425064086914, -0.005934715270996094, -0.0053060054779052734, -0.004677295684814453, -0.004048585891723633, -0.0034198760986328125, -0.002791166305541992, -0.002162456512451172, -0.0015337467193603516, -0.0009050369262695312, -0.00027632713317871094, 0.0003523826599121094, 0.0009810924530029297, 0.00160980224609375, 0.0022385120391845703, 0.0028672218322753906, 0.003495931625366211, 0.004124641418457031, 0.0047533512115478516, 0.005382061004638672, 0.006010770797729492, 0.0066394805908203125, 0.007268190383911133, 0.007896900177001953, 0.008525609970092773, 0.009154319763183594, 0.009783029556274414, 0.010411739349365234, 0.011040449142456055, 0.011669158935546875, 0.012297868728637695, 0.012926578521728516, 0.013555288314819336, 0.014183998107910156, 0.014812707901000977, 0.015441417694091797, 0.016070127487182617, 0.016698837280273438, 0.017327547073364258, 0.017956256866455078, 0.0185849666595459, 0.01921367645263672, 0.01984238624572754, 0.02047109603881836, 0.02109980583190918, 0.021728515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 8.0, 9.0, 8.0, 19.0, 18.0, 19.0, 34.0, 43.0, 58.0, 72.0, 96.0, 107.0, 123.0, 103.0, 62.0, 46.0, 49.0, 25.0, 13.0, 18.0, 13.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01291656494140625, -0.01257479190826416, -0.01223301887512207, -0.01189124584197998, -0.01154947280883789, -0.0112076997756958, -0.010865926742553711, -0.010524153709411621, -0.010182380676269531, -0.009840607643127441, -0.009498834609985352, -0.009157061576843262, -0.008815288543701172, -0.008473515510559082, -0.008131742477416992, -0.007789969444274902, -0.0074481964111328125, -0.007106423377990723, -0.006764650344848633, -0.006422877311706543, -0.006081104278564453, -0.005739331245422363, -0.0053975582122802734, -0.005055785179138184, -0.004714012145996094, -0.004372239112854004, -0.004030466079711914, -0.0036886930465698242, -0.0033469200134277344, -0.0030051469802856445, -0.0026633739471435547, -0.002321600914001465, -0.001979827880859375, -0.0016380548477172852, -0.0012962818145751953, -0.0009545087814331055, -0.0006127357482910156, -0.0002709627151489258, 7.081031799316406e-05, 0.0004125833511352539, 0.0007543563842773438, 0.0010961294174194336, 0.0014379024505615234, 0.0017796754837036133, 0.002121448516845703, 0.002463221549987793, 0.002804994583129883, 0.0031467676162719727, 0.0034885406494140625, 0.0038303136825561523, 0.004172086715698242, 0.004513859748840332, 0.004855632781982422, 0.005197405815124512, 0.0055391788482666016, 0.005880951881408691, 0.006222724914550781, 0.006564497947692871, 0.006906270980834961, 0.007248044013977051, 0.007589817047119141, 0.00793159008026123, 0.00827336311340332, 0.00861513614654541, 0.0089569091796875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 46.0, 428.0, 467.0, 50.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8015698194503784, -0.7867310047149658, -0.7718921303749084, -0.7570532560348511, -0.7422144412994385, -0.7273756265640259, -0.7125367522239685, -0.6976978778839111, -0.6828590631484985, -0.6680202484130859, -0.6531813740730286, -0.6383424997329712, -0.6235036849975586, -0.608664870262146, -0.5938259959220886, -0.5789871215820312, -0.5641483068466187, -0.549309492111206, -0.5344706177711487, -0.5196317434310913, -0.5047929286956787, -0.4899540841579437, -0.47511523962020874, -0.46027639508247375, -0.44543755054473877, -0.4305987060070038, -0.4157598614692688, -0.4009210169315338, -0.38608217239379883, -0.37124332785606384, -0.35640448331832886, -0.34156563878059387, -0.3267267942428589, -0.3118879497051239, -0.2970491051673889, -0.28221026062965393, -0.26737141609191895, -0.25253257155418396, -0.23769372701644897, -0.222854882478714, -0.2080160528421402, -0.1931772083044052, -0.17833836376667023, -0.16349951922893524, -0.14866067469120026, -0.13382183015346527, -0.11898298561573029, -0.1041441410779953, -0.08930529654026031, -0.07446645200252533, -0.059627607464790344, -0.04478876292705536, -0.029949918389320374, -0.015111073851585388, -0.00027222931385040283, 0.014566615223884583, 0.029405459761619568, 0.04424430429935455, 0.05908314883708954, 0.07392199337482452, 0.08876083791255951, 0.1035996824502945, 0.11843852698802948, 0.13327737152576447, 0.14811621606349945]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 4.0, 8.0, 2.0, 11.0, 13.0, 17.0, 11.0, 17.0, 11.0, 21.0, 23.0, 27.0, 37.0, 32.0, 35.0, 29.0, 33.0, 38.0, 33.0, 49.0, 53.0, 32.0, 28.0, 34.0, 37.0, 32.0, 37.0, 33.0, 26.0, 25.0, 33.0, 20.0, 30.0, 25.0, 14.0, 15.0, 17.0, 9.0, 3.0, 8.0, 8.0, 2.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061264991760253906, -0.05924972519278526, -0.05723445862531662, -0.05521918833255768, -0.053203921765089035, -0.05118865519762039, -0.04917338490486145, -0.04715811833739281, -0.045142851769924164, -0.04312758520245552, -0.04111231863498688, -0.039097048342227936, -0.03708178177475929, -0.03506651520729065, -0.03305124491453171, -0.031035978347063065, -0.02902071177959442, -0.027005445212125778, -0.024990176782011986, -0.022974908351898193, -0.02095964178442955, -0.018944375216960907, -0.016929106786847115, -0.014913839288055897, -0.012898571789264679, -0.010883304290473461, -0.008868036791682243, -0.0068527692928910255, -0.004837501794099808, -0.00282223429530859, -0.0008069667965173721, 0.0012083007022738457, 0.0032235682010650635, 0.005238835699856281, 0.007254103198647499, 0.009269370697438717, 0.011284638196229935, 0.013299905695021152, 0.01531517319381237, 0.017330441623926163, 0.019345708191394806, 0.02136097475886345, 0.02337624318897724, 0.025391511619091034, 0.027406778186559677, 0.02942204475402832, 0.03143731504678726, 0.033452581614255905, 0.03546784818172455, 0.03748311474919319, 0.039498381316661835, 0.041513651609420776, 0.04352891817688942, 0.04554418474435806, 0.047559455037117004, 0.04957472160458565, 0.05158998817205429, 0.053605254739522934, 0.05562052130699158, 0.05763579159975052, 0.05965105816721916, 0.061666324734687805, 0.06368159502744675, 0.06569685786962509, 0.06771212816238403]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 16.0, 10.0, 20.0, 50.0, 78.0, 216.0, 759.0, 1824.0, 2917.0, 5687.0, 47698.0, 4042111.0, 81639.0, 6369.0, 2646.0, 853.0, 597.0, 450.0, 143.0, 59.0, 44.0, 15.0, 18.0, 16.0, 9.0, 4.0, 5.0, 8.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052032470703125, -0.050330162048339844, -0.04862785339355469, -0.04692554473876953, -0.045223236083984375, -0.04352092742919922, -0.04181861877441406, -0.040116310119628906, -0.03841400146484375, -0.036711692810058594, -0.03500938415527344, -0.03330707550048828, -0.031604766845703125, -0.02990245819091797, -0.028200149536132812, -0.026497840881347656, -0.0247955322265625, -0.023093223571777344, -0.021390914916992188, -0.01968860626220703, -0.017986297607421875, -0.01628398895263672, -0.014581680297851562, -0.012879371643066406, -0.01117706298828125, -0.009474754333496094, -0.0077724456787109375, -0.006070137023925781, -0.004367828369140625, -0.0026655197143554688, -0.0009632110595703125, 0.0007390975952148438, 0.00244140625, 0.004143714904785156, 0.0058460235595703125, 0.007548332214355469, 0.009250640869140625, 0.010952949523925781, 0.012655258178710938, 0.014357566833496094, 0.01605987548828125, 0.017762184143066406, 0.019464492797851562, 0.02116680145263672, 0.022869110107421875, 0.02457141876220703, 0.026273727416992188, 0.027976036071777344, 0.0296783447265625, 0.031380653381347656, 0.03308296203613281, 0.03478527069091797, 0.036487579345703125, 0.03818988800048828, 0.03989219665527344, 0.041594505310058594, 0.04329681396484375, 0.044999122619628906, 0.04670143127441406, 0.04840373992919922, 0.050106048583984375, 0.05180835723876953, 0.05351066589355469, 0.055212974548339844, 0.056915283203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 28.0, 114.0, 327.0, 352.0, 143.0, 26.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06903076171875, -0.06700563430786133, -0.06498050689697266, -0.06295537948608398, -0.06093025207519531, -0.05890512466430664, -0.05687999725341797, -0.0548548698425293, -0.052829742431640625, -0.05080461502075195, -0.04877948760986328, -0.04675436019897461, -0.04472923278808594, -0.042704105377197266, -0.040678977966308594, -0.03865385055541992, -0.03662872314453125, -0.03460359573364258, -0.032578468322753906, -0.030553340911865234, -0.028528213500976562, -0.02650308609008789, -0.02447795867919922, -0.022452831268310547, -0.020427703857421875, -0.018402576446533203, -0.01637744903564453, -0.01435232162475586, -0.012327194213867188, -0.010302066802978516, -0.008276939392089844, -0.006251811981201172, -0.0042266845703125, -0.002201557159423828, -0.00017642974853515625, 0.0018486976623535156, 0.0038738250732421875, 0.005898952484130859, 0.007924079895019531, 0.009949207305908203, 0.011974334716796875, 0.013999462127685547, 0.01602458953857422, 0.01804971694946289, 0.020074844360351562, 0.022099971771240234, 0.024125099182128906, 0.026150226593017578, 0.02817535400390625, 0.030200481414794922, 0.032225608825683594, 0.034250736236572266, 0.03627586364746094, 0.03830099105834961, 0.04032611846923828, 0.04235124588012695, 0.044376373291015625, 0.0464015007019043, 0.04842662811279297, 0.05045175552368164, 0.05247688293457031, 0.054502010345458984, 0.056527137756347656, 0.05855226516723633, 0.060577392578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 7.0, 32.0, 73.0, 109.0, 320.0, 1448.0, 24329.0, 4005485.0, 158030.0, 3655.0, 522.0, 157.0, 63.0, 23.0, 10.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.028659343719482422, -0.026709556579589844, -0.024759769439697266, -0.022809982299804688, -0.02086019515991211, -0.01891040802001953, -0.016960620880126953, -0.015010833740234375, -0.013061046600341797, -0.011111259460449219, -0.00916147232055664, -0.0072116851806640625, -0.005261898040771484, -0.0033121109008789062, -0.0013623237609863281, 0.00058746337890625, 0.002537250518798828, 0.004487037658691406, 0.006436824798583984, 0.008386611938476562, 0.01033639907836914, 0.012286186218261719, 0.014235973358154297, 0.016185760498046875, 0.018135547637939453, 0.02008533477783203, 0.02203512191772461, 0.023984909057617188, 0.025934696197509766, 0.027884483337402344, 0.029834270477294922, 0.0317840576171875, 0.03373384475708008, 0.035683631896972656, 0.037633419036865234, 0.03958320617675781, 0.04153299331665039, 0.04348278045654297, 0.04543256759643555, 0.047382354736328125, 0.0493321418762207, 0.05128192901611328, 0.05323171615600586, 0.05518150329589844, 0.057131290435791016, 0.059081077575683594, 0.06103086471557617, 0.06298065185546875, 0.06493043899536133, 0.0668802261352539, 0.06883001327514648, 0.07077980041503906, 0.07272958755493164, 0.07467937469482422, 0.0766291618347168, 0.07857894897460938, 0.08052873611450195, 0.08247852325439453, 0.08442831039428711, 0.08637809753417969, 0.08832788467407227, 0.09027767181396484, 0.09222745895385742, 0.09417724609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 22.0, 54.0, 89.0, 209.0, 715.0, 1823.0, 724.0, 206.0, 97.0, 49.0, 31.0, 16.0, 13.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.041153669357299805, -0.04016256332397461, -0.039171457290649414, -0.03818035125732422, -0.03718924522399902, -0.03619813919067383, -0.03520703315734863, -0.03421592712402344, -0.03322482109069824, -0.03223371505737305, -0.03124260902404785, -0.030251502990722656, -0.02926039695739746, -0.028269290924072266, -0.02727818489074707, -0.026287078857421875, -0.02529597282409668, -0.024304866790771484, -0.02331376075744629, -0.022322654724121094, -0.0213315486907959, -0.020340442657470703, -0.019349336624145508, -0.018358230590820312, -0.017367124557495117, -0.016376018524169922, -0.015384912490844727, -0.014393806457519531, -0.013402700424194336, -0.01241159439086914, -0.011420488357543945, -0.01042938232421875, -0.009438276290893555, -0.00844717025756836, -0.007456064224243164, -0.006464958190917969, -0.0054738521575927734, -0.004482746124267578, -0.003491640090942383, -0.0025005340576171875, -0.0015094280242919922, -0.0005183219909667969, 0.00047278404235839844, 0.0014638900756835938, 0.002454996109008789, 0.0034461021423339844, 0.00443720817565918, 0.005428314208984375, 0.00641942024230957, 0.007410526275634766, 0.008401632308959961, 0.009392738342285156, 0.010383844375610352, 0.011374950408935547, 0.012366056442260742, 0.013357162475585938, 0.014348268508911133, 0.015339374542236328, 0.016330480575561523, 0.01732158660888672, 0.018312692642211914, 0.01930379867553711, 0.020294904708862305, 0.0212860107421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 26.0, 92.0, 252.0, 346.0, 190.0, 63.0, 19.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1307908296585083, -0.12615326046943665, -0.12151569128036499, -0.11687812209129333, -0.11224055290222168, -0.10760298371315002, -0.10296542197465897, -0.09832785278558731, -0.09369028359651566, -0.089052714407444, -0.08441514521837234, -0.07977757602930069, -0.07514001429080963, -0.07050244510173798, -0.06586487591266632, -0.061227306723594666, -0.05658973753452301, -0.051952168345451355, -0.0473145991563797, -0.04267703369259834, -0.03803946450352669, -0.03340189531445503, -0.028764327988028526, -0.02412676066160202, -0.019489191472530365, -0.014851623214781284, -0.010214054957032204, -0.005576486699283123, -0.0009389184415340424, 0.003698650747537613, 0.008336218073964119, 0.012973785400390625, 0.01761135458946228, 0.022248923778533936, 0.02688649110496044, 0.03152405843138695, 0.0361616276204586, 0.04079919680953026, 0.045436762273311615, 0.05007433146238327, 0.054711900651454926, 0.05934946984052658, 0.06398703902959824, 0.06862460821866989, 0.07326216995716095, 0.0778997391462326, 0.08253730833530426, 0.08717487752437592, 0.09181244671344757, 0.09645001590251923, 0.10108758509159088, 0.10572515428066254, 0.11036272346973419, 0.11500029265880585, 0.1196378543972969, 0.12427542358636856, 0.12891298532485962, 0.13355055451393127, 0.13818812370300293, 0.14282569289207458, 0.14746326208114624, 0.1521008312702179, 0.15673840045928955, 0.1613759696483612, 0.16601353883743286]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 2.0, 4.0, 11.0, 6.0, 13.0, 21.0, 19.0, 17.0, 26.0, 17.0, 30.0, 24.0, 30.0, 45.0, 39.0, 51.0, 40.0, 42.0, 44.0, 42.0, 41.0, 32.0, 54.0, 30.0, 34.0, 32.0, 36.0, 29.0, 24.0, 29.0, 23.0, 26.0, 15.0, 11.0, 13.0, 11.0, 11.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0357244610786438, -0.03455135226249695, -0.0333782434463501, -0.03220513090491295, -0.031032022088766098, -0.029858913272619247, -0.028685802593827248, -0.027512691915035248, -0.026339583098888397, -0.025166474282741547, -0.023993363603949547, -0.022820252925157547, -0.021647144109010696, -0.020474035292863846, -0.019300924614071846, -0.018127813935279846, -0.016954705119132996, -0.015781596302986145, -0.014608485624194145, -0.01343537587672472, -0.012262266129255295, -0.01108915638178587, -0.009916046634316444, -0.00874293688684702, -0.007569827139377594, -0.006396717391908169, -0.005223607644438744, -0.004050497896969318, -0.002877388149499893, -0.001704278402030468, -0.0005311686545610428, 0.0006419410929083824, 0.0018150508403778076, 0.002988160587847233, 0.004161270335316658, 0.005334380082786083, 0.006507489830255508, 0.007680599577724934, 0.008853709325194359, 0.010026819072663784, 0.01119992882013321, 0.012373038567602634, 0.01354614831507206, 0.014719258062541485, 0.01589236781001091, 0.01706547662615776, 0.01823858730494976, 0.01941169798374176, 0.02058480679988861, 0.02175791561603546, 0.02293102629482746, 0.02410413697361946, 0.02527724578976631, 0.026450354605913162, 0.027623465284705162, 0.028796575963497162, 0.029969684779644012, 0.031142793595790863, 0.032315902411937714, 0.03348901495337486, 0.03466212376952171, 0.035835232585668564, 0.03700834512710571, 0.038181453943252563, 0.039354562759399414]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 7.0, 10.0, 4.0, 6.0, 18.0, 21.0, 24.0, 36.0, 51.0, 68.0, 73.0, 105.0, 181.0, 224.0, 324.0, 486.0, 701.0, 1285.0, 4094.0, 37281.0, 729895.0, 255639.0, 12761.0, 2290.0, 932.0, 593.0, 372.0, 285.0, 211.0, 147.0, 114.0, 82.0, 71.0, 58.0, 22.0, 19.0, 20.0, 7.0, 12.0, 4.0, 3.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.044921875, -0.04359245300292969, -0.042263031005859375, -0.04093360900878906, -0.03960418701171875, -0.03827476501464844, -0.036945343017578125, -0.03561592102050781, -0.0342864990234375, -0.03295707702636719, -0.031627655029296875, -0.030298233032226562, -0.02896881103515625, -0.027639389038085938, -0.026309967041015625, -0.024980545043945312, -0.023651123046875, -0.022321701049804688, -0.020992279052734375, -0.019662857055664062, -0.01833343505859375, -0.017004013061523438, -0.015674591064453125, -0.014345169067382812, -0.0130157470703125, -0.011686325073242188, -0.010356903076171875, -0.009027481079101562, -0.00769805908203125, -0.0063686370849609375, -0.005039215087890625, -0.0037097930908203125, -0.00238037109375, -0.0010509490966796875, 0.000278472900390625, 0.0016078948974609375, 0.00293731689453125, 0.0042667388916015625, 0.005596160888671875, 0.0069255828857421875, 0.0082550048828125, 0.009584426879882812, 0.010913848876953125, 0.012243270874023438, 0.01357269287109375, 0.014902114868164062, 0.016231536865234375, 0.017560958862304688, 0.018890380859375, 0.020219802856445312, 0.021549224853515625, 0.022878646850585938, 0.02420806884765625, 0.025537490844726562, 0.026866912841796875, 0.028196334838867188, 0.0295257568359375, 0.030855178833007812, 0.032184600830078125, 0.03351402282714844, 0.03484344482421875, 0.03617286682128906, 0.037502288818359375, 0.03883171081542969, 0.0401611328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 16.0, 84.0, 274.0, 366.0, 205.0, 44.0, 9.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0660400390625, -0.06406116485595703, -0.06208229064941406, -0.060103416442871094, -0.058124542236328125, -0.056145668029785156, -0.05416679382324219, -0.05218791961669922, -0.05020904541015625, -0.04823017120361328, -0.04625129699707031, -0.044272422790527344, -0.042293548583984375, -0.040314674377441406, -0.03833580017089844, -0.03635692596435547, -0.0343780517578125, -0.03239917755126953, -0.030420303344726562, -0.028441429138183594, -0.026462554931640625, -0.024483680725097656, -0.022504806518554688, -0.02052593231201172, -0.01854705810546875, -0.01656818389892578, -0.014589309692382812, -0.012610435485839844, -0.010631561279296875, -0.008652687072753906, -0.0066738128662109375, -0.004694938659667969, -0.002716064453125, -0.0007371902465820312, 0.0012416839599609375, 0.0032205581665039062, 0.005199432373046875, 0.007178306579589844, 0.009157180786132812, 0.011136054992675781, 0.01311492919921875, 0.015093803405761719, 0.017072677612304688, 0.019051551818847656, 0.021030426025390625, 0.023009300231933594, 0.024988174438476562, 0.02696704864501953, 0.0289459228515625, 0.03092479705810547, 0.03290367126464844, 0.034882545471191406, 0.036861419677734375, 0.038840293884277344, 0.04081916809082031, 0.04279804229736328, 0.04477691650390625, 0.04675579071044922, 0.04873466491699219, 0.050713539123535156, 0.052692413330078125, 0.054671287536621094, 0.05665016174316406, 0.05862903594970703, 0.06060791015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 8.0, 12.0, 11.0, 16.0, 19.0, 25.0, 32.0, 28.0, 45.0, 60.0, 77.0, 84.0, 118.0, 191.0, 513.0, 2211.0, 30297.0, 689026.0, 312042.0, 11477.0, 1283.0, 319.0, 153.0, 79.0, 95.0, 63.0, 60.0, 39.0, 38.0, 39.0, 17.0, 20.0, 16.0, 11.0, 8.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04284381866455078, -0.04149818420410156, -0.040152549743652344, -0.038806915283203125, -0.037461280822753906, -0.03611564636230469, -0.03477001190185547, -0.03342437744140625, -0.03207874298095703, -0.030733108520507812, -0.029387474060058594, -0.028041839599609375, -0.026696205139160156, -0.025350570678710938, -0.02400493621826172, -0.0226593017578125, -0.02131366729736328, -0.019968032836914062, -0.018622398376464844, -0.017276763916015625, -0.015931129455566406, -0.014585494995117188, -0.013239860534667969, -0.01189422607421875, -0.010548591613769531, -0.009202957153320312, -0.007857322692871094, -0.006511688232421875, -0.005166053771972656, -0.0038204193115234375, -0.0024747848510742188, -0.001129150390625, 0.00021648406982421875, 0.0015621185302734375, 0.0029077529907226562, 0.004253387451171875, 0.005599021911621094, 0.0069446563720703125, 0.008290290832519531, 0.00963592529296875, 0.010981559753417969, 0.012327194213867188, 0.013672828674316406, 0.015018463134765625, 0.016364097595214844, 0.017709732055664062, 0.01905536651611328, 0.0204010009765625, 0.02174663543701172, 0.023092269897460938, 0.024437904357910156, 0.025783538818359375, 0.027129173278808594, 0.028474807739257812, 0.02982044219970703, 0.03116607666015625, 0.03251171112060547, 0.03385734558105469, 0.035202980041503906, 0.036548614501953125, 0.037894248962402344, 0.03923988342285156, 0.04058551788330078, 0.04193115234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 1.0, 8.0, 9.0, 11.0, 10.0, 9.0, 11.0, 21.0, 20.0, 27.0, 32.0, 32.0, 33.0, 36.0, 37.0, 34.0, 48.0, 53.0, 45.0, 55.0, 50.0, 47.0, 40.0, 55.0, 38.0, 44.0, 29.0, 26.0, 33.0, 22.0, 23.0, 9.0, 9.0, 11.0, 7.0, 9.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024993896484375, -0.024166107177734375, -0.02333831787109375, -0.022510528564453125, -0.0216827392578125, -0.020854949951171875, -0.02002716064453125, -0.019199371337890625, -0.01837158203125, -0.017543792724609375, -0.01671600341796875, -0.015888214111328125, -0.0150604248046875, -0.014232635498046875, -0.01340484619140625, -0.012577056884765625, -0.011749267578125, -0.010921478271484375, -0.01009368896484375, -0.009265899658203125, -0.0084381103515625, -0.007610321044921875, -0.00678253173828125, -0.005954742431640625, -0.005126953125, -0.004299163818359375, -0.00347137451171875, -0.002643585205078125, -0.0018157958984375, -0.000988006591796875, -0.00016021728515625, 0.000667572021484375, 0.001495361328125, 0.002323150634765625, 0.00315093994140625, 0.003978729248046875, 0.0048065185546875, 0.005634307861328125, 0.00646209716796875, 0.007289886474609375, 0.00811767578125, 0.008945465087890625, 0.00977325439453125, 0.010601043701171875, 0.0114288330078125, 0.012256622314453125, 0.01308441162109375, 0.013912200927734375, 0.014739990234375, 0.015567779541015625, 0.01639556884765625, 0.017223358154296875, 0.0180511474609375, 0.018878936767578125, 0.01970672607421875, 0.020534515380859375, 0.0213623046875, 0.022190093994140625, 0.02301788330078125, 0.023845672607421875, 0.0246734619140625, 0.025501251220703125, 0.02632904052734375, 0.027156829833984375, 0.027984619140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 7.0, 10.0, 12.0, 19.0, 40.0, 74.0, 126.0, 186.0, 342.0, 714.0, 1391.0, 2883.0, 5942.0, 14363.0, 37843.0, 114276.0, 374506.0, 337126.0, 100985.0, 33775.0, 12970.0, 5565.0, 2643.0, 1287.0, 646.0, 357.0, 190.0, 113.0, 55.0, 37.0, 22.0, 18.0, 9.0, 10.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0056304931640625, -0.00545424222946167, -0.00527799129486084, -0.00510174036026001, -0.00492548942565918, -0.00474923849105835, -0.0045729875564575195, -0.0043967366218566895, -0.004220485687255859, -0.004044234752655029, -0.0038679838180541992, -0.003691732883453369, -0.003515481948852539, -0.003339231014251709, -0.003162980079650879, -0.002986729145050049, -0.0028104782104492188, -0.0026342272758483887, -0.0024579763412475586, -0.0022817254066467285, -0.0021054744720458984, -0.0019292235374450684, -0.0017529726028442383, -0.0015767216682434082, -0.0014004707336425781, -0.001224219799041748, -0.001047968864440918, -0.0008717179298400879, -0.0006954669952392578, -0.0005192160606384277, -0.00034296512603759766, -0.00016671419143676758, 9.5367431640625e-06, 0.00018578767776489258, 0.00036203861236572266, 0.0005382895469665527, 0.0007145404815673828, 0.0008907914161682129, 0.001067042350769043, 0.001243293285369873, 0.0014195442199707031, 0.0015957951545715332, 0.0017720460891723633, 0.0019482970237731934, 0.0021245479583740234, 0.0023007988929748535, 0.0024770498275756836, 0.0026533007621765137, 0.0028295516967773438, 0.003005802631378174, 0.003182053565979004, 0.003358304500579834, 0.003534555435180664, 0.003710806369781494, 0.0038870573043823242, 0.004063308238983154, 0.004239559173583984, 0.0044158101081848145, 0.0045920610427856445, 0.004768311977386475, 0.004944562911987305, 0.005120813846588135, 0.005297064781188965, 0.005473315715789795, 0.005649566650390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 1.0, 8.0, 8.0, 10.0, 16.0, 41.0, 49.0, 58.0, 85.0, 94.0, 110.0, 122.0, 103.0, 70.0, 54.0, 44.0, 46.0, 27.0, 16.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.343292236328125e-05, -7.090624421834946e-05, -6.837956607341766e-05, -6.585288792848587e-05, -6.332620978355408e-05, -6.0799531638622284e-05, -5.827285349369049e-05, -5.57461753487587e-05, -5.3219497203826904e-05, -5.069281905889511e-05, -4.816614091396332e-05, -4.5639462769031525e-05, -4.311278462409973e-05, -4.058610647916794e-05, -3.8059428334236145e-05, -3.553275018930435e-05, -3.300607204437256e-05, -3.0479393899440765e-05, -2.7952715754508972e-05, -2.542603760957718e-05, -2.2899359464645386e-05, -2.0372681319713593e-05, -1.78460031747818e-05, -1.5319325029850006e-05, -1.2792646884918213e-05, -1.026596873998642e-05, -7.739290595054626e-06, -5.212612450122833e-06, -2.68593430519104e-06, -1.5925616025924683e-07, 2.3674219846725464e-06, 4.89410012960434e-06, 7.420778274536133e-06, 9.947456419467926e-06, 1.247413456439972e-05, 1.5000812709331512e-05, 1.7527490854263306e-05, 2.00541689991951e-05, 2.2580847144126892e-05, 2.5107525289058685e-05, 2.763420343399048e-05, 3.0160881578922272e-05, 3.2687559723854065e-05, 3.521423786878586e-05, 3.774091601371765e-05, 4.0267594158649445e-05, 4.279427230358124e-05, 4.532095044851303e-05, 4.7847628593444824e-05, 5.037430673837662e-05, 5.290098488330841e-05, 5.5427663028240204e-05, 5.7954341173172e-05, 6.048101931810379e-05, 6.300769746303558e-05, 6.553437560796738e-05, 6.806105375289917e-05, 7.058773189783096e-05, 7.311441004276276e-05, 7.564108818769455e-05, 7.816776633262634e-05, 8.069444447755814e-05, 8.322112262248993e-05, 8.574780076742172e-05, 8.827447891235352e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 5.0, 6.0, 10.0, 14.0, 21.0, 25.0, 48.0, 76.0, 166.0, 446.0, 1499.0, 7341.0, 66449.0, 772515.0, 181219.0, 15049.0, 2537.0, 630.0, 224.0, 105.0, 46.0, 36.0, 29.0, 10.0, 14.0, 13.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.018369674682617188, -0.017894744873046875, -0.017419815063476562, -0.01694488525390625, -0.016469955444335938, -0.015995025634765625, -0.015520095825195312, -0.015045166015625, -0.014570236206054688, -0.014095306396484375, -0.013620376586914062, -0.01314544677734375, -0.012670516967773438, -0.012195587158203125, -0.011720657348632812, -0.0112457275390625, -0.010770797729492188, -0.010295867919921875, -0.009820938110351562, -0.00934600830078125, -0.008871078491210938, -0.008396148681640625, -0.007921218872070312, -0.0074462890625, -0.0069713592529296875, -0.006496429443359375, -0.0060214996337890625, -0.00554656982421875, -0.0050716400146484375, -0.004596710205078125, -0.0041217803955078125, -0.0036468505859375, -0.0031719207763671875, -0.002696990966796875, -0.0022220611572265625, -0.00174713134765625, -0.0012722015380859375, -0.000797271728515625, -0.0003223419189453125, 0.000152587890625, 0.0006275177001953125, 0.001102447509765625, 0.0015773773193359375, 0.00205230712890625, 0.0025272369384765625, 0.003002166748046875, 0.0034770965576171875, 0.0039520263671875, 0.0044269561767578125, 0.004901885986328125, 0.0053768157958984375, 0.00585174560546875, 0.0063266754150390625, 0.006801605224609375, 0.0072765350341796875, 0.00775146484375, 0.008226394653320312, 0.008701324462890625, 0.009176254272460938, 0.00965118408203125, 0.010126113891601562, 0.010601043701171875, 0.011075973510742188, 0.0115509033203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 2.0, 4.0, 7.0, 13.0, 9.0, 19.0, 14.0, 29.0, 40.0, 63.0, 54.0, 91.0, 114.0, 104.0, 99.0, 73.0, 61.0, 45.0, 49.0, 26.0, 30.0, 13.0, 7.0, 14.0, 7.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007579803466796875, -0.007292807102203369, -0.007005810737609863, -0.006718814373016357, -0.0064318180084228516, -0.006144821643829346, -0.00585782527923584, -0.005570828914642334, -0.005283832550048828, -0.004996836185455322, -0.004709839820861816, -0.0044228434562683105, -0.004135847091674805, -0.003848850727081299, -0.003561854362487793, -0.003274857997894287, -0.0029878616333007812, -0.0027008652687072754, -0.0024138689041137695, -0.0021268725395202637, -0.0018398761749267578, -0.001552879810333252, -0.001265883445739746, -0.0009788870811462402, -0.0006918907165527344, -0.0004048943519592285, -0.00011789798736572266, 0.0001690983772277832, 0.00045609474182128906, 0.0007430911064147949, 0.0010300874710083008, 0.0013170838356018066, 0.0016040802001953125, 0.0018910765647888184, 0.0021780729293823242, 0.00246506929397583, 0.002752065658569336, 0.003039062023162842, 0.0033260583877563477, 0.0036130547523498535, 0.0039000511169433594, 0.004187047481536865, 0.004474043846130371, 0.004761040210723877, 0.005048036575317383, 0.005335032939910889, 0.0056220293045043945, 0.0059090256690979, 0.006196022033691406, 0.006483018398284912, 0.006770014762878418, 0.007057011127471924, 0.00734400749206543, 0.0076310038566589355, 0.007918000221252441, 0.008204996585845947, 0.008491992950439453, 0.008778989315032959, 0.009065985679626465, 0.00935298204421997, 0.009639978408813477, 0.009926974773406982, 0.010213971138000488, 0.010500967502593994, 0.0107879638671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 32.0, 602.0, 358.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17137160897254944, -0.15407779812812805, -0.13678400218486786, -0.11949019879102707, -0.10219639539718628, -0.08490259200334549, -0.0676087886095047, -0.05031498521566391, -0.03302118182182312, -0.01572737842798233, 0.0015664249658584595, 0.01886022835969925, 0.03615403175354004, 0.05344783514738083, 0.07074163854122162, 0.08803544193506241, 0.1053292453289032, 0.12262304872274399, 0.13991685211658478, 0.15721064805984497, 0.17450445890426636, 0.19179826974868774, 0.20909206569194794, 0.22638586163520813, 0.24367967247962952, 0.2609734833240509, 0.2782672643661499, 0.2955610752105713, 0.3128548860549927, 0.33014869689941406, 0.34744250774383545, 0.36473628878593445, 0.3820301294326782, 0.3993239402770996, 0.416617751121521, 0.43391153216362, 0.4512053430080414, 0.46849915385246277, 0.48579293489456177, 0.5030867457389832, 0.5203805565834045, 0.5376743674278259, 0.5549681782722473, 0.5722619891166687, 0.5895557403564453, 0.6068495512008667, 0.6241433620452881, 0.6414371728897095, 0.6587309837341309, 0.6760247945785522, 0.6933186054229736, 0.710612416267395, 0.7279062271118164, 0.745199978351593, 0.7624937891960144, 0.7797876000404358, 0.7970814108848572, 0.8143752217292786, 0.8316690325737, 0.8489628434181213, 0.866256594657898, 0.8835504055023193, 0.9008442163467407, 0.9181380271911621, 0.9354318380355835]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 7.0, 1.0, 11.0, 13.0, 15.0, 16.0, 18.0, 15.0, 21.0, 15.0, 25.0, 28.0, 43.0, 37.0, 44.0, 29.0, 35.0, 40.0, 41.0, 36.0, 38.0, 45.0, 37.0, 32.0, 25.0, 30.0, 22.0, 29.0, 27.0, 33.0, 24.0, 24.0, 23.0, 23.0, 11.0, 16.0, 12.0, 9.0, 5.0, 4.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.06923782825469971, -0.06714363396167755, -0.0650494396686554, -0.06295523792505264, -0.06086104363203049, -0.05876684933900833, -0.05667265132069588, -0.05457845330238342, -0.05248425900936127, -0.05039006471633911, -0.04829586669802666, -0.0462016686797142, -0.04410747438669205, -0.04201328009366989, -0.03991908207535744, -0.03782488405704498, -0.03573068976402283, -0.03363649547100067, -0.03154229745268822, -0.029448101297020912, -0.027353905141353607, -0.025259708985686302, -0.023165512830018997, -0.021071316674351692, -0.018977120518684387, -0.016882924363017082, -0.014788728207349777, -0.012694532051682472, -0.010600335896015167, -0.008506139740347862, -0.006411943584680557, -0.004317747429013252, -0.0022235512733459473, -0.00012935511767864227, 0.0019648410379886627, 0.004059037193655968, 0.006153233349323273, 0.008247429504990578, 0.010341625660657883, 0.012435821816325188, 0.014530017971992493, 0.016624214127659798, 0.018718410283327103, 0.020812606438994408, 0.022906802594661713, 0.025000998750329018, 0.027095194905996323, 0.029189391061663628, 0.03128358721733093, 0.03337778151035309, 0.03547197952866554, 0.037566177546978, 0.03966037184000015, 0.04175456613302231, 0.04384876415133476, 0.04594296216964722, 0.04803715646266937, 0.05013135075569153, 0.05222554877400398, 0.05431974679231644, 0.05641394108533859, 0.05850813537836075, 0.0606023333966732, 0.06269653141498566, 0.06479072570800781]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 16.0, 30.0, 101.0, 573.0, 1992.0, 6032.0, 3841636.0, 338164.0, 4129.0, 957.0, 485.0, 89.0, 36.0, 17.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09118270874023438, -0.08849334716796875, -0.08580398559570312, -0.0831146240234375, -0.08042526245117188, -0.07773590087890625, -0.07504653930664062, -0.072357177734375, -0.06966781616210938, -0.06697845458984375, -0.06428909301757812, -0.0615997314453125, -0.058910369873046875, -0.05622100830078125, -0.053531646728515625, -0.05084228515625, -0.048152923583984375, -0.04546356201171875, -0.042774200439453125, -0.0400848388671875, -0.037395477294921875, -0.03470611572265625, -0.032016754150390625, -0.029327392578125, -0.026638031005859375, -0.02394866943359375, -0.021259307861328125, -0.0185699462890625, -0.015880584716796875, -0.01319122314453125, -0.010501861572265625, -0.0078125, -0.005123138427734375, -0.00243377685546875, 0.000255584716796875, 0.0029449462890625, 0.005634307861328125, 0.00832366943359375, 0.011013031005859375, 0.013702392578125, 0.016391754150390625, 0.01908111572265625, 0.021770477294921875, 0.0244598388671875, 0.027149200439453125, 0.02983856201171875, 0.032527923583984375, 0.03521728515625, 0.037906646728515625, 0.04059600830078125, 0.043285369873046875, 0.0459747314453125, 0.048664093017578125, 0.05135345458984375, 0.054042816162109375, 0.056732177734375, 0.059421539306640625, 0.06211090087890625, 0.06480026245117188, 0.0674896240234375, 0.07017898559570312, 0.07286834716796875, 0.07555770874023438, 0.0782470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 28.0, 107.0, 316.0, 372.0, 139.0, 32.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06591796875, -0.06392812728881836, -0.06193828582763672, -0.05994844436645508, -0.05795860290527344, -0.0559687614440918, -0.053978919982910156, -0.051989078521728516, -0.049999237060546875, -0.048009395599365234, -0.046019554138183594, -0.04402971267700195, -0.04203987121582031, -0.04005002975463867, -0.03806018829345703, -0.03607034683227539, -0.03408050537109375, -0.03209066390991211, -0.03010082244873047, -0.028110980987548828, -0.026121139526367188, -0.024131298065185547, -0.022141456604003906, -0.020151615142822266, -0.018161773681640625, -0.016171932220458984, -0.014182090759277344, -0.012192249298095703, -0.010202407836914062, -0.008212566375732422, -0.006222724914550781, -0.004232883453369141, -0.0022430419921875, -0.0002532005310058594, 0.0017366409301757812, 0.003726482391357422, 0.0057163238525390625, 0.007706165313720703, 0.009696006774902344, 0.011685848236083984, 0.013675689697265625, 0.015665531158447266, 0.017655372619628906, 0.019645214080810547, 0.021635055541992188, 0.023624897003173828, 0.02561473846435547, 0.02760457992553711, 0.02959442138671875, 0.03158426284790039, 0.03357410430908203, 0.03556394577026367, 0.03755378723144531, 0.03954362869262695, 0.041533470153808594, 0.043523311614990234, 0.045513153076171875, 0.047502994537353516, 0.049492835998535156, 0.0514826774597168, 0.05347251892089844, 0.05546236038208008, 0.05745220184326172, 0.05944204330444336, 0.061431884765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 7.0, 8.0, 18.0, 43.0, 67.0, 128.0, 251.0, 610.0, 1496.0, 4288.0, 15905.0, 87024.0, 2808457.0, 1191198.0, 65855.0, 12940.0, 3708.0, 1245.0, 521.0, 234.0, 120.0, 70.0, 31.0, 22.0, 9.0, 4.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01361846923828125, -0.013024449348449707, -0.012430429458618164, -0.011836409568786621, -0.011242389678955078, -0.010648369789123535, -0.010054349899291992, -0.00946033000946045, -0.008866310119628906, -0.008272290229797363, -0.00767827033996582, -0.007084250450134277, -0.006490230560302734, -0.005896210670471191, -0.0053021907806396484, -0.0047081708908081055, -0.0041141510009765625, -0.0035201311111450195, -0.0029261112213134766, -0.0023320913314819336, -0.0017380714416503906, -0.0011440515518188477, -0.0005500316619873047, 4.398822784423828e-05, 0.0006380081176757812, 0.0012320280075073242, 0.0018260478973388672, 0.00242006778717041, 0.003014087677001953, 0.003608107566833496, 0.004202127456665039, 0.004796147346496582, 0.005390167236328125, 0.005984187126159668, 0.006578207015991211, 0.007172226905822754, 0.007766246795654297, 0.00836026668548584, 0.008954286575317383, 0.009548306465148926, 0.010142326354980469, 0.010736346244812012, 0.011330366134643555, 0.011924386024475098, 0.01251840591430664, 0.013112425804138184, 0.013706445693969727, 0.01430046558380127, 0.014894485473632812, 0.015488505363464355, 0.0160825252532959, 0.01667654514312744, 0.017270565032958984, 0.017864584922790527, 0.01845860481262207, 0.019052624702453613, 0.019646644592285156, 0.0202406644821167, 0.020834684371948242, 0.021428704261779785, 0.022022724151611328, 0.02261674404144287, 0.023210763931274414, 0.023804783821105957, 0.0243988037109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 10.0, 10.0, 8.0, 23.0, 32.0, 33.0, 67.0, 78.0, 180.0, 243.0, 605.0, 1290.0, 654.0, 323.0, 146.0, 104.0, 86.0, 42.0, 32.0, 26.0, 18.0, 11.0, 7.0, 10.0, 9.0, 2.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010833740234375, -0.010520100593566895, -0.010206460952758789, -0.009892821311950684, -0.009579181671142578, -0.009265542030334473, -0.008951902389526367, -0.008638262748718262, -0.008324623107910156, -0.00801098346710205, -0.007697343826293945, -0.00738370418548584, -0.007070064544677734, -0.006756424903869629, -0.0064427852630615234, -0.006129145622253418, -0.0058155059814453125, -0.005501866340637207, -0.0051882266998291016, -0.004874587059020996, -0.004560947418212891, -0.004247307777404785, -0.00393366813659668, -0.0036200284957885742, -0.0033063888549804688, -0.0029927492141723633, -0.002679109573364258, -0.0023654699325561523, -0.002051830291748047, -0.0017381906509399414, -0.001424551010131836, -0.0011109113693237305, -0.000797271728515625, -0.00048363208770751953, -0.00016999244689941406, 0.0001436471939086914, 0.0004572868347167969, 0.0007709264755249023, 0.0010845661163330078, 0.0013982057571411133, 0.0017118453979492188, 0.0020254850387573242, 0.0023391246795654297, 0.002652764320373535, 0.0029664039611816406, 0.003280043601989746, 0.0035936832427978516, 0.003907322883605957, 0.0042209625244140625, 0.004534602165222168, 0.0048482418060302734, 0.005161881446838379, 0.005475521087646484, 0.00578916072845459, 0.006102800369262695, 0.006416440010070801, 0.006730079650878906, 0.007043719291687012, 0.007357358932495117, 0.007670998573303223, 0.007984638214111328, 0.008298277854919434, 0.008611917495727539, 0.008925557136535645, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 55.0, 228.0, 388.0, 246.0, 60.0, 12.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15272080898284912, -0.149119570851326, -0.14551831781864166, -0.14191707968711853, -0.1383158266544342, -0.13471458852291107, -0.13111333549022675, -0.1275120973587036, -0.12391085177659988, -0.12030960619449615, -0.11670836061239243, -0.1131071150302887, -0.10950587689876556, -0.10590462386608124, -0.1023033857345581, -0.09870214015245438, -0.09510089457035065, -0.09149964898824692, -0.08789840340614319, -0.08429715782403946, -0.08069591224193573, -0.0770946741104126, -0.07349342852830887, -0.06989218294620514, -0.06629093736410141, -0.06268969178199768, -0.05908844619989395, -0.05548720434308052, -0.05188595876097679, -0.04828471317887306, -0.04468347132205963, -0.0410822257399559, -0.037480972707271576, -0.03387972712516785, -0.030278483405709267, -0.026677239686250687, -0.023075994104146957, -0.019474748522043228, -0.015873504802584648, -0.012272261083126068, -0.008671015501022339, -0.005069770850241184, -0.0014685261994600296, 0.002132718451321125, 0.00573396310210228, 0.009335208684206009, 0.012936452403664589, 0.01653769612312317, 0.020138941705226898, 0.023740187287330627, 0.027341431006789207, 0.030942674726247787, 0.03454392030835152, 0.038145165890455246, 0.04174640774726868, 0.045347653329372406, 0.048948898911476135, 0.052550144493579865, 0.056151390075683594, 0.059752631932497025, 0.06335388123989105, 0.06695511937141418, 0.07055636495351791, 0.07415761053562164, 0.07775885611772537]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 9.0, 8.0, 8.0, 8.0, 13.0, 23.0, 20.0, 26.0, 25.0, 41.0, 30.0, 51.0, 43.0, 38.0, 58.0, 52.0, 54.0, 52.0, 56.0, 50.0, 43.0, 33.0, 54.0, 28.0, 29.0, 32.0, 19.0, 19.0, 16.0, 17.0, 12.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024567008018493652, -0.02381231263279915, -0.023057615384459496, -0.022302918136119843, -0.02154822275042534, -0.020793527364730835, -0.020038830116391182, -0.01928413286805153, -0.018529437482357025, -0.01777474209666252, -0.01702004484832287, -0.016265347599983215, -0.015510652214288712, -0.014755955897271633, -0.014001259580254555, -0.013246563263237476, -0.012491866946220398, -0.01173717062920332, -0.010982474312186241, -0.010227777995169163, -0.009473081678152084, -0.008718385361135006, -0.007963689044117928, -0.007208992727100849, -0.006454296410083771, -0.005699600093066692, -0.004944903776049614, -0.0041902074590325356, -0.003435511142015457, -0.0026808148249983788, -0.0019261185079813004, -0.001171422190964222, -0.00041672587394714355, 0.00033797044306993484, 0.0010926667600870132, 0.0018473630771040916, 0.00260205939412117, 0.0033567557111382484, 0.004111452028155327, 0.004866148345172405, 0.005620844662189484, 0.006375540979206562, 0.0071302372962236404, 0.007884933613240719, 0.008639629930257797, 0.009394326247274876, 0.010149022564291954, 0.010903718881309032, 0.01165841519832611, 0.01241311151534319, 0.013167807832360268, 0.013922504149377346, 0.014677200466394424, 0.015431896783411503, 0.01618659310042858, 0.016941290348768234, 0.017695985734462738, 0.018450681120157242, 0.019205378368496895, 0.019960075616836548, 0.02071477100253105, 0.021469466388225555, 0.02222416363656521, 0.02297886088490486, 0.023733556270599365]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 8.0, 8.0, 8.0, 6.0, 11.0, 16.0, 24.0, 25.0, 40.0, 58.0, 68.0, 86.0, 135.0, 156.0, 249.0, 298.0, 450.0, 630.0, 1156.0, 3176.0, 26228.0, 577403.0, 413694.0, 18644.0, 2746.0, 1057.0, 609.0, 440.0, 286.0, 208.0, 164.0, 123.0, 93.0, 70.0, 58.0, 34.0, 24.0, 22.0, 11.0, 12.0, 2.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.03985595703125, -0.0386815071105957, -0.037507057189941406, -0.03633260726928711, -0.03515815734863281, -0.033983707427978516, -0.03280925750732422, -0.03163480758666992, -0.030460357666015625, -0.029285907745361328, -0.02811145782470703, -0.026937007904052734, -0.025762557983398438, -0.02458810806274414, -0.023413658142089844, -0.022239208221435547, -0.02106475830078125, -0.019890308380126953, -0.018715858459472656, -0.01754140853881836, -0.016366958618164062, -0.015192508697509766, -0.014018058776855469, -0.012843608856201172, -0.011669158935546875, -0.010494709014892578, -0.009320259094238281, -0.008145809173583984, -0.0069713592529296875, -0.005796909332275391, -0.004622459411621094, -0.003448009490966797, -0.0022735595703125, -0.0010991096496582031, 7.534027099609375e-05, 0.0012497901916503906, 0.0024242401123046875, 0.0035986900329589844, 0.004773139953613281, 0.005947589874267578, 0.007122039794921875, 0.008296489715576172, 0.009470939636230469, 0.010645389556884766, 0.011819839477539062, 0.01299428939819336, 0.014168739318847656, 0.015343189239501953, 0.01651763916015625, 0.017692089080810547, 0.018866539001464844, 0.02004098892211914, 0.021215438842773438, 0.022389888763427734, 0.02356433868408203, 0.024738788604736328, 0.025913238525390625, 0.027087688446044922, 0.02826213836669922, 0.029436588287353516, 0.030611038208007812, 0.03178548812866211, 0.032959938049316406, 0.0341343879699707, 0.035308837890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 23.0, 101.0, 315.0, 357.0, 155.0, 39.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.061387062072753906, -0.05941963195800781, -0.05745220184326172, -0.055484771728515625, -0.05351734161376953, -0.05154991149902344, -0.049582481384277344, -0.04761505126953125, -0.045647621154785156, -0.04368019104003906, -0.04171276092529297, -0.039745330810546875, -0.03777790069580078, -0.03581047058105469, -0.033843040466308594, -0.0318756103515625, -0.029908180236816406, -0.027940750122070312, -0.02597332000732422, -0.024005889892578125, -0.02203845977783203, -0.020071029663085938, -0.018103599548339844, -0.01613616943359375, -0.014168739318847656, -0.012201309204101562, -0.010233879089355469, -0.008266448974609375, -0.006299018859863281, -0.0043315887451171875, -0.0023641586303710938, -0.000396728515625, 0.0015707015991210938, 0.0035381317138671875, 0.005505561828613281, 0.007472991943359375, 0.009440422058105469, 0.011407852172851562, 0.013375282287597656, 0.01534271240234375, 0.017310142517089844, 0.019277572631835938, 0.02124500274658203, 0.023212432861328125, 0.02517986297607422, 0.027147293090820312, 0.029114723205566406, 0.0310821533203125, 0.033049583435058594, 0.03501701354980469, 0.03698444366455078, 0.038951873779296875, 0.04091930389404297, 0.04288673400878906, 0.044854164123535156, 0.04682159423828125, 0.048789024353027344, 0.05075645446777344, 0.05272388458251953, 0.054691314697265625, 0.05665874481201172, 0.05862617492675781, 0.060593605041503906, 0.06256103515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 10.0, 4.0, 8.0, 14.0, 13.0, 17.0, 21.0, 20.0, 30.0, 39.0, 42.0, 50.0, 48.0, 46.0, 58.0, 56.0, 86.0, 126.0, 238.0, 550.0, 2030.0, 14236.0, 212018.0, 727932.0, 81483.0, 6836.0, 1231.0, 419.0, 193.0, 112.0, 93.0, 76.0, 81.0, 48.0, 53.0, 31.0, 27.0, 21.0, 27.0, 25.0, 18.0, 14.0, 19.0, 8.0, 10.0, 7.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0], "bins": [-0.033111572265625, -0.03214716911315918, -0.03118276596069336, -0.03021836280822754, -0.02925395965576172, -0.0282895565032959, -0.027325153350830078, -0.026360750198364258, -0.025396347045898438, -0.024431943893432617, -0.023467540740966797, -0.022503137588500977, -0.021538734436035156, -0.020574331283569336, -0.019609928131103516, -0.018645524978637695, -0.017681121826171875, -0.016716718673706055, -0.015752315521240234, -0.014787912368774414, -0.013823509216308594, -0.012859106063842773, -0.011894702911376953, -0.010930299758911133, -0.009965896606445312, -0.009001493453979492, -0.008037090301513672, -0.0070726871490478516, -0.006108283996582031, -0.005143880844116211, -0.004179477691650391, -0.0032150745391845703, -0.00225067138671875, -0.0012862682342529297, -0.0003218650817871094, 0.0006425380706787109, 0.0016069412231445312, 0.0025713443756103516, 0.003535747528076172, 0.004500150680541992, 0.0054645538330078125, 0.006428956985473633, 0.007393360137939453, 0.008357763290405273, 0.009322166442871094, 0.010286569595336914, 0.011250972747802734, 0.012215375900268555, 0.013179779052734375, 0.014144182205200195, 0.015108585357666016, 0.016072988510131836, 0.017037391662597656, 0.018001794815063477, 0.018966197967529297, 0.019930601119995117, 0.020895004272460938, 0.021859407424926758, 0.022823810577392578, 0.0237882137298584, 0.02475261688232422, 0.02571702003479004, 0.02668142318725586, 0.02764582633972168, 0.0286102294921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 11.0, 5.0, 13.0, 13.0, 9.0, 17.0, 15.0, 23.0, 33.0, 27.0, 34.0, 28.0, 30.0, 36.0, 33.0, 39.0, 48.0, 49.0, 49.0, 51.0, 42.0, 38.0, 29.0, 41.0, 30.0, 27.0, 26.0, 20.0, 30.0, 23.0, 25.0, 19.0, 16.0, 14.0, 13.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.02099609375, -0.020303726196289062, -0.019611358642578125, -0.018918991088867188, -0.01822662353515625, -0.017534255981445312, -0.016841888427734375, -0.016149520874023438, -0.0154571533203125, -0.014764785766601562, -0.014072418212890625, -0.013380050659179688, -0.01268768310546875, -0.011995315551757812, -0.011302947998046875, -0.010610580444335938, -0.009918212890625, -0.009225845336914062, -0.008533477783203125, -0.007841110229492188, -0.00714874267578125, -0.0064563751220703125, -0.005764007568359375, -0.0050716400146484375, -0.0043792724609375, -0.0036869049072265625, -0.002994537353515625, -0.0023021697998046875, -0.00160980224609375, -0.0009174346923828125, -0.000225067138671875, 0.0004673004150390625, 0.00115966796875, 0.0018520355224609375, 0.002544403076171875, 0.0032367706298828125, 0.00392913818359375, 0.0046215057373046875, 0.005313873291015625, 0.0060062408447265625, 0.0066986083984375, 0.0073909759521484375, 0.008083343505859375, 0.008775711059570312, 0.00946807861328125, 0.010160446166992188, 0.010852813720703125, 0.011545181274414062, 0.012237548828125, 0.012929916381835938, 0.013622283935546875, 0.014314651489257812, 0.01500701904296875, 0.015699386596679688, 0.016391754150390625, 0.017084121704101562, 0.0177764892578125, 0.018468856811523438, 0.019161224365234375, 0.019853591918945312, 0.02054595947265625, 0.021238327026367188, 0.021930694580078125, 0.022623062133789062, 0.0233154296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 9.0, 6.0, 24.0, 16.0, 38.0, 55.0, 96.0, 183.0, 318.0, 579.0, 1170.0, 2313.0, 4770.0, 10507.0, 26056.0, 77673.0, 308392.0, 439274.0, 115864.0, 35498.0, 13885.0, 5883.0, 2904.0, 1418.0, 714.0, 414.0, 206.0, 117.0, 70.0, 41.0, 15.0, 16.0, 13.0, 5.0, 5.0, 9.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005504608154296875, -0.005333423614501953, -0.005162239074707031, -0.004991054534912109, -0.0048198699951171875, -0.004648685455322266, -0.004477500915527344, -0.004306316375732422, -0.0041351318359375, -0.003963947296142578, -0.0037927627563476562, -0.0036215782165527344, -0.0034503936767578125, -0.0032792091369628906, -0.0031080245971679688, -0.002936840057373047, -0.002765655517578125, -0.002594470977783203, -0.0024232864379882812, -0.0022521018981933594, -0.0020809173583984375, -0.0019097328186035156, -0.0017385482788085938, -0.0015673637390136719, -0.00139617919921875, -0.0012249946594238281, -0.0010538101196289062, -0.0008826255798339844, -0.0007114410400390625, -0.0005402565002441406, -0.00036907196044921875, -0.00019788742065429688, -2.6702880859375e-05, 0.00014448165893554688, 0.00031566619873046875, 0.0004868507385253906, 0.0006580352783203125, 0.0008292198181152344, 0.0010004043579101562, 0.0011715888977050781, 0.0013427734375, 0.0015139579772949219, 0.0016851425170898438, 0.0018563270568847656, 0.0020275115966796875, 0.0021986961364746094, 0.0023698806762695312, 0.002541065216064453, 0.002712249755859375, 0.002883434295654297, 0.0030546188354492188, 0.0032258033752441406, 0.0033969879150390625, 0.0035681724548339844, 0.0037393569946289062, 0.003910541534423828, 0.00408172607421875, 0.004252910614013672, 0.004424095153808594, 0.004595279693603516, 0.0047664642333984375, 0.004937648773193359, 0.005108833312988281, 0.005280017852783203, 0.005451202392578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 2.0, 10.0, 20.0, 11.0, 14.0, 25.0, 36.0, 45.0, 49.0, 65.0, 98.0, 112.0, 89.0, 82.0, 80.0, 58.0, 52.0, 26.0, 21.0, 24.0, 16.0, 9.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.316205978393555e-05, -9.043142199516296e-05, -8.770078420639038e-05, -8.49701464176178e-05, -8.223950862884521e-05, -7.950887084007263e-05, -7.677823305130005e-05, -7.404759526252747e-05, -7.131695747375488e-05, -6.85863196849823e-05, -6.585568189620972e-05, -6.312504410743713e-05, -6.039440631866455e-05, -5.766376852989197e-05, -5.4933130741119385e-05, -5.22024929523468e-05, -4.947185516357422e-05, -4.6741217374801636e-05, -4.401057958602905e-05, -4.127994179725647e-05, -3.854930400848389e-05, -3.5818666219711304e-05, -3.308802843093872e-05, -3.0357390642166138e-05, -2.7626752853393555e-05, -2.489611506462097e-05, -2.216547727584839e-05, -1.9434839487075806e-05, -1.6704201698303223e-05, -1.397356390953064e-05, -1.1242926120758057e-05, -8.512288331985474e-06, -5.781650543212891e-06, -3.0510127544403076e-06, -3.203749656677246e-07, 2.4102628231048584e-06, 5.140900611877441e-06, 7.871538400650024e-06, 1.0602176189422607e-05, 1.333281397819519e-05, 1.6063451766967773e-05, 1.8794089555740356e-05, 2.152472734451294e-05, 2.4255365133285522e-05, 2.6986002922058105e-05, 2.971664071083069e-05, 3.244727849960327e-05, 3.5177916288375854e-05, 3.790855407714844e-05, 4.063919186592102e-05, 4.3369829654693604e-05, 4.6100467443466187e-05, 4.883110523223877e-05, 5.156174302101135e-05, 5.4292380809783936e-05, 5.702301859855652e-05, 5.97536563873291e-05, 6.248429417610168e-05, 6.521493196487427e-05, 6.794556975364685e-05, 7.067620754241943e-05, 7.340684533119202e-05, 7.61374831199646e-05, 7.886812090873718e-05, 8.159875869750977e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 17.0, 28.0, 37.0, 48.0, 92.0, 180.0, 468.0, 1642.0, 10020.0, 124412.0, 837070.0, 66027.0, 6511.0, 1179.0, 365.0, 181.0, 94.0, 60.0, 40.0, 14.0, 21.0, 7.0, 11.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01219940185546875, -0.011677861213684082, -0.011156320571899414, -0.010634779930114746, -0.010113239288330078, -0.00959169864654541, -0.009070158004760742, -0.008548617362976074, -0.008027076721191406, -0.007505536079406738, -0.00698399543762207, -0.006462454795837402, -0.005940914154052734, -0.005419373512268066, -0.0048978328704833984, -0.0043762922286987305, -0.0038547515869140625, -0.0033332109451293945, -0.0028116703033447266, -0.0022901296615600586, -0.0017685890197753906, -0.0012470483779907227, -0.0007255077362060547, -0.00020396709442138672, 0.00031757354736328125, 0.0008391141891479492, 0.0013606548309326172, 0.0018821954727172852, 0.002403736114501953, 0.002925276756286621, 0.003446817398071289, 0.003968358039855957, 0.004489898681640625, 0.005011439323425293, 0.005532979965209961, 0.006054520606994629, 0.006576061248779297, 0.007097601890563965, 0.007619142532348633, 0.0081406831741333, 0.008662223815917969, 0.009183764457702637, 0.009705305099487305, 0.010226845741271973, 0.01074838638305664, 0.011269927024841309, 0.011791467666625977, 0.012313008308410645, 0.012834548950195312, 0.01335608959197998, 0.013877630233764648, 0.014399170875549316, 0.014920711517333984, 0.015442252159118652, 0.01596379280090332, 0.01648533344268799, 0.017006874084472656, 0.017528414726257324, 0.018049955368041992, 0.01857149600982666, 0.019093036651611328, 0.019614577293395996, 0.020136117935180664, 0.020657658576965332, 0.02117919921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 7.0, 15.0, 24.0, 37.0, 41.0, 81.0, 127.0, 148.0, 145.0, 119.0, 86.0, 59.0, 35.0, 10.0, 10.0, 10.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.01494908332824707, -0.01462411880493164, -0.014299154281616211, -0.013974189758300781, -0.013649225234985352, -0.013324260711669922, -0.012999296188354492, -0.012674331665039062, -0.012349367141723633, -0.012024402618408203, -0.011699438095092773, -0.011374473571777344, -0.011049509048461914, -0.010724544525146484, -0.010399580001831055, -0.010074615478515625, -0.009749650955200195, -0.009424686431884766, -0.009099721908569336, -0.008774757385253906, -0.008449792861938477, -0.008124828338623047, -0.007799863815307617, -0.0074748992919921875, -0.007149934768676758, -0.006824970245361328, -0.0065000057220458984, -0.006175041198730469, -0.005850076675415039, -0.005525112152099609, -0.00520014762878418, -0.00487518310546875, -0.00455021858215332, -0.004225254058837891, -0.003900289535522461, -0.0035753250122070312, -0.0032503604888916016, -0.002925395965576172, -0.002600431442260742, -0.0022754669189453125, -0.0019505023956298828, -0.0016255378723144531, -0.0013005733489990234, -0.0009756088256835938, -0.0006506443023681641, -0.0003256797790527344, -7.152557373046875e-07, 0.000324249267578125, 0.0006492137908935547, 0.0009741783142089844, 0.001299142837524414, 0.0016241073608398438, 0.0019490718841552734, 0.002274036407470703, 0.002599000930786133, 0.0029239654541015625, 0.003248929977416992, 0.003573894500732422, 0.0038988590240478516, 0.004223823547363281, 0.004548788070678711, 0.004873752593994141, 0.00519871711730957, 0.005523681640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 55.0, 874.0, 78.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18397590517997742, -0.16228285431861877, -0.14058981835842133, -0.11889676749706268, -0.09720372408628464, -0.07551068067550659, -0.05381762981414795, -0.0321245938539505, -0.010431542992591858, 0.011261502280831337, 0.03295454755425453, 0.054647594690322876, 0.07634063810110092, 0.09803368151187897, 0.11972673237323761, 0.14141976833343506, 0.1631128191947937, 0.18480587005615234, 0.2064989060163498, 0.22819195687770844, 0.24988499283790588, 0.2715780436992645, 0.29327109456062317, 0.3149641156196594, 0.33665716648101807, 0.3583502173423767, 0.38004326820373535, 0.401736319065094, 0.42342934012413025, 0.4451223909854889, 0.46681544184684753, 0.4885084629058838, 0.5102015137672424, 0.5318945646286011, 0.5535876154899597, 0.5752806663513184, 0.596973717212677, 0.6186667680740356, 0.6403597593307495, 0.6620528101921082, 0.6837458610534668, 0.7054389119148254, 0.7271319627761841, 0.7488250136375427, 0.7705180644989014, 0.7922110557556152, 0.8139041662216187, 0.8355971574783325, 0.8572902679443359, 0.8789833188056946, 0.9006763696670532, 0.9223694205284119, 0.9440624713897705, 0.9657554626464844, 0.9874485731124878, 1.0091415643692017, 1.0308345556259155, 1.0525275468826294, 1.0742206573486328, 1.0959136486053467, 1.11760675907135, 1.139299750328064, 1.1609928607940674, 1.1826858520507812, 1.2043789625167847]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 5.0, 5.0, 6.0, 12.0, 18.0, 16.0, 9.0, 20.0, 20.0, 22.0, 24.0, 28.0, 40.0, 37.0, 31.0, 36.0, 40.0, 49.0, 37.0, 33.0, 47.0, 35.0, 38.0, 45.0, 43.0, 41.0, 25.0, 25.0, 35.0, 25.0, 18.0, 18.0, 14.0, 13.0, 12.0, 12.0, 4.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07189327478408813, -0.06971617043018341, -0.06753907352685928, -0.06536196917295456, -0.06318487226963043, -0.06100776791572571, -0.058830663561820984, -0.05665356293320656, -0.05447646230459213, -0.05229936167597771, -0.05012226104736328, -0.04794515669345856, -0.04576805606484413, -0.043590955436229706, -0.04141385108232498, -0.039236750453710556, -0.03705964982509613, -0.034882549196481705, -0.03270544856786728, -0.030528344213962555, -0.02835124358534813, -0.026174142956733704, -0.02399704046547413, -0.021819937974214554, -0.019642837345600128, -0.017465736716985703, -0.015288634225726128, -0.013111532665789127, -0.010934431105852127, -0.008757329545915127, -0.0065802279859781265, -0.004403126426041126, -0.002226024866104126, -4.89233061671257e-05, 0.0021281782537698746, 0.004305279813706875, 0.006482381373643875, 0.008659482933580875, 0.010836584493517876, 0.013013686053454876, 0.015190787613391876, 0.017367888242006302, 0.019544990733265877, 0.02172209322452545, 0.023899193853139877, 0.026076294481754303, 0.028253396973013878, 0.030430499464273453, 0.03260760009288788, 0.034784700721502304, 0.03696180135011673, 0.039138905704021454, 0.04131600633263588, 0.043493106961250305, 0.04567021131515503, 0.047847311943769455, 0.05002441257238388, 0.052201513200998306, 0.05437861382961273, 0.056555718183517456, 0.05873281881213188, 0.06090991944074631, 0.06308702379465103, 0.06526412069797516, 0.06744122505187988]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 5.0, 19.0, 44.0, 137.0, 386.0, 987.0, 1618.0, 3577.0, 42712.0, 4114485.0, 25250.0, 2892.0, 1162.0, 445.0, 248.0, 174.0, 65.0, 25.0, 18.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050537109375, -0.048760414123535156, -0.04698371887207031, -0.04520702362060547, -0.043430328369140625, -0.04165363311767578, -0.03987693786621094, -0.038100242614746094, -0.03632354736328125, -0.034546852111816406, -0.03277015686035156, -0.03099346160888672, -0.029216766357421875, -0.02744007110595703, -0.025663375854492188, -0.023886680603027344, -0.0221099853515625, -0.020333290100097656, -0.018556594848632812, -0.01677989959716797, -0.015003204345703125, -0.013226509094238281, -0.011449813842773438, -0.009673118591308594, -0.00789642333984375, -0.006119728088378906, -0.0043430328369140625, -0.0025663375854492188, -0.000789642333984375, 0.0009870529174804688, 0.0027637481689453125, 0.004540443420410156, 0.006317138671875, 0.008093833923339844, 0.009870529174804688, 0.011647224426269531, 0.013423919677734375, 0.015200614929199219, 0.016977310180664062, 0.018754005432128906, 0.02053070068359375, 0.022307395935058594, 0.024084091186523438, 0.02586078643798828, 0.027637481689453125, 0.02941417694091797, 0.031190872192382812, 0.032967567443847656, 0.0347442626953125, 0.036520957946777344, 0.03829765319824219, 0.04007434844970703, 0.041851043701171875, 0.04362773895263672, 0.04540443420410156, 0.047181129455566406, 0.04895782470703125, 0.050734519958496094, 0.05251121520996094, 0.05428791046142578, 0.056064605712890625, 0.05784130096435547, 0.05961799621582031, 0.061394691467285156, 0.06317138671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 25.0, 144.0, 376.0, 324.0, 109.0, 18.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06842041015625, -0.06634235382080078, -0.06426429748535156, -0.062186241149902344, -0.060108184814453125, -0.058030128479003906, -0.05595207214355469, -0.05387401580810547, -0.05179595947265625, -0.04971790313720703, -0.04763984680175781, -0.045561790466308594, -0.043483734130859375, -0.041405677795410156, -0.03932762145996094, -0.03724956512451172, -0.0351715087890625, -0.03309345245361328, -0.031015396118164062, -0.028937339782714844, -0.026859283447265625, -0.024781227111816406, -0.022703170776367188, -0.02062511444091797, -0.01854705810546875, -0.01646900177001953, -0.014390945434570312, -0.012312889099121094, -0.010234832763671875, -0.008156776428222656, -0.0060787200927734375, -0.004000663757324219, -0.001922607421875, 0.00015544891357421875, 0.0022335052490234375, 0.004311561584472656, 0.006389617919921875, 0.008467674255371094, 0.010545730590820312, 0.012623786926269531, 0.01470184326171875, 0.01677989959716797, 0.018857955932617188, 0.020936012268066406, 0.023014068603515625, 0.025092124938964844, 0.027170181274414062, 0.02924823760986328, 0.0313262939453125, 0.03340435028076172, 0.03548240661621094, 0.037560462951660156, 0.039638519287109375, 0.041716575622558594, 0.04379463195800781, 0.04587268829345703, 0.04795074462890625, 0.05002880096435547, 0.05210685729980469, 0.054184913635253906, 0.056262969970703125, 0.058341026306152344, 0.06041908264160156, 0.06249713897705078, 0.0645751953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 51.0, 101.0, 228.0, 1229.0, 11013.0, 841698.0, 3321404.0, 16425.0, 1638.0, 344.0, 98.0, 26.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.033504486083984375, -0.03221893310546875, -0.030933380126953125, -0.0296478271484375, -0.028362274169921875, -0.02707672119140625, -0.025791168212890625, -0.024505615234375, -0.023220062255859375, -0.02193450927734375, -0.020648956298828125, -0.0193634033203125, -0.018077850341796875, -0.01679229736328125, -0.015506744384765625, -0.01422119140625, -0.012935638427734375, -0.01165008544921875, -0.010364532470703125, -0.0090789794921875, -0.007793426513671875, -0.00650787353515625, -0.005222320556640625, -0.003936767578125, -0.002651214599609375, -0.00136566162109375, -8.0108642578125e-05, 0.0012054443359375, 0.002490997314453125, 0.00377655029296875, 0.005062103271484375, 0.00634765625, 0.007633209228515625, 0.00891876220703125, 0.010204315185546875, 0.0114898681640625, 0.012775421142578125, 0.01406097412109375, 0.015346527099609375, 0.016632080078125, 0.017917633056640625, 0.01920318603515625, 0.020488739013671875, 0.0217742919921875, 0.023059844970703125, 0.02434539794921875, 0.025630950927734375, 0.02691650390625, 0.028202056884765625, 0.02948760986328125, 0.030773162841796875, 0.0320587158203125, 0.033344268798828125, 0.03462982177734375, 0.035915374755859375, 0.037200927734375, 0.038486480712890625, 0.03977203369140625, 0.041057586669921875, 0.0423431396484375, 0.043628692626953125, 0.04491424560546875, 0.046199798583984375, 0.0474853515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 14.0, 30.0, 32.0, 128.0, 248.0, 1018.0, 1837.0, 442.0, 136.0, 73.0, 42.0, 19.0, 19.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020355224609375, -0.019821882247924805, -0.01928853988647461, -0.018755197525024414, -0.01822185516357422, -0.017688512802124023, -0.017155170440673828, -0.016621828079223633, -0.016088485717773438, -0.015555143356323242, -0.015021800994873047, -0.014488458633422852, -0.013955116271972656, -0.013421773910522461, -0.012888431549072266, -0.01235508918762207, -0.011821746826171875, -0.01128840446472168, -0.010755062103271484, -0.010221719741821289, -0.009688377380371094, -0.009155035018920898, -0.008621692657470703, -0.008088350296020508, -0.0075550079345703125, -0.007021665573120117, -0.006488323211669922, -0.0059549808502197266, -0.005421638488769531, -0.004888296127319336, -0.004354953765869141, -0.0038216114044189453, -0.00328826904296875, -0.0027549266815185547, -0.0022215843200683594, -0.001688241958618164, -0.0011548995971679688, -0.0006215572357177734, -8.821487426757812e-05, 0.0004451274871826172, 0.0009784698486328125, 0.0015118122100830078, 0.002045154571533203, 0.0025784969329833984, 0.0031118392944335938, 0.003645181655883789, 0.004178524017333984, 0.00471186637878418, 0.005245208740234375, 0.00577855110168457, 0.006311893463134766, 0.006845235824584961, 0.007378578186035156, 0.007911920547485352, 0.008445262908935547, 0.008978605270385742, 0.009511947631835938, 0.010045289993286133, 0.010578632354736328, 0.011111974716186523, 0.011645317077636719, 0.012178659439086914, 0.01271200180053711, 0.013245344161987305, 0.0137786865234375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 41.0, 215.0, 430.0, 237.0, 55.0, 19.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.2023770958185196, -0.1987934410572052, -0.19520977139472961, -0.19162611663341522, -0.18804244697093964, -0.18445879220962524, -0.18087512254714966, -0.17729146778583527, -0.17370781302452087, -0.17012415826320648, -0.1665404886007309, -0.1629568338394165, -0.15937316417694092, -0.15578950941562653, -0.15220585465431213, -0.14862218499183655, -0.14503851532936096, -0.14145486056804657, -0.13787119090557098, -0.1342875361442566, -0.130703866481781, -0.1271202117204666, -0.12353654950857162, -0.11995288729667664, -0.11636923253536224, -0.11278557032346725, -0.10920190811157227, -0.10561825335025787, -0.10203459113836288, -0.0984509289264679, -0.0948672667145729, -0.09128360450267792, -0.08769994229078293, -0.08411628007888794, -0.08053261786699295, -0.07694895565509796, -0.07336530089378357, -0.06978163868188858, -0.06619797646999359, -0.0626143142580986, -0.05903065204620361, -0.055446989834308624, -0.051863331347703934, -0.048279669135808945, -0.044696006923913956, -0.041112348437309265, -0.037528686225414276, -0.03394502401351929, -0.030361365526914597, -0.026777705177664757, -0.023194042965769768, -0.019610382616519928, -0.01602672040462494, -0.0124430600553751, -0.00885939970612526, -0.00527573749423027, -0.0016920771449804306, 0.0018915839027613401, 0.005475244950503111, 0.009058905765414238, 0.012642567045986652, 0.016226228326559067, 0.019809888675808907, 0.023393550887703896, 0.026977211236953735]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 30.0, 23.0, 27.0, 34.0, 46.0, 47.0, 70.0, 54.0, 71.0, 61.0, 55.0, 58.0, 57.0, 60.0, 57.0, 39.0, 45.0, 36.0, 27.0, 21.0, 23.0, 9.0, 9.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027879655361175537, -0.026923367753624916, -0.025967080146074295, -0.025010792538523674, -0.024054504930973053, -0.023098217323422432, -0.02214192971587181, -0.02118564210832119, -0.02022935450077057, -0.019273066893219948, -0.018316779285669327, -0.017360491678118706, -0.016404204070568085, -0.015447916463017464, -0.014491628855466843, -0.013535341247916222, -0.0125790536403656, -0.01162276603281498, -0.010666478425264359, -0.009710190817713737, -0.008753903210163116, -0.007797615602612495, -0.006841327995061874, -0.005885040387511253, -0.004928752779960632, -0.003972465172410011, -0.0030161775648593903, -0.0020598899573087692, -0.0011036023497581482, -0.00014731474220752716, 0.0008089728653430939, 0.001765260472893715, 0.002721548080444336, 0.003677835687994957, 0.004634123295545578, 0.005590410903096199, 0.00654669851064682, 0.007502986118197441, 0.008459273725748062, 0.009415561333298683, 0.010371848940849304, 0.011328136548399925, 0.012284424155950546, 0.013240711763501167, 0.014196999371051788, 0.01515328697860241, 0.01610957458615303, 0.01706586219370365, 0.018022149801254272, 0.018978437408804893, 0.019934725016355515, 0.020891012623906136, 0.021847300231456757, 0.022803587839007378, 0.023759875446558, 0.02471616305410862, 0.02567245066165924, 0.026628738269209862, 0.027585025876760483, 0.028541313484311104, 0.029497601091861725, 0.030453888699412346, 0.03141017630696297, 0.03236646205186844, 0.03332275152206421]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 13.0, 9.0, 16.0, 22.0, 41.0, 37.0, 48.0, 66.0, 92.0, 128.0, 171.0, 198.0, 286.0, 370.0, 592.0, 1075.0, 2677.0, 14169.0, 249612.0, 729522.0, 40471.0, 4963.0, 1469.0, 724.0, 444.0, 325.0, 247.0, 187.0, 138.0, 103.0, 78.0, 71.0, 48.0, 28.0, 21.0, 25.0, 17.0, 7.0, 11.0, 5.0, 6.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0379638671875, -0.03682088851928711, -0.03567790985107422, -0.03453493118286133, -0.03339195251464844, -0.03224897384643555, -0.031105995178222656, -0.029963016510009766, -0.028820037841796875, -0.027677059173583984, -0.026534080505371094, -0.025391101837158203, -0.024248123168945312, -0.023105144500732422, -0.02196216583251953, -0.02081918716430664, -0.01967620849609375, -0.01853322982788086, -0.01739025115966797, -0.016247272491455078, -0.015104293823242188, -0.013961315155029297, -0.012818336486816406, -0.011675357818603516, -0.010532379150390625, -0.009389400482177734, -0.008246421813964844, -0.007103443145751953, -0.0059604644775390625, -0.004817485809326172, -0.0036745071411132812, -0.0025315284729003906, -0.0013885498046875, -0.0002455711364746094, 0.0008974075317382812, 0.002040386199951172, 0.0031833648681640625, 0.004326343536376953, 0.005469322204589844, 0.006612300872802734, 0.007755279541015625, 0.008898258209228516, 0.010041236877441406, 0.011184215545654297, 0.012327194213867188, 0.013470172882080078, 0.014613151550292969, 0.01575613021850586, 0.01689910888671875, 0.01804208755493164, 0.01918506622314453, 0.020328044891357422, 0.021471023559570312, 0.022614002227783203, 0.023756980895996094, 0.024899959564208984, 0.026042938232421875, 0.027185916900634766, 0.028328895568847656, 0.029471874237060547, 0.030614852905273438, 0.03175783157348633, 0.03290081024169922, 0.03404378890991211, 0.035186767578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 24.0, 122.0, 338.0, 337.0, 147.0, 24.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.06380701065063477, -0.06181812286376953, -0.0598292350769043, -0.05784034729003906, -0.05585145950317383, -0.053862571716308594, -0.05187368392944336, -0.049884796142578125, -0.04789590835571289, -0.045907020568847656, -0.04391813278198242, -0.04192924499511719, -0.03994035720825195, -0.03795146942138672, -0.035962581634521484, -0.03397369384765625, -0.031984806060791016, -0.02999591827392578, -0.028007030487060547, -0.026018142700195312, -0.024029254913330078, -0.022040367126464844, -0.02005147933959961, -0.018062591552734375, -0.01607370376586914, -0.014084815979003906, -0.012095928192138672, -0.010107040405273438, -0.008118152618408203, -0.006129264831542969, -0.004140377044677734, -0.0021514892578125, -0.00016260147094726562, 0.0018262863159179688, 0.003815174102783203, 0.0058040618896484375, 0.007792949676513672, 0.009781837463378906, 0.01177072525024414, 0.013759613037109375, 0.01574850082397461, 0.017737388610839844, 0.019726276397705078, 0.021715164184570312, 0.023704051971435547, 0.02569293975830078, 0.027681827545166016, 0.02967071533203125, 0.031659603118896484, 0.03364849090576172, 0.03563737869262695, 0.03762626647949219, 0.03961515426635742, 0.041604042053222656, 0.04359292984008789, 0.045581817626953125, 0.04757070541381836, 0.049559593200683594, 0.05154848098754883, 0.05353736877441406, 0.0555262565612793, 0.05751514434814453, 0.059504032135009766, 0.061492919921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 10.0, 18.0, 18.0, 17.0, 39.0, 30.0, 52.0, 47.0, 83.0, 74.0, 113.0, 153.0, 297.0, 946.0, 4453.0, 50037.0, 730873.0, 245288.0, 12848.0, 1903.0, 510.0, 200.0, 133.0, 80.0, 52.0, 61.0, 48.0, 46.0, 26.0, 26.0, 14.0, 14.0, 13.0, 7.0, 5.0, 7.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028289794921875, -0.02727031707763672, -0.026250839233398438, -0.025231361389160156, -0.024211883544921875, -0.023192405700683594, -0.022172927856445312, -0.02115345001220703, -0.02013397216796875, -0.01911449432373047, -0.018095016479492188, -0.017075538635253906, -0.016056060791015625, -0.015036582946777344, -0.014017105102539062, -0.012997627258300781, -0.0119781494140625, -0.010958671569824219, -0.009939193725585938, -0.008919715881347656, -0.007900238037109375, -0.006880760192871094, -0.0058612823486328125, -0.004841804504394531, -0.00382232666015625, -0.0028028488159179688, -0.0017833709716796875, -0.0007638931274414062, 0.000255584716796875, 0.0012750625610351562, 0.0022945404052734375, 0.0033140182495117188, 0.00433349609375, 0.005352973937988281, 0.0063724517822265625, 0.007391929626464844, 0.008411407470703125, 0.009430885314941406, 0.010450363159179688, 0.011469841003417969, 0.01248931884765625, 0.013508796691894531, 0.014528274536132812, 0.015547752380371094, 0.016567230224609375, 0.017586708068847656, 0.018606185913085938, 0.01962566375732422, 0.0206451416015625, 0.02166461944580078, 0.022684097290039062, 0.023703575134277344, 0.024723052978515625, 0.025742530822753906, 0.026762008666992188, 0.02778148651123047, 0.02880096435546875, 0.02982044219970703, 0.030839920043945312, 0.031859397888183594, 0.032878875732421875, 0.033898353576660156, 0.03491783142089844, 0.03593730926513672, 0.036956787109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 9.0, 16.0, 21.0, 23.0, 31.0, 27.0, 40.0, 41.0, 44.0, 49.0, 49.0, 58.0, 64.0, 62.0, 62.0, 64.0, 43.0, 47.0, 39.0, 42.0, 27.0, 32.0, 28.0, 18.0, 16.0, 10.0, 6.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032623291015625, -0.031708478927612305, -0.03079366683959961, -0.029878854751586914, -0.02896404266357422, -0.028049230575561523, -0.027134418487548828, -0.026219606399536133, -0.025304794311523438, -0.024389982223510742, -0.023475170135498047, -0.02256035804748535, -0.021645545959472656, -0.02073073387145996, -0.019815921783447266, -0.01890110969543457, -0.017986297607421875, -0.01707148551940918, -0.016156673431396484, -0.015241861343383789, -0.014327049255371094, -0.013412237167358398, -0.012497425079345703, -0.011582612991333008, -0.010667800903320312, -0.009752988815307617, -0.008838176727294922, -0.007923364639282227, -0.007008552551269531, -0.006093740463256836, -0.005178928375244141, -0.004264116287231445, -0.00334930419921875, -0.0024344921112060547, -0.0015196800231933594, -0.0006048679351806641, 0.00030994415283203125, 0.0012247562408447266, 0.002139568328857422, 0.003054380416870117, 0.0039691925048828125, 0.004884004592895508, 0.005798816680908203, 0.0067136287689208984, 0.007628440856933594, 0.008543252944946289, 0.009458065032958984, 0.01037287712097168, 0.011287689208984375, 0.01220250129699707, 0.013117313385009766, 0.014032125473022461, 0.014946937561035156, 0.01586174964904785, 0.016776561737060547, 0.017691373825073242, 0.018606185913085938, 0.019520998001098633, 0.020435810089111328, 0.021350622177124023, 0.02226543426513672, 0.023180246353149414, 0.02409505844116211, 0.025009870529174805, 0.0259246826171875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 11.0, 3.0, 16.0, 13.0, 22.0, 38.0, 34.0, 54.0, 106.0, 133.0, 254.0, 377.0, 601.0, 1062.0, 1938.0, 3616.0, 7282.0, 16373.0, 44282.0, 173629.0, 535097.0, 184770.0, 45772.0, 17014.0, 7466.0, 3754.0, 1990.0, 1114.0, 654.0, 383.0, 234.0, 134.0, 112.0, 78.0, 48.0, 28.0, 10.0, 11.0, 10.0, 8.0, 11.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00585174560546875, -0.005659997463226318, -0.005468249320983887, -0.005276501178741455, -0.0050847530364990234, -0.004893004894256592, -0.00470125675201416, -0.0045095086097717285, -0.004317760467529297, -0.004126012325286865, -0.003934264183044434, -0.003742516040802002, -0.0035507678985595703, -0.0033590197563171387, -0.003167271614074707, -0.0029755234718322754, -0.0027837753295898438, -0.002592027187347412, -0.0024002790451049805, -0.002208530902862549, -0.002016782760620117, -0.0018250346183776855, -0.001633286476135254, -0.0014415383338928223, -0.0012497901916503906, -0.001058042049407959, -0.0008662939071655273, -0.0006745457649230957, -0.00048279762268066406, -0.0002910494804382324, -9.930133819580078e-05, 9.244680404663086e-05, 0.0002841949462890625, 0.00047594308853149414, 0.0006676912307739258, 0.0008594393730163574, 0.001051187515258789, 0.0012429356575012207, 0.0014346837997436523, 0.001626431941986084, 0.0018181800842285156, 0.0020099282264709473, 0.002201676368713379, 0.0023934245109558105, 0.002585172653198242, 0.002776920795440674, 0.0029686689376831055, 0.003160417079925537, 0.0033521652221679688, 0.0035439133644104004, 0.003735661506652832, 0.003927409648895264, 0.004119157791137695, 0.004310905933380127, 0.004502654075622559, 0.00469440221786499, 0.004886150360107422, 0.0050778985023498535, 0.005269646644592285, 0.005461394786834717, 0.0056531429290771484, 0.00584489107131958, 0.006036639213562012, 0.006228387355804443, 0.006420135498046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 7.0, 18.0, 27.0, 27.0, 58.0, 153.0, 220.0, 203.0, 118.0, 88.0, 34.0, 16.0, 13.0, 6.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.00021215900778770447, -0.0002064034342765808, -0.00020064786076545715, -0.0001948922872543335, -0.00018913671374320984, -0.00018338114023208618, -0.00017762556672096252, -0.00017186999320983887, -0.0001661144196987152, -0.00016035884618759155, -0.0001546032726764679, -0.00014884769916534424, -0.00014309212565422058, -0.00013733655214309692, -0.00013158097863197327, -0.0001258254051208496, -0.00012006983160972595, -0.0001143142580986023, -0.00010855868458747864, -0.00010280311107635498, -9.704753756523132e-05, -9.129196405410767e-05, -8.553639054298401e-05, -7.978081703186035e-05, -7.40252435207367e-05, -6.826967000961304e-05, -6.251409649848938e-05, -5.675852298736572e-05, -5.1002949476242065e-05, -4.524737596511841e-05, -3.949180245399475e-05, -3.3736228942871094e-05, -2.7980655431747437e-05, -2.222508192062378e-05, -1.6469508409500122e-05, -1.0713934898376465e-05, -4.958361387252808e-06, 7.972121238708496e-07, 6.552785634994507e-06, 1.2308359146118164e-05, 1.806393265724182e-05, 2.381950616836548e-05, 2.9575079679489136e-05, 3.533065319061279e-05, 4.108622670173645e-05, 4.684180021286011e-05, 5.2597373723983765e-05, 5.835294723510742e-05, 6.410852074623108e-05, 6.986409425735474e-05, 7.56196677684784e-05, 8.137524127960205e-05, 8.713081479072571e-05, 9.288638830184937e-05, 9.864196181297302e-05, 0.00010439753532409668, 0.00011015310883522034, 0.000115908682346344, 0.00012166425585746765, 0.0001274198293685913, 0.00013317540287971497, 0.00013893097639083862, 0.00014468654990196228, 0.00015044212341308594]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 14.0, 32.0, 37.0, 77.0, 126.0, 256.0, 540.0, 1222.0, 3426.0, 14051.0, 112413.0, 811934.0, 87091.0, 12046.0, 3112.0, 1101.0, 477.0, 238.0, 140.0, 99.0, 40.0, 30.0, 13.0, 11.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0166473388671875, -0.016177773475646973, -0.015708208084106445, -0.015238642692565918, -0.01476907730102539, -0.014299511909484863, -0.013829946517944336, -0.013360381126403809, -0.012890815734863281, -0.012421250343322754, -0.011951684951782227, -0.0114821195602417, -0.011012554168701172, -0.010542988777160645, -0.010073423385620117, -0.00960385799407959, -0.009134292602539062, -0.008664727210998535, -0.008195161819458008, -0.0077255964279174805, -0.007256031036376953, -0.006786465644836426, -0.0063169002532958984, -0.005847334861755371, -0.005377769470214844, -0.004908204078674316, -0.004438638687133789, -0.003969073295593262, -0.0034995079040527344, -0.003029942512512207, -0.0025603771209716797, -0.0020908117294311523, -0.001621246337890625, -0.0011516809463500977, -0.0006821155548095703, -0.00021255016326904297, 0.0002570152282714844, 0.0007265806198120117, 0.001196146011352539, 0.0016657114028930664, 0.0021352767944335938, 0.002604842185974121, 0.0030744075775146484, 0.0035439729690551758, 0.004013538360595703, 0.0044831037521362305, 0.004952669143676758, 0.005422234535217285, 0.0058917999267578125, 0.00636136531829834, 0.006830930709838867, 0.0073004961013793945, 0.007770061492919922, 0.00823962688446045, 0.008709192276000977, 0.009178757667541504, 0.009648323059082031, 0.010117888450622559, 0.010587453842163086, 0.011057019233703613, 0.01152658462524414, 0.011996150016784668, 0.012465715408325195, 0.012935280799865723, 0.01340484619140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 7.0, 8.0, 9.0, 12.0, 21.0, 25.0, 34.0, 70.0, 117.0, 114.0, 152.0, 135.0, 91.0, 66.0, 33.0, 21.0, 17.0, 15.0, 5.0, 13.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006931304931640625, -0.006607115268707275, -0.006282925605773926, -0.005958735942840576, -0.0056345462799072266, -0.005310356616973877, -0.004986166954040527, -0.004661977291107178, -0.004337787628173828, -0.0040135979652404785, -0.003689408302307129, -0.0033652186393737793, -0.0030410289764404297, -0.00271683931350708, -0.0023926496505737305, -0.002068459987640381, -0.0017442703247070312, -0.0014200806617736816, -0.001095890998840332, -0.0007717013359069824, -0.0004475116729736328, -0.0001233220100402832, 0.0002008676528930664, 0.000525057315826416, 0.0008492469787597656, 0.0011734366416931152, 0.0014976263046264648, 0.0018218159675598145, 0.002146005630493164, 0.0024701952934265137, 0.0027943849563598633, 0.003118574619293213, 0.0034427642822265625, 0.003766953945159912, 0.004091143608093262, 0.004415333271026611, 0.004739522933959961, 0.0050637125968933105, 0.00538790225982666, 0.00571209192276001, 0.006036281585693359, 0.006360471248626709, 0.006684660911560059, 0.007008850574493408, 0.007333040237426758, 0.007657229900360107, 0.007981419563293457, 0.008305609226226807, 0.008629798889160156, 0.008953988552093506, 0.009278178215026855, 0.009602367877960205, 0.009926557540893555, 0.010250747203826904, 0.010574936866760254, 0.010899126529693604, 0.011223316192626953, 0.011547505855560303, 0.011871695518493652, 0.012195885181427002, 0.012520074844360352, 0.012844264507293701, 0.01316845417022705, 0.0134926438331604, 0.01381683349609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 12.0, 112.0, 586.0, 247.0, 37.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15375575423240662, -0.14257372915744781, -0.131391704082489, -0.12020967155694962, -0.10902764648199081, -0.09784562140703201, -0.08666358888149261, -0.07548156380653381, -0.06429953873157501, -0.05311751365661621, -0.04193548485636711, -0.03075345605611801, -0.01957143098115921, -0.008389405906200409, 0.0027926266193389893, 0.01397465169429779, 0.025156676769256592, 0.03633870184421539, 0.04752073064446449, 0.05870275944471359, 0.0698847845196724, 0.0810668095946312, 0.0922488421201706, 0.1034308671951294, 0.1146128922700882, 0.125794917345047, 0.1369769424200058, 0.1481589674949646, 0.1593410074710846, 0.1705230176448822, 0.1817050576210022, 0.192887082695961, 0.2040690779685974, 0.2152511030435562, 0.22643312811851501, 0.237615168094635, 0.24879717826843262, 0.2599792182445526, 0.2711612582206726, 0.2823432683944702, 0.2935252785682678, 0.3047073185443878, 0.3158893287181854, 0.3270713686943054, 0.338253378868103, 0.349435418844223, 0.360617458820343, 0.3717994689941406, 0.3829815089702606, 0.3941635489463806, 0.4053455591201782, 0.4165275990962982, 0.4277096092700958, 0.4388916492462158, 0.4500736594200134, 0.4612556993961334, 0.4724377393722534, 0.4836197793483734, 0.494801789522171, 0.505983829498291, 0.5171658396720886, 0.5283478498458862, 0.5395299196243286, 0.5507119297981262, 0.5618939399719238]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 16.0, 17.0, 17.0, 19.0, 19.0, 32.0, 36.0, 36.0, 34.0, 41.0, 38.0, 40.0, 51.0, 48.0, 45.0, 53.0, 49.0, 36.0, 35.0, 37.0, 31.0, 33.0, 29.0, 31.0, 31.0, 31.0, 16.0, 15.0, 16.0, 11.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07513010501861572, -0.07288433611392975, -0.07063857465982437, -0.0683928057551384, -0.06614704430103302, -0.06390127539634705, -0.06165550649166107, -0.059409741312265396, -0.05716397613286972, -0.054918210953474045, -0.05267244577407837, -0.050426676869392395, -0.04818091168999672, -0.045935146510601044, -0.04368937760591507, -0.041443612426519394, -0.03919784724712372, -0.03695208206772804, -0.03470631688833237, -0.03246054798364639, -0.030214782804250717, -0.02796901762485504, -0.025723250582814217, -0.02347748354077339, -0.021231718361377716, -0.01898595318198204, -0.016740186139941216, -0.014494420029222965, -0.012248653918504715, -0.010002887807786465, -0.007757121697068214, -0.0055113546550273895, -0.003265589475631714, -0.0010198233649134636, 0.0012259427458047867, 0.003471708856523037, 0.005717474967241287, 0.007963241077959538, 0.010209007188677788, 0.012454774230718613, 0.014700539410114288, 0.016946304589509964, 0.01919207163155079, 0.021437838673591614, 0.02368360385298729, 0.025929369032382965, 0.02817513607442379, 0.030420903116464615, 0.03266666829586029, 0.034912433475255966, 0.03715819865465164, 0.039403967559337616, 0.04164973273873329, 0.04389549791812897, 0.04614126682281494, 0.04838703200221062, 0.05063279718160629, 0.05287856236100197, 0.055124327540397644, 0.05737009644508362, 0.059615861624479294, 0.06186162680387497, 0.06410739570856094, 0.06635315716266632, 0.0685989260673523]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 3.0, 8.0, 16.0, 25.0, 37.0, 93.0, 286.0, 658.0, 1166.0, 1485.0, 2422.0, 8542.0, 238502.0, 3910507.0, 23033.0, 3787.0, 1735.0, 819.0, 387.0, 291.0, 244.0, 99.0, 40.0, 25.0, 18.0, 12.0, 11.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.0379328727722168, -0.036589622497558594, -0.03524637222290039, -0.03390312194824219, -0.032559871673583984, -0.03121662139892578, -0.029873371124267578, -0.028530120849609375, -0.027186870574951172, -0.02584362030029297, -0.024500370025634766, -0.023157119750976562, -0.02181386947631836, -0.020470619201660156, -0.019127368927001953, -0.01778411865234375, -0.016440868377685547, -0.015097618103027344, -0.01375436782836914, -0.012411117553710938, -0.011067867279052734, -0.009724617004394531, -0.008381366729736328, -0.007038116455078125, -0.005694866180419922, -0.004351615905761719, -0.0030083656311035156, -0.0016651153564453125, -0.0003218650817871094, 0.0010213851928710938, 0.002364635467529297, 0.0037078857421875, 0.005051136016845703, 0.006394386291503906, 0.007737636566162109, 0.009080886840820312, 0.010424137115478516, 0.011767387390136719, 0.013110637664794922, 0.014453887939453125, 0.015797138214111328, 0.01714038848876953, 0.018483638763427734, 0.019826889038085938, 0.02117013931274414, 0.022513389587402344, 0.023856639862060547, 0.02519989013671875, 0.026543140411376953, 0.027886390686035156, 0.02922964096069336, 0.030572891235351562, 0.031916141510009766, 0.03325939178466797, 0.03460264205932617, 0.035945892333984375, 0.03728914260864258, 0.03863239288330078, 0.039975643157958984, 0.04131889343261719, 0.04266214370727539, 0.044005393981933594, 0.0453486442565918, 0.04669189453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 15.0, 88.0, 262.0, 372.0, 201.0, 53.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06346893310546875, -0.0615081787109375, -0.05954742431640625, -0.057586669921875, -0.05562591552734375, -0.0536651611328125, -0.05170440673828125, -0.04974365234375, -0.04778289794921875, -0.0458221435546875, -0.04386138916015625, -0.041900634765625, -0.03993988037109375, -0.0379791259765625, -0.03601837158203125, -0.0340576171875, -0.03209686279296875, -0.0301361083984375, -0.02817535400390625, -0.026214599609375, -0.02425384521484375, -0.0222930908203125, -0.02033233642578125, -0.01837158203125, -0.01641082763671875, -0.0144500732421875, -0.01248931884765625, -0.010528564453125, -0.00856781005859375, -0.0066070556640625, -0.00464630126953125, -0.002685546875, -0.00072479248046875, 0.0012359619140625, 0.00319671630859375, 0.005157470703125, 0.00711822509765625, 0.0090789794921875, 0.01103973388671875, 0.01300048828125, 0.01496124267578125, 0.0169219970703125, 0.01888275146484375, 0.020843505859375, 0.02280426025390625, 0.0247650146484375, 0.02672576904296875, 0.0286865234375, 0.03064727783203125, 0.0326080322265625, 0.03456878662109375, 0.036529541015625, 0.03849029541015625, 0.0404510498046875, 0.04241180419921875, 0.04437255859375, 0.04633331298828125, 0.0482940673828125, 0.05025482177734375, 0.052215576171875, 0.05417633056640625, 0.0561370849609375, 0.05809783935546875, 0.06005859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 6.0, 12.0, 13.0, 16.0, 20.0, 28.0, 55.0, 90.0, 120.0, 193.0, 296.0, 603.0, 1236.0, 3080.0, 8707.0, 32822.0, 186715.0, 3540404.0, 351426.0, 48814.0, 12431.0, 3989.0, 1599.0, 696.0, 363.0, 187.0, 117.0, 76.0, 43.0, 30.0, 31.0, 13.0, 14.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0187835693359375, -0.018284320831298828, -0.017785072326660156, -0.017285823822021484, -0.016786575317382812, -0.01628732681274414, -0.01578807830810547, -0.015288829803466797, -0.014789581298828125, -0.014290332794189453, -0.013791084289550781, -0.01329183578491211, -0.012792587280273438, -0.012293338775634766, -0.011794090270996094, -0.011294841766357422, -0.01079559326171875, -0.010296344757080078, -0.009797096252441406, -0.009297847747802734, -0.008798599243164062, -0.00829935073852539, -0.007800102233886719, -0.007300853729248047, -0.006801605224609375, -0.006302356719970703, -0.005803108215332031, -0.005303859710693359, -0.0048046112060546875, -0.004305362701416016, -0.0038061141967773438, -0.003306865692138672, -0.0028076171875, -0.002308368682861328, -0.0018091201782226562, -0.0013098716735839844, -0.0008106231689453125, -0.0003113746643066406, 0.00018787384033203125, 0.0006871223449707031, 0.001186370849609375, 0.0016856193542480469, 0.0021848678588867188, 0.0026841163635253906, 0.0031833648681640625, 0.0036826133728027344, 0.004181861877441406, 0.004681110382080078, 0.00518035888671875, 0.005679607391357422, 0.006178855895996094, 0.006678104400634766, 0.0071773529052734375, 0.007676601409912109, 0.008175849914550781, 0.008675098419189453, 0.009174346923828125, 0.009673595428466797, 0.010172843933105469, 0.01067209243774414, 0.011171340942382812, 0.011670589447021484, 0.012169837951660156, 0.012669086456298828, 0.0131683349609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 2.0, 7.0, 15.0, 20.0, 20.0, 32.0, 45.0, 61.0, 112.0, 246.0, 593.0, 1277.0, 808.0, 327.0, 150.0, 95.0, 58.0, 59.0, 32.0, 27.0, 16.0, 8.0, 11.0, 9.0, 6.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01275634765625, -0.012376904487609863, -0.011997461318969727, -0.01161801815032959, -0.011238574981689453, -0.010859131813049316, -0.01047968864440918, -0.010100245475769043, -0.009720802307128906, -0.00934135913848877, -0.008961915969848633, -0.008582472801208496, -0.00820302963256836, -0.007823586463928223, -0.007444143295288086, -0.007064700126647949, -0.0066852569580078125, -0.006305813789367676, -0.005926370620727539, -0.005546927452087402, -0.005167484283447266, -0.004788041114807129, -0.004408597946166992, -0.0040291547775268555, -0.0036497116088867188, -0.003270268440246582, -0.0028908252716064453, -0.0025113821029663086, -0.002131938934326172, -0.0017524957656860352, -0.0013730525970458984, -0.0009936094284057617, -0.000614166259765625, -0.00023472309112548828, 0.00014472007751464844, 0.0005241632461547852, 0.0009036064147949219, 0.0012830495834350586, 0.0016624927520751953, 0.002041935920715332, 0.0024213790893554688, 0.0028008222579956055, 0.003180265426635742, 0.003559708595275879, 0.003939151763916016, 0.004318594932556152, 0.004698038101196289, 0.005077481269836426, 0.0054569244384765625, 0.005836367607116699, 0.006215810775756836, 0.006595253944396973, 0.006974697113037109, 0.007354140281677246, 0.007733583450317383, 0.00811302661895752, 0.008492469787597656, 0.008871912956237793, 0.00925135612487793, 0.009630799293518066, 0.010010242462158203, 0.01038968563079834, 0.010769128799438477, 0.011148571968078613, 0.01152801513671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 13.0, 46.0, 143.0, 360.0, 273.0, 121.0, 34.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17345602810382843, -0.16957254707813263, -0.16568908095359802, -0.16180559992790222, -0.15792211890220642, -0.15403863787651062, -0.150155171751976, -0.1462716907262802, -0.1423882246017456, -0.1385047435760498, -0.1346212774515152, -0.1307377964258194, -0.1268543154001236, -0.12297084182500839, -0.11908736824989319, -0.11520388722419739, -0.11132040619850159, -0.10743693262338638, -0.10355345159769058, -0.09966997802257538, -0.09578649699687958, -0.09190302342176437, -0.08801954984664917, -0.08413606882095337, -0.08025259524583817, -0.07636912167072296, -0.07248564064502716, -0.06860216706991196, -0.06471869349479675, -0.06083521246910095, -0.05695173889398575, -0.053068261593580246, -0.04918479174375534, -0.04530131444334984, -0.041417837142944336, -0.03753436356782913, -0.03365088626742363, -0.029767408967018127, -0.025883933529257774, -0.02200045809149742, -0.01811698079109192, -0.014233504422008991, -0.010350028052926064, -0.006466551683843136, -0.002583075314760208, 0.0013004019856452942, 0.005183877423405647, 0.009067352861166, 0.012950830161571503, 0.016834307461977005, 0.020717782899737358, 0.02460125833749771, 0.028484735637903214, 0.032368212938308716, 0.03625168651342392, 0.04013516381382942, 0.044018641114234924, 0.04790211841464043, 0.05178559571504593, 0.05566906929016113, 0.059552546590566635, 0.06343602389097214, 0.06731949746608734, 0.07120297849178314, 0.07508645206689835]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 5.0, 6.0, 15.0, 20.0, 17.0, 15.0, 19.0, 20.0, 30.0, 36.0, 26.0, 32.0, 40.0, 38.0, 34.0, 39.0, 50.0, 39.0, 44.0, 40.0, 40.0, 46.0, 38.0, 32.0, 33.0, 28.0, 32.0, 20.0, 19.0, 19.0, 14.0, 18.0, 16.0, 15.0, 7.0, 4.0, 6.0, 5.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02538299560546875, -0.024583134800195694, -0.023783275857567787, -0.02298341691493988, -0.022183556109666824, -0.02138369530439377, -0.02058383636176586, -0.019783977419137955, -0.0189841166138649, -0.018184255808591843, -0.017384396865963936, -0.01658453792333603, -0.015784677118062973, -0.014984817244112492, -0.01418495737016201, -0.013385097496211529, -0.012585237622261047, -0.011785377748310566, -0.010985517874360085, -0.010185658000409603, -0.009385798126459122, -0.00858593825250864, -0.007786078378558159, -0.0069862185046076775, -0.006186358630657196, -0.005386498756706715, -0.004586638882756233, -0.003786779008805752, -0.0029869191348552704, -0.002187059260904789, -0.0013871993869543076, -0.0005873395130038261, 0.00021252036094665527, 0.0010123802348971367, 0.001812240108847618, 0.0026120999827980995, 0.003411959856748581, 0.004211819730699062, 0.005011679604649544, 0.005811539478600025, 0.006611399352550507, 0.007411259226500988, 0.00821111910045147, 0.00901097897440195, 0.009810838848352432, 0.010610698722302914, 0.011410558596253395, 0.012210418470203876, 0.013010278344154358, 0.01381013821810484, 0.01460999809205532, 0.015409857966005802, 0.016209717839956284, 0.01700957864522934, 0.017809437587857246, 0.018609296530485153, 0.01940915733575821, 0.020209018141031265, 0.021008877083659172, 0.02180873602628708, 0.022608596831560135, 0.02340845763683319, 0.024208316579461098, 0.025008175522089005, 0.02580803632736206]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 12.0, 13.0, 19.0, 13.0, 25.0, 24.0, 30.0, 39.0, 69.0, 76.0, 121.0, 141.0, 195.0, 275.0, 367.0, 624.0, 1114.0, 3213.0, 22214.0, 548118.0, 447588.0, 18395.0, 2893.0, 969.0, 576.0, 392.0, 251.0, 193.0, 123.0, 97.0, 92.0, 59.0, 46.0, 46.0, 35.0, 16.0, 17.0, 12.0, 13.0, 7.0, 5.0, 3.0, 9.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.043548583984375, -0.042095184326171875, -0.04064178466796875, -0.039188385009765625, -0.0377349853515625, -0.036281585693359375, -0.03482818603515625, -0.033374786376953125, -0.03192138671875, -0.030467987060546875, -0.02901458740234375, -0.027561187744140625, -0.0261077880859375, -0.024654388427734375, -0.02320098876953125, -0.021747589111328125, -0.020294189453125, -0.018840789794921875, -0.01738739013671875, -0.015933990478515625, -0.0144805908203125, -0.013027191162109375, -0.01157379150390625, -0.010120391845703125, -0.0086669921875, -0.007213592529296875, -0.00576019287109375, -0.004306793212890625, -0.0028533935546875, -0.001399993896484375, 5.340576171875e-05, 0.001506805419921875, 0.002960205078125, 0.004413604736328125, 0.00586700439453125, 0.007320404052734375, 0.0087738037109375, 0.010227203369140625, 0.01168060302734375, 0.013134002685546875, 0.01458740234375, 0.016040802001953125, 0.01749420166015625, 0.018947601318359375, 0.0204010009765625, 0.021854400634765625, 0.02330780029296875, 0.024761199951171875, 0.026214599609375, 0.027667999267578125, 0.02912139892578125, 0.030574798583984375, 0.0320281982421875, 0.033481597900390625, 0.03493499755859375, 0.036388397216796875, 0.037841796875, 0.039295196533203125, 0.04074859619140625, 0.042201995849609375, 0.0436553955078125, 0.045108795166015625, 0.04656219482421875, 0.048015594482421875, 0.049468994140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 25.0, 118.0, 319.0, 361.0, 145.0, 26.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06493473052978516, -0.06291389465332031, -0.06089305877685547, -0.058872222900390625, -0.05685138702392578, -0.05483055114746094, -0.052809715270996094, -0.05078887939453125, -0.048768043518066406, -0.04674720764160156, -0.04472637176513672, -0.042705535888671875, -0.04068470001220703, -0.03866386413574219, -0.036643028259277344, -0.0346221923828125, -0.032601356506347656, -0.030580520629882812, -0.02855968475341797, -0.026538848876953125, -0.02451801300048828, -0.022497177124023438, -0.020476341247558594, -0.01845550537109375, -0.016434669494628906, -0.014413833618164062, -0.012392997741699219, -0.010372161865234375, -0.008351325988769531, -0.0063304901123046875, -0.004309654235839844, -0.002288818359375, -0.00026798248291015625, 0.0017528533935546875, 0.0037736892700195312, 0.005794525146484375, 0.007815361022949219, 0.009836196899414062, 0.011857032775878906, 0.01387786865234375, 0.015898704528808594, 0.017919540405273438, 0.01994037628173828, 0.021961212158203125, 0.02398204803466797, 0.026002883911132812, 0.028023719787597656, 0.0300445556640625, 0.032065391540527344, 0.03408622741699219, 0.03610706329345703, 0.038127899169921875, 0.04014873504638672, 0.04216957092285156, 0.044190406799316406, 0.04621124267578125, 0.048232078552246094, 0.05025291442871094, 0.05227375030517578, 0.054294586181640625, 0.05631542205810547, 0.05833625793457031, 0.060357093811035156, 0.0623779296875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 10.0, 11.0, 19.0, 14.0, 30.0, 57.0, 98.0, 150.0, 334.0, 1064.0, 4389.0, 45974.0, 811919.0, 172981.0, 8792.0, 1656.0, 540.0, 200.0, 104.0, 53.0, 44.0, 36.0, 19.0, 11.0, 10.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.057647705078125, -0.056157588958740234, -0.05466747283935547, -0.0531773567199707, -0.05168724060058594, -0.05019712448120117, -0.048707008361816406, -0.04721689224243164, -0.045726776123046875, -0.04423666000366211, -0.042746543884277344, -0.04125642776489258, -0.03976631164550781, -0.03827619552612305, -0.03678607940673828, -0.035295963287353516, -0.03380584716796875, -0.032315731048583984, -0.03082561492919922, -0.029335498809814453, -0.027845382690429688, -0.026355266571044922, -0.024865150451660156, -0.02337503433227539, -0.021884918212890625, -0.02039480209350586, -0.018904685974121094, -0.017414569854736328, -0.015924453735351562, -0.014434337615966797, -0.012944221496582031, -0.011454105377197266, -0.0099639892578125, -0.008473873138427734, -0.006983757019042969, -0.005493640899658203, -0.0040035247802734375, -0.002513408660888672, -0.0010232925415039062, 0.0004668235778808594, 0.001956939697265625, 0.0034470558166503906, 0.004937171936035156, 0.006427288055419922, 0.007917404174804688, 0.009407520294189453, 0.010897636413574219, 0.012387752532958984, 0.01387786865234375, 0.015367984771728516, 0.01685810089111328, 0.018348217010498047, 0.019838333129882812, 0.021328449249267578, 0.022818565368652344, 0.02430868148803711, 0.025798797607421875, 0.02728891372680664, 0.028779029846191406, 0.030269145965576172, 0.03175926208496094, 0.0332493782043457, 0.03473949432373047, 0.036229610443115234, 0.0377197265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 5.0, 11.0, 16.0, 24.0, 24.0, 25.0, 28.0, 40.0, 51.0, 46.0, 53.0, 43.0, 57.0, 56.0, 58.0, 54.0, 43.0, 50.0, 59.0, 40.0, 44.0, 35.0, 17.0, 24.0, 24.0, 15.0, 10.0, 10.0, 4.0, 10.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024688720703125, -0.02373027801513672, -0.022771835327148438, -0.021813392639160156, -0.020854949951171875, -0.019896507263183594, -0.018938064575195312, -0.01797962188720703, -0.01702117919921875, -0.01606273651123047, -0.015104293823242188, -0.014145851135253906, -0.013187408447265625, -0.012228965759277344, -0.011270523071289062, -0.010312080383300781, -0.0093536376953125, -0.008395195007324219, -0.0074367523193359375, -0.006478309631347656, -0.005519866943359375, -0.004561424255371094, -0.0036029815673828125, -0.0026445388793945312, -0.00168609619140625, -0.0007276535034179688, 0.0002307891845703125, 0.0011892318725585938, 0.002147674560546875, 0.0031061172485351562, 0.0040645599365234375, 0.005023002624511719, 0.0059814453125, 0.006939888000488281, 0.007898330688476562, 0.008856773376464844, 0.009815216064453125, 0.010773658752441406, 0.011732101440429688, 0.012690544128417969, 0.01364898681640625, 0.014607429504394531, 0.015565872192382812, 0.016524314880371094, 0.017482757568359375, 0.018441200256347656, 0.019399642944335938, 0.02035808563232422, 0.0213165283203125, 0.02227497100830078, 0.023233413696289062, 0.024191856384277344, 0.025150299072265625, 0.026108741760253906, 0.027067184448242188, 0.02802562713623047, 0.02898406982421875, 0.02994251251220703, 0.030900955200195312, 0.031859397888183594, 0.032817840576171875, 0.033776283264160156, 0.03473472595214844, 0.03569316864013672, 0.036651611328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 9.0, 15.0, 29.0, 16.0, 25.0, 46.0, 55.0, 73.0, 86.0, 141.0, 174.0, 254.0, 357.0, 420.0, 629.0, 808.0, 1248.0, 1697.0, 2507.0, 3974.0, 7201.0, 19719.0, 92532.0, 713864.0, 153103.0, 26993.0, 8649.0, 4466.0, 2785.0, 1867.0, 1287.0, 917.0, 660.0, 494.0, 386.0, 271.0, 182.0, 157.0, 133.0, 86.0, 55.0, 37.0, 32.0, 16.0, 26.0, 17.0, 10.0, 8.0, 10.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0113067626953125, -0.010949134826660156, -0.010591506958007812, -0.010233879089355469, -0.009876251220703125, -0.009518623352050781, -0.009160995483398438, -0.008803367614746094, -0.00844573974609375, -0.008088111877441406, -0.0077304840087890625, -0.007372856140136719, -0.007015228271484375, -0.006657600402832031, -0.0062999725341796875, -0.005942344665527344, -0.005584716796875, -0.005227088928222656, -0.0048694610595703125, -0.004511833190917969, -0.004154205322265625, -0.0037965774536132812, -0.0034389495849609375, -0.0030813217163085938, -0.00272369384765625, -0.0023660659790039062, -0.0020084381103515625, -0.0016508102416992188, -0.001293182373046875, -0.0009355545043945312, -0.0005779266357421875, -0.00022029876708984375, 0.0001373291015625, 0.0004949569702148438, 0.0008525848388671875, 0.0012102127075195312, 0.001567840576171875, 0.0019254684448242188, 0.0022830963134765625, 0.0026407241821289062, 0.00299835205078125, 0.0033559799194335938, 0.0037136077880859375, 0.004071235656738281, 0.004428863525390625, 0.004786491394042969, 0.0051441192626953125, 0.005501747131347656, 0.005859375, 0.006217002868652344, 0.0065746307373046875, 0.006932258605957031, 0.007289886474609375, 0.007647514343261719, 0.008005142211914062, 0.008362770080566406, 0.00872039794921875, 0.009078025817871094, 0.009435653686523438, 0.009793281555175781, 0.010150909423828125, 0.010508537292480469, 0.010866165161132812, 0.011223793029785156, 0.0115814208984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 8.0, 19.0, 36.0, 50.0, 81.0, 121.0, 164.0, 140.0, 146.0, 90.0, 40.0, 34.0, 18.0, 13.0, 5.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014734268188476562, -0.0001427382230758667, -0.00013813376426696777, -0.00013352930545806885, -0.00012892484664916992, -0.000124320387840271, -0.00011971592903137207, -0.00011511147022247314, -0.00011050701141357422, -0.00010590255260467529, -0.00010129809379577637, -9.669363498687744e-05, -9.208917617797852e-05, -8.748471736907959e-05, -8.288025856018066e-05, -7.827579975128174e-05, -7.367134094238281e-05, -6.906688213348389e-05, -6.446242332458496e-05, -5.9857964515686035e-05, -5.525350570678711e-05, -5.0649046897888184e-05, -4.604458808898926e-05, -4.144012928009033e-05, -3.6835670471191406e-05, -3.223121166229248e-05, -2.7626752853393555e-05, -2.302229404449463e-05, -1.8417835235595703e-05, -1.3813376426696777e-05, -9.208917617797852e-06, -4.604458808898926e-06, 0.0, 4.604458808898926e-06, 9.208917617797852e-06, 1.3813376426696777e-05, 1.8417835235595703e-05, 2.302229404449463e-05, 2.7626752853393555e-05, 3.223121166229248e-05, 3.6835670471191406e-05, 4.144012928009033e-05, 4.604458808898926e-05, 5.0649046897888184e-05, 5.525350570678711e-05, 5.9857964515686035e-05, 6.446242332458496e-05, 6.906688213348389e-05, 7.367134094238281e-05, 7.827579975128174e-05, 8.288025856018066e-05, 8.748471736907959e-05, 9.208917617797852e-05, 9.669363498687744e-05, 0.00010129809379577637, 0.00010590255260467529, 0.00011050701141357422, 0.00011511147022247314, 0.00011971592903137207, 0.000124320387840271, 0.00012892484664916992, 0.00013352930545806885, 0.00013813376426696777, 0.0001427382230758667, 0.00014734268188476562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 8.0, 4.0, 5.0, 6.0, 11.0, 12.0, 12.0, 25.0, 31.0, 50.0, 75.0, 114.0, 215.0, 388.0, 775.0, 1459.0, 3297.0, 8730.0, 33974.0, 346728.0, 588613.0, 45977.0, 10629.0, 3685.0, 1802.0, 827.0, 452.0, 245.0, 146.0, 86.0, 59.0, 34.0, 26.0, 17.0, 11.0, 9.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.016937255859375, -0.016425371170043945, -0.01591348648071289, -0.015401601791381836, -0.014889717102050781, -0.014377832412719727, -0.013865947723388672, -0.013354063034057617, -0.012842178344726562, -0.012330293655395508, -0.011818408966064453, -0.011306524276733398, -0.010794639587402344, -0.010282754898071289, -0.009770870208740234, -0.00925898551940918, -0.008747100830078125, -0.00823521614074707, -0.007723331451416016, -0.007211446762084961, -0.006699562072753906, -0.0061876773834228516, -0.005675792694091797, -0.005163908004760742, -0.0046520233154296875, -0.004140138626098633, -0.003628253936767578, -0.0031163692474365234, -0.0026044845581054688, -0.002092599868774414, -0.0015807151794433594, -0.0010688304901123047, -0.00055694580078125, -4.506111145019531e-05, 0.0004668235778808594, 0.000978708267211914, 0.0014905929565429688, 0.0020024776458740234, 0.002514362335205078, 0.003026247024536133, 0.0035381317138671875, 0.004050016403198242, 0.004561901092529297, 0.0050737857818603516, 0.005585670471191406, 0.006097555160522461, 0.006609439849853516, 0.00712132453918457, 0.007633209228515625, 0.00814509391784668, 0.008656978607177734, 0.009168863296508789, 0.009680747985839844, 0.010192632675170898, 0.010704517364501953, 0.011216402053833008, 0.011728286743164062, 0.012240171432495117, 0.012752056121826172, 0.013263940811157227, 0.013775825500488281, 0.014287710189819336, 0.01479959487915039, 0.015311479568481445, 0.0158233642578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 2.0, 8.0, 11.0, 13.0, 39.0, 126.0, 256.0, 303.0, 131.0, 47.0, 27.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015960693359375, -0.015298604965209961, -0.014636516571044922, -0.013974428176879883, -0.013312339782714844, -0.012650251388549805, -0.011988162994384766, -0.011326074600219727, -0.010663986206054688, -0.010001897811889648, -0.00933980941772461, -0.00867772102355957, -0.008015632629394531, -0.007353544235229492, -0.006691455841064453, -0.006029367446899414, -0.005367279052734375, -0.004705190658569336, -0.004043102264404297, -0.003381013870239258, -0.0027189254760742188, -0.0020568370819091797, -0.0013947486877441406, -0.0007326602935791016, -7.05718994140625e-05, 0.0005915164947509766, 0.0012536048889160156, 0.0019156932830810547, 0.0025777816772460938, 0.003239870071411133, 0.003901958465576172, 0.004564046859741211, 0.00522613525390625, 0.005888223648071289, 0.006550312042236328, 0.007212400436401367, 0.007874488830566406, 0.008536577224731445, 0.009198665618896484, 0.009860754013061523, 0.010522842407226562, 0.011184930801391602, 0.01184701919555664, 0.01250910758972168, 0.013171195983886719, 0.013833284378051758, 0.014495372772216797, 0.015157461166381836, 0.015819549560546875, 0.016481637954711914, 0.017143726348876953, 0.017805814743041992, 0.01846790313720703, 0.01912999153137207, 0.01979207992553711, 0.02045416831970215, 0.021116256713867188, 0.021778345108032227, 0.022440433502197266, 0.023102521896362305, 0.023764610290527344, 0.024426698684692383, 0.025088787078857422, 0.02575087547302246, 0.0264129638671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 43.0, 535.0, 388.0, 35.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.201520323753357, -1.180418610572815, -1.1593170166015625, -1.1382153034210205, -1.1171135902404785, -1.096011996269226, -1.074910283088684, -1.0538086891174316, -1.0327069759368896, -1.0116052627563477, -0.9905036091804504, -0.9694019556045532, -0.948300302028656, -0.9271986484527588, -0.9060969352722168, -0.8849952816963196, -0.8638936281204224, -0.8427919745445251, -0.8216902613639832, -0.8005886077880859, -0.7794869542121887, -0.7583853006362915, -0.7372835874557495, -0.7161819338798523, -0.6950802206993103, -0.6739785671234131, -0.6528768539428711, -0.6317752003669739, -0.6106735467910767, -0.5895718932151794, -0.5684701800346375, -0.5473685264587402, -0.5262669324874878, -0.5051652789115906, -0.48406359553337097, -0.46296191215515137, -0.44186025857925415, -0.42075857520103455, -0.39965689182281494, -0.3785552382469177, -0.35745352506637573, -0.33635184168815613, -0.3152501881122589, -0.2941485047340393, -0.2730468511581421, -0.2519451677799225, -0.23084349930286407, -0.20974183082580566, -0.18864017724990845, -0.16753850877285004, -0.14643684029579163, -0.12533515691757202, -0.10423349589109421, -0.0831318274140358, -0.06203015148639679, -0.04092848300933838, -0.019826814532279968, 0.0012748558074235916, 0.02237652614712715, 0.04347819834947586, 0.06457986682653427, 0.08568153530359268, 0.10678321123123169, 0.1278848797082901, 0.1489865481853485]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 4.0, 2.0, 5.0, 12.0, 11.0, 17.0, 12.0, 16.0, 14.0, 20.0, 20.0, 24.0, 24.0, 37.0, 17.0, 37.0, 34.0, 39.0, 38.0, 39.0, 32.0, 43.0, 27.0, 45.0, 35.0, 30.0, 36.0, 24.0, 33.0, 32.0, 36.0, 19.0, 41.0, 17.0, 16.0, 10.0, 12.0, 14.0, 7.0, 13.0, 11.0, 9.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.07135003805160522, -0.06931910663843155, -0.06728818267583847, -0.0652572512626648, -0.06322632730007172, -0.06119539588689804, -0.059164464473724365, -0.05713353678584099, -0.05510260909795761, -0.053071681410074234, -0.05104075372219086, -0.04900982230901718, -0.046978894621133804, -0.04494796693325043, -0.04291703552007675, -0.040886107832193375, -0.03885518014431, -0.03682425245642662, -0.03479332476854324, -0.03276239335536957, -0.03073146566748619, -0.028700537979602814, -0.026669608429074287, -0.02463867887854576, -0.022607751190662384, -0.020576823502779007, -0.01854589395225048, -0.016514964401721954, -0.014484036713838577, -0.012453108094632626, -0.010422179475426674, -0.008391250856220722, -0.0063603222370147705, -0.004329393617808819, -0.002298464998602867, -0.00026753637939691544, 0.0017633922398090363, 0.003794320859014988, 0.00582524947822094, 0.007856178097426891, 0.009887106716632843, 0.011918035335838795, 0.013948963955044746, 0.015979893505573273, 0.01801082119345665, 0.020041748881340027, 0.022072678431868553, 0.02410360798239708, 0.026134535670280457, 0.028165463358163834, 0.03019639290869236, 0.032227322459220886, 0.03425825014710426, 0.03628917783498764, 0.038320109248161316, 0.04035103693604469, 0.04238196462392807, 0.04441289231181145, 0.046443819999694824, 0.0484747514128685, 0.05050567910075188, 0.052536606788635254, 0.05456753820180893, 0.056598465889692307, 0.058629393577575684]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 15.0, 19.0, 40.0, 87.0, 284.0, 595.0, 1410.0, 2187.0, 5635.0, 70659.0, 4062273.0, 43490.0, 4330.0, 1736.0, 644.0, 374.0, 289.0, 93.0, 39.0, 26.0, 17.0, 13.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05462646484375, -0.0529932975769043, -0.051360130310058594, -0.04972696304321289, -0.04809379577636719, -0.046460628509521484, -0.04482746124267578, -0.04319429397583008, -0.041561126708984375, -0.03992795944213867, -0.03829479217529297, -0.036661624908447266, -0.03502845764160156, -0.03339529037475586, -0.031762123107910156, -0.030128955841064453, -0.02849578857421875, -0.026862621307373047, -0.025229454040527344, -0.02359628677368164, -0.021963119506835938, -0.020329952239990234, -0.01869678497314453, -0.017063617706298828, -0.015430450439453125, -0.013797283172607422, -0.012164115905761719, -0.010530948638916016, -0.008897781372070312, -0.007264614105224609, -0.005631446838378906, -0.003998279571533203, -0.0023651123046875, -0.0007319450378417969, 0.0009012222290039062, 0.0025343894958496094, 0.0041675567626953125, 0.005800724029541016, 0.007433891296386719, 0.009067058563232422, 0.010700225830078125, 0.012333393096923828, 0.013966560363769531, 0.015599727630615234, 0.017232894897460938, 0.01886606216430664, 0.020499229431152344, 0.022132396697998047, 0.02376556396484375, 0.025398731231689453, 0.027031898498535156, 0.02866506576538086, 0.030298233032226562, 0.031931400299072266, 0.03356456756591797, 0.03519773483276367, 0.036830902099609375, 0.03846406936645508, 0.04009723663330078, 0.041730403900146484, 0.04336357116699219, 0.04499673843383789, 0.046629905700683594, 0.0482630729675293, 0.049896240234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 11.0, 55.0, 218.0, 368.0, 258.0, 76.0, 12.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.06295013427734375, -0.0609588623046875, -0.05896759033203125, -0.056976318359375, -0.05498504638671875, -0.0529937744140625, -0.05100250244140625, -0.04901123046875, -0.04701995849609375, -0.0450286865234375, -0.04303741455078125, -0.041046142578125, -0.03905487060546875, -0.0370635986328125, -0.03507232666015625, -0.0330810546875, -0.03108978271484375, -0.0290985107421875, -0.02710723876953125, -0.025115966796875, -0.02312469482421875, -0.0211334228515625, -0.01914215087890625, -0.01715087890625, -0.01515960693359375, -0.0131683349609375, -0.01117706298828125, -0.009185791015625, -0.00719451904296875, -0.0052032470703125, -0.00321197509765625, -0.001220703125, 0.00077056884765625, 0.0027618408203125, 0.00475311279296875, 0.006744384765625, 0.00873565673828125, 0.0107269287109375, 0.01271820068359375, 0.01470947265625, 0.01670074462890625, 0.0186920166015625, 0.02068328857421875, 0.022674560546875, 0.02466583251953125, 0.0266571044921875, 0.02864837646484375, 0.0306396484375, 0.03263092041015625, 0.0346221923828125, 0.03661346435546875, 0.038604736328125, 0.04059600830078125, 0.0425872802734375, 0.04457855224609375, 0.04656982421875, 0.04856109619140625, 0.0505523681640625, 0.05254364013671875, 0.054534912109375, 0.05652618408203125, 0.0585174560546875, 0.06050872802734375, 0.0625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 16.0, 13.0, 23.0, 48.0, 86.0, 161.0, 273.0, 617.0, 1278.0, 4048.0, 23801.0, 505604.0, 3585456.0, 61730.0, 7612.0, 1983.0, 767.0, 384.0, 184.0, 94.0, 57.0, 23.0, 15.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0262451171875, -0.025279998779296875, -0.02431488037109375, -0.023349761962890625, -0.0223846435546875, -0.021419525146484375, -0.02045440673828125, -0.019489288330078125, -0.018524169921875, -0.017559051513671875, -0.01659393310546875, -0.015628814697265625, -0.0146636962890625, -0.013698577880859375, -0.01273345947265625, -0.011768341064453125, -0.01080322265625, -0.009838104248046875, -0.00887298583984375, -0.007907867431640625, -0.0069427490234375, -0.005977630615234375, -0.00501251220703125, -0.004047393798828125, -0.003082275390625, -0.002117156982421875, -0.00115203857421875, -0.000186920166015625, 0.0007781982421875, 0.001743316650390625, 0.00270843505859375, 0.003673553466796875, 0.004638671875, 0.005603790283203125, 0.00656890869140625, 0.007534027099609375, 0.0084991455078125, 0.009464263916015625, 0.01042938232421875, 0.011394500732421875, 0.012359619140625, 0.013324737548828125, 0.01428985595703125, 0.015254974365234375, 0.0162200927734375, 0.017185211181640625, 0.01815032958984375, 0.019115447998046875, 0.02008056640625, 0.021045684814453125, 0.02201080322265625, 0.022975921630859375, 0.0239410400390625, 0.024906158447265625, 0.02587127685546875, 0.026836395263671875, 0.027801513671875, 0.028766632080078125, 0.02973175048828125, 0.030696868896484375, 0.0316619873046875, 0.032627105712890625, 0.03359222412109375, 0.034557342529296875, 0.0355224609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 7.0, 9.0, 18.0, 32.0, 50.0, 99.0, 262.0, 852.0, 1666.0, 610.0, 192.0, 105.0, 56.0, 40.0, 24.0, 18.0, 16.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.02491903305053711, -0.02423381805419922, -0.023548603057861328, -0.022863388061523438, -0.022178173065185547, -0.021492958068847656, -0.020807743072509766, -0.020122528076171875, -0.019437313079833984, -0.018752098083496094, -0.018066883087158203, -0.017381668090820312, -0.016696453094482422, -0.01601123809814453, -0.01532602310180664, -0.01464080810546875, -0.01395559310913086, -0.013270378112792969, -0.012585163116455078, -0.011899948120117188, -0.011214733123779297, -0.010529518127441406, -0.009844303131103516, -0.009159088134765625, -0.008473873138427734, -0.007788658142089844, -0.007103443145751953, -0.0064182281494140625, -0.005733013153076172, -0.005047798156738281, -0.004362583160400391, -0.0036773681640625, -0.0029921531677246094, -0.0023069381713867188, -0.0016217231750488281, -0.0009365081787109375, -0.0002512931823730469, 0.00043392181396484375, 0.0011191368103027344, 0.001804351806640625, 0.0024895668029785156, 0.0031747817993164062, 0.003859996795654297, 0.0045452117919921875, 0.005230426788330078, 0.005915641784667969, 0.006600856781005859, 0.00728607177734375, 0.00797128677368164, 0.008656501770019531, 0.009341716766357422, 0.010026931762695312, 0.010712146759033203, 0.011397361755371094, 0.012082576751708984, 0.012767791748046875, 0.013453006744384766, 0.014138221740722656, 0.014823436737060547, 0.015508651733398438, 0.016193866729736328, 0.01687908172607422, 0.01756429672241211, 0.01824951171875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 33.0, 93.0, 287.0, 359.0, 169.0, 44.0, 10.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.27695393562316895, -0.27163928747177124, -0.2663246691226959, -0.2610100507736206, -0.2556954026222229, -0.2503807544708252, -0.24506613612174988, -0.23975150287151337, -0.23443686962127686, -0.22912223637104034, -0.22380760312080383, -0.21849296987056732, -0.2131783366203308, -0.2078637033700943, -0.2025490701198578, -0.19723443686962128, -0.19191980361938477, -0.18660517036914825, -0.18129053711891174, -0.17597590386867523, -0.17066127061843872, -0.1653466373682022, -0.1600320041179657, -0.1547173708677292, -0.14940273761749268, -0.14408810436725616, -0.13877347111701965, -0.13345883786678314, -0.12814420461654663, -0.12282957136631012, -0.11751493811607361, -0.1122003048658371, -0.10688565671443939, -0.10157102346420288, -0.09625639021396637, -0.09094175696372986, -0.08562712371349335, -0.08031249046325684, -0.07499785721302032, -0.06968322396278381, -0.0643685907125473, -0.05905395746231079, -0.05373932421207428, -0.04842469096183777, -0.04311005771160126, -0.037795424461364746, -0.032480791211128235, -0.027166157960891724, -0.021851524710655212, -0.0165368914604187, -0.01122225821018219, -0.005907624959945679, -0.0005929917097091675, 0.004721641540527344, 0.010036274790763855, 0.015350908041000366, 0.020665541291236877, 0.02598017454147339, 0.0312948077917099, 0.03660944104194641, 0.04192407429218292, 0.047238707542419434, 0.052553340792655945, 0.057867974042892456, 0.06318260729312897]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 12.0, 9.0, 17.0, 17.0, 17.0, 18.0, 28.0, 28.0, 35.0, 27.0, 43.0, 50.0, 53.0, 58.0, 48.0, 37.0, 51.0, 54.0, 50.0, 46.0, 31.0, 40.0, 32.0, 22.0, 23.0, 23.0, 18.0, 14.0, 13.0, 19.0, 16.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.039634883403778076, -0.0384724959731102, -0.03731011226773262, -0.03614772856235504, -0.034985341131687164, -0.03382295370101929, -0.03266056999564171, -0.03149818629026413, -0.030335798859596252, -0.029173413291573524, -0.028011027723550797, -0.02684864215552807, -0.02568625658750534, -0.024523871019482613, -0.023361485451459885, -0.022199099883437157, -0.02103671431541443, -0.0198743287473917, -0.018711943179368973, -0.017549557611346245, -0.016387172043323517, -0.015224786475300789, -0.014062400907278061, -0.012900015339255333, -0.011737629771232605, -0.010575244203209877, -0.009412858635187149, -0.008250473067164421, -0.007088087499141693, -0.005925701931118965, -0.004763316363096237, -0.003600930795073509, -0.0024385452270507812, -0.0012761596590280533, -0.00011377409100532532, 0.0010486114770174026, 0.0022109970450401306, 0.0033733826130628586, 0.0045357681810855865, 0.0056981537491083145, 0.0068605393171310425, 0.00802292488515377, 0.009185310453176498, 0.010347696021199226, 0.011510081589221954, 0.012672467157244682, 0.01383485272526741, 0.014997238293290138, 0.016159623861312866, 0.017322009429335594, 0.018484394997358322, 0.01964678056538105, 0.020809166133403778, 0.021971551701426506, 0.023133937269449234, 0.024296322837471962, 0.02545870840549469, 0.026621093973517418, 0.027783479541540146, 0.028945865109562874, 0.030108250677585602, 0.03127063810825348, 0.03243302181363106, 0.033595405519008636, 0.034757792949676514]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 9.0, 8.0, 11.0, 18.0, 23.0, 22.0, 41.0, 44.0, 68.0, 85.0, 119.0, 158.0, 211.0, 290.0, 467.0, 717.0, 1588.0, 5080.0, 38605.0, 755027.0, 226631.0, 13481.0, 2774.0, 1116.0, 598.0, 387.0, 242.0, 192.0, 143.0, 93.0, 76.0, 44.0, 40.0, 33.0, 21.0, 21.0, 11.0, 12.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.042882442474365234, -0.04139232635498047, -0.0399022102355957, -0.03841209411621094, -0.03692197799682617, -0.035431861877441406, -0.03394174575805664, -0.032451629638671875, -0.03096151351928711, -0.029471397399902344, -0.027981281280517578, -0.026491165161132812, -0.025001049041748047, -0.02351093292236328, -0.022020816802978516, -0.02053070068359375, -0.019040584564208984, -0.01755046844482422, -0.016060352325439453, -0.014570236206054688, -0.013080120086669922, -0.011590003967285156, -0.01009988784790039, -0.008609771728515625, -0.007119655609130859, -0.005629539489746094, -0.004139423370361328, -0.0026493072509765625, -0.0011591911315917969, 0.00033092498779296875, 0.0018210411071777344, 0.0033111572265625, 0.004801273345947266, 0.006291389465332031, 0.007781505584716797, 0.009271621704101562, 0.010761737823486328, 0.012251853942871094, 0.01374197006225586, 0.015232086181640625, 0.01672220230102539, 0.018212318420410156, 0.019702434539794922, 0.021192550659179688, 0.022682666778564453, 0.02417278289794922, 0.025662899017333984, 0.02715301513671875, 0.028643131256103516, 0.03013324737548828, 0.03162336349487305, 0.03311347961425781, 0.03460359573364258, 0.036093711853027344, 0.03758382797241211, 0.039073944091796875, 0.04056406021118164, 0.042054176330566406, 0.04354429244995117, 0.04503440856933594, 0.0465245246887207, 0.04801464080810547, 0.049504756927490234, 0.050994873046875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 52.0, 213.0, 384.0, 249.0, 84.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06561708450317383, -0.06360721588134766, -0.061597347259521484, -0.05958747863769531, -0.05757761001586914, -0.05556774139404297, -0.0535578727722168, -0.051548004150390625, -0.04953813552856445, -0.04752826690673828, -0.04551839828491211, -0.04350852966308594, -0.041498661041259766, -0.039488792419433594, -0.03747892379760742, -0.03546905517578125, -0.03345918655395508, -0.031449317932128906, -0.029439449310302734, -0.027429580688476562, -0.02541971206665039, -0.02340984344482422, -0.021399974822998047, -0.019390106201171875, -0.017380237579345703, -0.015370368957519531, -0.01336050033569336, -0.011350631713867188, -0.009340763092041016, -0.007330894470214844, -0.005321025848388672, -0.0033111572265625, -0.0013012886047363281, 0.0007085800170898438, 0.0027184486389160156, 0.0047283172607421875, 0.006738185882568359, 0.008748054504394531, 0.010757923126220703, 0.012767791748046875, 0.014777660369873047, 0.01678752899169922, 0.01879739761352539, 0.020807266235351562, 0.022817134857177734, 0.024827003479003906, 0.026836872100830078, 0.02884674072265625, 0.030856609344482422, 0.032866477966308594, 0.034876346588134766, 0.03688621520996094, 0.03889608383178711, 0.04090595245361328, 0.04291582107543945, 0.044925689697265625, 0.0469355583190918, 0.04894542694091797, 0.05095529556274414, 0.05296516418457031, 0.054975032806396484, 0.056984901428222656, 0.05899477005004883, 0.061004638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 23.0, 20.0, 35.0, 74.0, 115.0, 171.0, 438.0, 1156.0, 4178.0, 23721.0, 387281.0, 589031.0, 34480.0, 5393.0, 1431.0, 495.0, 220.0, 107.0, 49.0, 35.0, 27.0, 23.0, 7.0, 4.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.03630495071411133, -0.035012245178222656, -0.033719539642333984, -0.03242683410644531, -0.03113412857055664, -0.02984142303466797, -0.028548717498779297, -0.027256011962890625, -0.025963306427001953, -0.02467060089111328, -0.02337789535522461, -0.022085189819335938, -0.020792484283447266, -0.019499778747558594, -0.018207073211669922, -0.01691436767578125, -0.015621662139892578, -0.014328956604003906, -0.013036251068115234, -0.011743545532226562, -0.01045083999633789, -0.009158134460449219, -0.007865428924560547, -0.006572723388671875, -0.005280017852783203, -0.003987312316894531, -0.0026946067810058594, -0.0014019012451171875, -0.00010919570922851562, 0.0011835098266601562, 0.002476215362548828, 0.0037689208984375, 0.005061626434326172, 0.006354331970214844, 0.007647037506103516, 0.008939743041992188, 0.01023244857788086, 0.011525154113769531, 0.012817859649658203, 0.014110565185546875, 0.015403270721435547, 0.01669597625732422, 0.01798868179321289, 0.019281387329101562, 0.020574092864990234, 0.021866798400878906, 0.023159503936767578, 0.02445220947265625, 0.025744915008544922, 0.027037620544433594, 0.028330326080322266, 0.029623031616210938, 0.03091573715209961, 0.03220844268798828, 0.03350114822387695, 0.034793853759765625, 0.0360865592956543, 0.03737926483154297, 0.03867197036743164, 0.03996467590332031, 0.041257381439208984, 0.042550086975097656, 0.04384279251098633, 0.045135498046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 9.0, 20.0, 30.0, 42.0, 41.0, 61.0, 56.0, 80.0, 78.0, 105.0, 87.0, 75.0, 54.0, 47.0, 50.0, 43.0, 31.0, 23.0, 11.0, 15.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04168701171875, -0.04027509689331055, -0.038863182067871094, -0.03745126724243164, -0.03603935241699219, -0.034627437591552734, -0.03321552276611328, -0.03180360794067383, -0.030391693115234375, -0.028979778289794922, -0.02756786346435547, -0.026155948638916016, -0.024744033813476562, -0.02333211898803711, -0.021920204162597656, -0.020508289337158203, -0.01909637451171875, -0.017684459686279297, -0.016272544860839844, -0.01486063003540039, -0.013448715209960938, -0.012036800384521484, -0.010624885559082031, -0.009212970733642578, -0.007801055908203125, -0.006389141082763672, -0.004977226257324219, -0.0035653114318847656, -0.0021533966064453125, -0.0007414817810058594, 0.0006704330444335938, 0.002082347869873047, 0.0034942626953125, 0.004906177520751953, 0.006318092346191406, 0.007730007171630859, 0.009141921997070312, 0.010553836822509766, 0.011965751647949219, 0.013377666473388672, 0.014789581298828125, 0.016201496124267578, 0.01761341094970703, 0.019025325775146484, 0.020437240600585938, 0.02184915542602539, 0.023261070251464844, 0.024672985076904297, 0.02608489990234375, 0.027496814727783203, 0.028908729553222656, 0.03032064437866211, 0.03173255920410156, 0.033144474029541016, 0.03455638885498047, 0.03596830368041992, 0.037380218505859375, 0.03879213333129883, 0.04020404815673828, 0.041615962982177734, 0.04302787780761719, 0.04443979263305664, 0.045851707458496094, 0.04726362228393555, 0.048675537109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 14.0, 27.0, 38.0, 78.0, 138.0, 285.0, 554.0, 1130.0, 2306.0, 4782.0, 11319.0, 29560.0, 118379.0, 640462.0, 178037.0, 37075.0, 13539.0, 5732.0, 2522.0, 1236.0, 641.0, 304.0, 166.0, 93.0, 45.0, 38.0, 16.0, 16.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01053619384765625, -0.010202765464782715, -0.00986933708190918, -0.009535908699035645, -0.00920248031616211, -0.008869051933288574, -0.008535623550415039, -0.008202195167541504, -0.007868766784667969, -0.007535338401794434, -0.0072019100189208984, -0.006868481636047363, -0.006535053253173828, -0.006201624870300293, -0.005868196487426758, -0.005534768104553223, -0.0052013397216796875, -0.004867911338806152, -0.004534482955932617, -0.004201054573059082, -0.003867626190185547, -0.0035341978073120117, -0.0032007694244384766, -0.0028673410415649414, -0.0025339126586914062, -0.002200484275817871, -0.001867055892944336, -0.0015336275100708008, -0.0012001991271972656, -0.0008667707443237305, -0.0005333423614501953, -0.00019991397857666016, 0.000133514404296875, 0.00046694278717041016, 0.0008003711700439453, 0.0011337995529174805, 0.0014672279357910156, 0.0018006563186645508, 0.002134084701538086, 0.002467513084411621, 0.0028009414672851562, 0.0031343698501586914, 0.0034677982330322266, 0.0038012266159057617, 0.004134654998779297, 0.004468083381652832, 0.004801511764526367, 0.005134940147399902, 0.0054683685302734375, 0.005801796913146973, 0.006135225296020508, 0.006468653678894043, 0.006802082061767578, 0.007135510444641113, 0.0074689388275146484, 0.007802367210388184, 0.008135795593261719, 0.008469223976135254, 0.008802652359008789, 0.009136080741882324, 0.00946950912475586, 0.009802937507629395, 0.01013636589050293, 0.010469794273376465, 0.01080322265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 8.0, 7.0, 7.0, 8.0, 9.0, 16.0, 23.0, 25.0, 28.0, 42.0, 57.0, 61.0, 92.0, 116.0, 101.0, 90.0, 82.0, 62.0, 41.0, 34.0, 22.0, 16.0, 17.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.00010138750076293945, -9.87071543931961e-05, -9.602680802345276e-05, -9.334646165370941e-05, -9.066611528396606e-05, -8.798576891422272e-05, -8.530542254447937e-05, -8.262507617473602e-05, -7.994472980499268e-05, -7.726438343524933e-05, -7.458403706550598e-05, -7.190369069576263e-05, -6.922334432601929e-05, -6.654299795627594e-05, -6.386265158653259e-05, -6.118230521678925e-05, -5.85019588470459e-05, -5.582161247730255e-05, -5.3141266107559204e-05, -5.046091973781586e-05, -4.778057336807251e-05, -4.510022699832916e-05, -4.2419880628585815e-05, -3.973953425884247e-05, -3.705918788909912e-05, -3.4378841519355774e-05, -3.169849514961243e-05, -2.901814877986908e-05, -2.6337802410125732e-05, -2.3657456040382385e-05, -2.0977109670639038e-05, -1.829676330089569e-05, -1.5616416931152344e-05, -1.2936070561408997e-05, -1.025572419166565e-05, -7.575377821922302e-06, -4.895031452178955e-06, -2.214685082435608e-06, 4.6566128730773926e-07, 3.1460076570510864e-06, 5.826354026794434e-06, 8.50670039653778e-06, 1.1187046766281128e-05, 1.3867393136024475e-05, 1.6547739505767822e-05, 1.922808587551117e-05, 2.1908432245254517e-05, 2.4588778614997864e-05, 2.726912498474121e-05, 2.9949471354484558e-05, 3.2629817724227905e-05, 3.531016409397125e-05, 3.79905104637146e-05, 4.067085683345795e-05, 4.3351203203201294e-05, 4.603154957294464e-05, 4.871189594268799e-05, 5.1392242312431335e-05, 5.407258868217468e-05, 5.675293505191803e-05, 5.943328142166138e-05, 6.211362779140472e-05, 6.479397416114807e-05, 6.747432053089142e-05, 7.015466690063477e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 10.0, 15.0, 29.0, 25.0, 35.0, 61.0, 102.0, 190.0, 316.0, 595.0, 1166.0, 2391.0, 5057.0, 11807.0, 32428.0, 130707.0, 632423.0, 168987.0, 37593.0, 13426.0, 5602.0, 2620.0, 1287.0, 713.0, 350.0, 236.0, 120.0, 76.0, 38.0, 31.0, 25.0, 17.0, 10.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01085662841796875, -0.010512709617614746, -0.010168790817260742, -0.009824872016906738, -0.009480953216552734, -0.00913703441619873, -0.008793115615844727, -0.008449196815490723, -0.008105278015136719, -0.007761359214782715, -0.007417440414428711, -0.007073521614074707, -0.006729602813720703, -0.006385684013366699, -0.006041765213012695, -0.005697846412658691, -0.0053539276123046875, -0.005010008811950684, -0.00466609001159668, -0.004322171211242676, -0.003978252410888672, -0.003634333610534668, -0.003290414810180664, -0.00294649600982666, -0.0026025772094726562, -0.0022586584091186523, -0.0019147396087646484, -0.0015708208084106445, -0.0012269020080566406, -0.0008829832077026367, -0.0005390644073486328, -0.0001951456069946289, 0.000148773193359375, 0.0004926919937133789, 0.0008366107940673828, 0.0011805295944213867, 0.0015244483947753906, 0.0018683671951293945, 0.0022122859954833984, 0.0025562047958374023, 0.0029001235961914062, 0.00324404239654541, 0.003587961196899414, 0.003931879997253418, 0.004275798797607422, 0.004619717597961426, 0.00496363639831543, 0.005307555198669434, 0.0056514739990234375, 0.005995392799377441, 0.006339311599731445, 0.006683230400085449, 0.007027149200439453, 0.007371068000793457, 0.007714986801147461, 0.008058905601501465, 0.008402824401855469, 0.008746743202209473, 0.009090662002563477, 0.00943458080291748, 0.009778499603271484, 0.010122418403625488, 0.010466337203979492, 0.010810256004333496, 0.0111541748046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 9.0, 1.0, 3.0, 11.0, 9.0, 6.0, 13.0, 23.0, 22.0, 40.0, 85.0, 110.0, 166.0, 171.0, 111.0, 82.0, 38.0, 16.0, 13.0, 10.0, 15.0, 11.0, 8.0, 3.0, 2.0, 7.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01230621337890625, -0.011908650398254395, -0.011511087417602539, -0.011113524436950684, -0.010715961456298828, -0.010318398475646973, -0.009920835494995117, -0.009523272514343262, -0.009125709533691406, -0.00872814655303955, -0.008330583572387695, -0.00793302059173584, -0.007535457611083984, -0.007137894630432129, -0.0067403316497802734, -0.006342768669128418, -0.0059452056884765625, -0.005547642707824707, -0.0051500797271728516, -0.004752516746520996, -0.004354953765869141, -0.003957390785217285, -0.0035598278045654297, -0.0031622648239135742, -0.0027647018432617188, -0.0023671388626098633, -0.001969575881958008, -0.0015720129013061523, -0.0011744499206542969, -0.0007768869400024414, -0.00037932395935058594, 1.823902130126953e-05, 0.000415802001953125, 0.0008133649826049805, 0.001210927963256836, 0.0016084909439086914, 0.002006053924560547, 0.0024036169052124023, 0.002801179885864258, 0.0031987428665161133, 0.0035963058471679688, 0.003993868827819824, 0.00439143180847168, 0.004788994789123535, 0.005186557769775391, 0.005584120750427246, 0.0059816837310791016, 0.006379246711730957, 0.0067768096923828125, 0.007174372673034668, 0.0075719356536865234, 0.007969498634338379, 0.008367061614990234, 0.00876462459564209, 0.009162187576293945, 0.0095597505569458, 0.009957313537597656, 0.010354876518249512, 0.010752439498901367, 0.011150002479553223, 0.011547565460205078, 0.011945128440856934, 0.012342691421508789, 0.012740254402160645, 0.0131378173828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 42.0, 245.0, 544.0, 155.0, 13.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.746342658996582, -0.7326202392578125, -0.7188977599143982, -0.7051753401756287, -0.6914528608322144, -0.6777304410934448, -0.6640080213546753, -0.650285542011261, -0.6365631222724915, -0.6228407025337219, -0.6091182231903076, -0.5953958034515381, -0.5816733241081238, -0.5679509043693542, -0.5542284250259399, -0.5405060052871704, -0.5267835259437561, -0.5130611062049866, -0.49933862686157227, -0.48561620712280273, -0.4718937575817108, -0.4581713080406189, -0.444448858499527, -0.43072640895843506, -0.4170039892196655, -0.4032815396785736, -0.3895590901374817, -0.37583667039871216, -0.36211422085762024, -0.3483917713165283, -0.3346693217754364, -0.3209468722343445, -0.30722442269325256, -0.29350197315216064, -0.2797795236110687, -0.2660570740699768, -0.2523346543312073, -0.23861220479011536, -0.22488975524902344, -0.21116730570793152, -0.1974448561668396, -0.18372240662574768, -0.16999997198581696, -0.15627752244472504, -0.14255507290363312, -0.1288326382637024, -0.11511018872261047, -0.10138773918151855, -0.08766530454158783, -0.07394286245107651, -0.06022041290998459, -0.04649797081947327, -0.032775525003671646, -0.019053079187870026, -0.005330637097358704, 0.008391812443733215, 0.022114254534244537, 0.03583670035004616, 0.04955914616584778, 0.0632815882563591, 0.07700403034687042, 0.09072647988796234, 0.10444892197847366, 0.11817137151956558, 0.1318938136100769]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 1.0, 6.0, 5.0, 7.0, 13.0, 13.0, 16.0, 14.0, 24.0, 28.0, 27.0, 39.0, 32.0, 36.0, 32.0, 42.0, 44.0, 35.0, 44.0, 47.0, 38.0, 40.0, 30.0, 39.0, 49.0, 38.0, 40.0, 34.0, 34.0, 30.0, 15.0, 21.0, 12.0, 14.0, 10.0, 13.0, 14.0, 4.0, 5.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07883483171463013, -0.07657977193593979, -0.07432471960783005, -0.07206965982913971, -0.06981460750102997, -0.06755954772233963, -0.06530448794364929, -0.06304943561553955, -0.06079437583684921, -0.05853931978344917, -0.05628426373004913, -0.054029203951358795, -0.051774147897958755, -0.049519091844558716, -0.04726403206586838, -0.04500897601246834, -0.0427539199590683, -0.04049886390566826, -0.03824380785226822, -0.03598874807357788, -0.03373369202017784, -0.0314786359667778, -0.029223578050732613, -0.026968520134687424, -0.024713464081287384, -0.022458408027887344, -0.020203350111842155, -0.017948292195796967, -0.015693236142396927, -0.013438179157674313, -0.011183122172951698, -0.00892806425690651, -0.00667300820350647, -0.0044179512187838554, -0.002162894234061241, 9.216275066137314e-05, 0.0023472197353839874, 0.004602276720106602, 0.006857333704829216, 0.009112391620874405, 0.011367447674274445, 0.013622504658997059, 0.015877561643719673, 0.018132619559764862, 0.0203876756131649, 0.02264273166656494, 0.02489778958261013, 0.02715284749865532, 0.02940790355205536, 0.0316629596054554, 0.03391801565885544, 0.036173075437545776, 0.038428131490945816, 0.040683187544345856, 0.042938247323036194, 0.045193303376436234, 0.04744835942983627, 0.04970341548323631, 0.05195847153663635, 0.05421353131532669, 0.05646858736872673, 0.05872364342212677, 0.06097870320081711, 0.06323376297950745, 0.06548881530761719]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 17.0, 129.0, 2586.0, 4123480.0, 66885.0, 1019.0, 115.0, 35.0, 12.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2225341796875, -0.21615219116210938, -0.20977020263671875, -0.20338821411132812, -0.1970062255859375, -0.19062423706054688, -0.18424224853515625, -0.17786026000976562, -0.171478271484375, -0.16509628295898438, -0.15871429443359375, -0.15233230590820312, -0.1459503173828125, -0.13956832885742188, -0.13318634033203125, -0.12680435180664062, -0.12042236328125, -0.11404037475585938, -0.10765838623046875, -0.10127639770507812, -0.0948944091796875, -0.08851242065429688, -0.08213043212890625, -0.07574844360351562, -0.069366455078125, -0.06298446655273438, -0.05660247802734375, -0.050220489501953125, -0.0438385009765625, -0.037456512451171875, -0.03107452392578125, -0.024692535400390625, -0.018310546875, -0.011928558349609375, -0.00554656982421875, 0.000835418701171875, 0.0072174072265625, 0.013599395751953125, 0.01998138427734375, 0.026363372802734375, 0.032745361328125, 0.039127349853515625, 0.04550933837890625, 0.051891326904296875, 0.0582733154296875, 0.06465530395507812, 0.07103729248046875, 0.07741928100585938, 0.08380126953125, 0.09018325805664062, 0.09656524658203125, 0.10294723510742188, 0.1093292236328125, 0.11571121215820312, 0.12209320068359375, 0.12847518920898438, 0.134857177734375, 0.14123916625976562, 0.14762115478515625, 0.15400314331054688, 0.1603851318359375, 0.16676712036132812, 0.17314910888671875, 0.17953109741210938, 0.1859130859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 29.0, 141.0, 322.0, 331.0, 134.0, 38.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.06380558013916016, -0.06181526184082031, -0.05982494354248047, -0.057834625244140625, -0.05584430694580078, -0.05385398864746094, -0.051863670349121094, -0.04987335205078125, -0.047883033752441406, -0.04589271545410156, -0.04390239715576172, -0.041912078857421875, -0.03992176055908203, -0.03793144226074219, -0.035941123962402344, -0.0339508056640625, -0.031960487365722656, -0.029970169067382812, -0.02797985076904297, -0.025989532470703125, -0.02399921417236328, -0.022008895874023438, -0.020018577575683594, -0.01802825927734375, -0.016037940979003906, -0.014047622680664062, -0.012057304382324219, -0.010066986083984375, -0.008076667785644531, -0.0060863494873046875, -0.004096031188964844, -0.002105712890625, -0.00011539459228515625, 0.0018749237060546875, 0.0038652420043945312, 0.005855560302734375, 0.007845878601074219, 0.009836196899414062, 0.011826515197753906, 0.01381683349609375, 0.015807151794433594, 0.017797470092773438, 0.01978778839111328, 0.021778106689453125, 0.02376842498779297, 0.025758743286132812, 0.027749061584472656, 0.0297393798828125, 0.031729698181152344, 0.03372001647949219, 0.03571033477783203, 0.037700653076171875, 0.03969097137451172, 0.04168128967285156, 0.043671607971191406, 0.04566192626953125, 0.047652244567871094, 0.04964256286621094, 0.05163288116455078, 0.053623199462890625, 0.05561351776123047, 0.05760383605957031, 0.059594154357910156, 0.06158447265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 12.0, 26.0, 55.0, 118.0, 232.0, 491.0, 1233.0, 3629.0, 15419.0, 118325.0, 3696042.0, 321726.0, 28100.0, 5864.0, 1777.0, 675.0, 312.0, 123.0, 66.0, 28.0, 15.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218963623046875, -0.021008729934692383, -0.020121097564697266, -0.01923346519470215, -0.01834583282470703, -0.017458200454711914, -0.016570568084716797, -0.01568293571472168, -0.014795303344726562, -0.013907670974731445, -0.013020038604736328, -0.012132406234741211, -0.011244773864746094, -0.010357141494750977, -0.00946950912475586, -0.008581876754760742, -0.007694244384765625, -0.006806612014770508, -0.005918979644775391, -0.0050313472747802734, -0.004143714904785156, -0.003256082534790039, -0.002368450164794922, -0.0014808177947998047, -0.0005931854248046875, 0.0002944469451904297, 0.0011820793151855469, 0.002069711685180664, 0.0029573440551757812, 0.0038449764251708984, 0.004732608795166016, 0.005620241165161133, 0.00650787353515625, 0.007395505905151367, 0.008283138275146484, 0.009170770645141602, 0.010058403015136719, 0.010946035385131836, 0.011833667755126953, 0.01272130012512207, 0.013608932495117188, 0.014496564865112305, 0.015384197235107422, 0.01627182960510254, 0.017159461975097656, 0.018047094345092773, 0.01893472671508789, 0.019822359085083008, 0.020709991455078125, 0.021597623825073242, 0.02248525619506836, 0.023372888565063477, 0.024260520935058594, 0.02514815330505371, 0.026035785675048828, 0.026923418045043945, 0.027811050415039062, 0.02869868278503418, 0.029586315155029297, 0.030473947525024414, 0.03136157989501953, 0.03224921226501465, 0.033136844635009766, 0.03402447700500488, 0.034912109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 15.0, 28.0, 31.0, 60.0, 126.0, 231.0, 663.0, 1587.0, 763.0, 247.0, 116.0, 74.0, 42.0, 23.0, 22.0, 11.0, 10.0, 0.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.0220181941986084, -0.021361827850341797, -0.020705461502075195, -0.020049095153808594, -0.019392728805541992, -0.01873636245727539, -0.01807999610900879, -0.017423629760742188, -0.016767263412475586, -0.016110897064208984, -0.015454530715942383, -0.014798164367675781, -0.01414179801940918, -0.013485431671142578, -0.012829065322875977, -0.012172698974609375, -0.011516332626342773, -0.010859966278076172, -0.01020359992980957, -0.009547233581542969, -0.008890867233276367, -0.008234500885009766, -0.007578134536743164, -0.0069217681884765625, -0.006265401840209961, -0.005609035491943359, -0.004952669143676758, -0.004296302795410156, -0.0036399364471435547, -0.002983570098876953, -0.0023272037506103516, -0.00167083740234375, -0.0010144710540771484, -0.0003581047058105469, 0.0002982616424560547, 0.0009546279907226562, 0.0016109943389892578, 0.0022673606872558594, 0.002923727035522461, 0.0035800933837890625, 0.004236459732055664, 0.004892826080322266, 0.005549192428588867, 0.006205558776855469, 0.00686192512512207, 0.007518291473388672, 0.008174657821655273, 0.008831024169921875, 0.009487390518188477, 0.010143756866455078, 0.01080012321472168, 0.011456489562988281, 0.012112855911254883, 0.012769222259521484, 0.013425588607788086, 0.014081954956054688, 0.014738321304321289, 0.01539468765258789, 0.016051054000854492, 0.016707420349121094, 0.017363786697387695, 0.018020153045654297, 0.0186765193939209, 0.0193328857421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 32.0, 112.0, 236.0, 297.0, 196.0, 79.0, 23.0, 17.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.25808337330818176, -0.2533353567123413, -0.24858734011650085, -0.2438393384218216, -0.23909132182598114, -0.23434330523014069, -0.22959528863430023, -0.22484728693962097, -0.22009927034378052, -0.21535125374794006, -0.2106032371520996, -0.20585523545742035, -0.2011072188615799, -0.19635920226573944, -0.191611185669899, -0.18686318397521973, -0.18211516737937927, -0.17736715078353882, -0.17261913418769836, -0.1678711324930191, -0.16312311589717865, -0.1583750993013382, -0.15362708270549774, -0.14887908101081848, -0.14413104951381683, -0.13938303291797638, -0.13463501632213593, -0.12988701462745667, -0.1251389980316162, -0.12039098143577576, -0.1156429648399353, -0.11089495569467545, -0.10614694654941559, -0.10139892995357513, -0.09665092080831528, -0.09190290421247482, -0.08715489506721497, -0.08240687847137451, -0.07765886187553406, -0.0729108527302742, -0.06816283613443375, -0.06341481953859329, -0.058666810393333435, -0.05391879379749298, -0.049170784652233124, -0.04442276805639267, -0.039674755185842514, -0.03492674231529236, -0.030178729444742203, -0.025430716574192047, -0.02068270370364189, -0.015934688970446587, -0.011186676099896431, -0.006438663229346275, -0.0016906484961509705, 0.003057364374399185, 0.007805377244949341, 0.012553390115499496, 0.017301402986049652, 0.022049417719244957, 0.026797430589795113, 0.03154544532299042, 0.03629345819354057, 0.04104147106409073, 0.045789483934640884]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 2.0, 9.0, 16.0, 5.0, 12.0, 13.0, 23.0, 25.0, 29.0, 22.0, 41.0, 43.0, 37.0, 40.0, 40.0, 49.0, 35.0, 41.0, 51.0, 41.0, 43.0, 52.0, 34.0, 36.0, 37.0, 29.0, 23.0, 35.0, 21.0, 20.0, 15.0, 18.0, 8.0, 8.0, 10.0, 11.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.044088900089263916, -0.042980991303920746, -0.04187307879328728, -0.04076516628265381, -0.03965725749731064, -0.03854934871196747, -0.037441436201334, -0.03633352369070053, -0.03522561490535736, -0.03411770612001419, -0.03300979360938072, -0.03190188109874725, -0.030793972313404083, -0.029686061665415764, -0.028578151017427444, -0.027470240369439125, -0.026362329721450806, -0.025254419073462486, -0.024146508425474167, -0.023038597777485847, -0.021930687129497528, -0.02082277648150921, -0.01971486583352089, -0.01860695518553257, -0.01749904453754425, -0.01639113388955593, -0.015283223241567612, -0.014175312593579292, -0.013067401945590973, -0.011959491297602654, -0.010851580649614334, -0.009743670001626015, -0.008635759353637695, -0.007527848705649376, -0.0064199380576610565, -0.005312027409672737, -0.004204116761684418, -0.0030962061136960983, -0.001988295465707779, -0.0008803848177194595, 0.00022752583026885986, 0.0013354364782571793, 0.0024433471262454987, 0.003551257774233818, 0.0046591684222221375, 0.005767079070210457, 0.006874989718198776, 0.007982900366187096, 0.009090811014175415, 0.010198721662163734, 0.011306632310152054, 0.012414542958140373, 0.013522453606128693, 0.014630364254117012, 0.01573827490210533, 0.01684618555009365, 0.01795409619808197, 0.01906200684607029, 0.02016991749405861, 0.02127782814204693, 0.022385738790035248, 0.023493649438023567, 0.024601560086011887, 0.025709470734000206, 0.026817381381988525]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 17.0, 11.0, 18.0, 19.0, 25.0, 50.0, 64.0, 95.0, 139.0, 173.0, 269.0, 418.0, 706.0, 1516.0, 7021.0, 162296.0, 840550.0, 29468.0, 3141.0, 915.0, 516.0, 309.0, 254.0, 167.0, 115.0, 80.0, 64.0, 47.0, 25.0, 16.0, 15.0, 11.0, 5.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06062173843383789, -0.05874347686767578, -0.05686521530151367, -0.05498695373535156, -0.05310869216918945, -0.051230430603027344, -0.049352169036865234, -0.047473907470703125, -0.045595645904541016, -0.043717384338378906, -0.0418391227722168, -0.03996086120605469, -0.03808259963989258, -0.03620433807373047, -0.03432607650756836, -0.03244781494140625, -0.03056955337524414, -0.02869129180908203, -0.026813030242919922, -0.024934768676757812, -0.023056507110595703, -0.021178245544433594, -0.019299983978271484, -0.017421722412109375, -0.015543460845947266, -0.013665199279785156, -0.011786937713623047, -0.009908676147460938, -0.008030414581298828, -0.006152153015136719, -0.004273891448974609, -0.0023956298828125, -0.0005173683166503906, 0.0013608932495117188, 0.003239154815673828, 0.0051174163818359375, 0.006995677947998047, 0.008873939514160156, 0.010752201080322266, 0.012630462646484375, 0.014508724212646484, 0.016386985778808594, 0.018265247344970703, 0.020143508911132812, 0.022021770477294922, 0.02390003204345703, 0.02577829360961914, 0.02765655517578125, 0.02953481674194336, 0.03141307830810547, 0.03329133987426758, 0.03516960144042969, 0.0370478630065918, 0.038926124572753906, 0.040804386138916016, 0.042682647705078125, 0.044560909271240234, 0.046439170837402344, 0.04831743240356445, 0.05019569396972656, 0.05207395553588867, 0.05395221710205078, 0.05583047866821289, 0.057708740234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 28.0, 144.0, 334.0, 337.0, 127.0, 24.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067626953125, -0.06557750701904297, -0.06352806091308594, -0.061478614807128906, -0.059429168701171875, -0.057379722595214844, -0.05533027648925781, -0.05328083038330078, -0.05123138427734375, -0.04918193817138672, -0.04713249206542969, -0.045083045959472656, -0.043033599853515625, -0.040984153747558594, -0.03893470764160156, -0.03688526153564453, -0.0348358154296875, -0.03278636932373047, -0.030736923217773438, -0.028687477111816406, -0.026638031005859375, -0.024588584899902344, -0.022539138793945312, -0.02048969268798828, -0.01844024658203125, -0.01639080047607422, -0.014341354370117188, -0.012291908264160156, -0.010242462158203125, -0.008193016052246094, -0.0061435699462890625, -0.004094123840332031, -0.002044677734375, 4.76837158203125e-06, 0.0020542144775390625, 0.004103660583496094, 0.006153106689453125, 0.008202552795410156, 0.010251998901367188, 0.012301445007324219, 0.01435089111328125, 0.01640033721923828, 0.018449783325195312, 0.020499229431152344, 0.022548675537109375, 0.024598121643066406, 0.026647567749023438, 0.02869701385498047, 0.0307464599609375, 0.03279590606689453, 0.03484535217285156, 0.036894798278808594, 0.038944244384765625, 0.040993690490722656, 0.04304313659667969, 0.04509258270263672, 0.04714202880859375, 0.04919147491455078, 0.05124092102050781, 0.053290367126464844, 0.055339813232421875, 0.057389259338378906, 0.05943870544433594, 0.06148815155029297, 0.06353759765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 7.0, 15.0, 18.0, 23.0, 24.0, 29.0, 50.0, 46.0, 90.0, 154.0, 295.0, 735.0, 2027.0, 7146.0, 37344.0, 283719.0, 585225.0, 109198.0, 16288.0, 3813.0, 1209.0, 468.0, 213.0, 121.0, 68.0, 55.0, 34.0, 27.0, 26.0, 15.0, 18.0, 6.0, 4.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030242919921875, -0.029333829879760742, -0.028424739837646484, -0.027515649795532227, -0.02660655975341797, -0.02569746971130371, -0.024788379669189453, -0.023879289627075195, -0.022970199584960938, -0.02206110954284668, -0.021152019500732422, -0.020242929458618164, -0.019333839416503906, -0.01842474937438965, -0.01751565933227539, -0.016606569290161133, -0.015697479248046875, -0.014788389205932617, -0.01387929916381836, -0.012970209121704102, -0.012061119079589844, -0.011152029037475586, -0.010242938995361328, -0.00933384895324707, -0.008424758911132812, -0.007515668869018555, -0.006606578826904297, -0.005697488784790039, -0.004788398742675781, -0.0038793087005615234, -0.0029702186584472656, -0.002061128616333008, -0.00115203857421875, -0.0002429485321044922, 0.0006661415100097656, 0.0015752315521240234, 0.0024843215942382812, 0.003393411636352539, 0.004302501678466797, 0.005211591720581055, 0.0061206817626953125, 0.00702977180480957, 0.007938861846923828, 0.008847951889038086, 0.009757041931152344, 0.010666131973266602, 0.01157522201538086, 0.012484312057495117, 0.013393402099609375, 0.014302492141723633, 0.01521158218383789, 0.01612067222595215, 0.017029762268066406, 0.017938852310180664, 0.018847942352294922, 0.01975703239440918, 0.020666122436523438, 0.021575212478637695, 0.022484302520751953, 0.02339339256286621, 0.02430248260498047, 0.025211572647094727, 0.026120662689208984, 0.027029752731323242, 0.0279388427734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 5.0, 6.0, 11.0, 12.0, 9.0, 18.0, 20.0, 24.0, 29.0, 33.0, 39.0, 42.0, 47.0, 41.0, 47.0, 41.0, 29.0, 46.0, 54.0, 44.0, 43.0, 36.0, 44.0, 35.0, 38.0, 31.0, 19.0, 27.0, 27.0, 21.0, 17.0, 8.0, 12.0, 8.0, 9.0, 7.0, 2.0, 5.0, 4.0, 7.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0276947021484375, -0.0268709659576416, -0.026047229766845703, -0.025223493576049805, -0.024399757385253906, -0.023576021194458008, -0.02275228500366211, -0.02192854881286621, -0.021104812622070312, -0.020281076431274414, -0.019457340240478516, -0.018633604049682617, -0.01780986785888672, -0.01698613166809082, -0.016162395477294922, -0.015338659286499023, -0.014514923095703125, -0.013691186904907227, -0.012867450714111328, -0.01204371452331543, -0.011219978332519531, -0.010396242141723633, -0.009572505950927734, -0.008748769760131836, -0.007925033569335938, -0.007101297378540039, -0.006277561187744141, -0.005453824996948242, -0.004630088806152344, -0.0038063526153564453, -0.002982616424560547, -0.0021588802337646484, -0.00133514404296875, -0.0005114078521728516, 0.0003123283386230469, 0.0011360645294189453, 0.0019598007202148438, 0.002783536911010742, 0.0036072731018066406, 0.004431009292602539, 0.0052547454833984375, 0.006078481674194336, 0.006902217864990234, 0.007725954055786133, 0.008549690246582031, 0.00937342643737793, 0.010197162628173828, 0.011020898818969727, 0.011844635009765625, 0.012668371200561523, 0.013492107391357422, 0.01431584358215332, 0.015139579772949219, 0.015963315963745117, 0.016787052154541016, 0.017610788345336914, 0.018434524536132812, 0.01925826072692871, 0.02008199691772461, 0.020905733108520508, 0.021729469299316406, 0.022553205490112305, 0.023376941680908203, 0.0242006778717041, 0.0250244140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 24.0, 22.0, 33.0, 44.0, 79.0, 95.0, 162.0, 234.0, 380.0, 594.0, 1026.0, 1860.0, 3543.0, 7613.0, 20646.0, 77380.0, 409685.0, 410876.0, 78135.0, 20656.0, 7541.0, 3481.0, 1720.0, 997.0, 583.0, 416.0, 226.0, 167.0, 111.0, 52.0, 60.0, 39.0, 25.0, 14.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00881195068359375, -0.008518218994140625, -0.0082244873046875, -0.007930755615234375, -0.00763702392578125, -0.007343292236328125, -0.007049560546875, -0.006755828857421875, -0.00646209716796875, -0.006168365478515625, -0.0058746337890625, -0.005580902099609375, -0.00528717041015625, -0.004993438720703125, -0.00469970703125, -0.004405975341796875, -0.00411224365234375, -0.003818511962890625, -0.0035247802734375, -0.003231048583984375, -0.00293731689453125, -0.002643585205078125, -0.002349853515625, -0.002056121826171875, -0.00176239013671875, -0.001468658447265625, -0.0011749267578125, -0.000881195068359375, -0.00058746337890625, -0.000293731689453125, 0.0, 0.000293731689453125, 0.00058746337890625, 0.000881195068359375, 0.0011749267578125, 0.001468658447265625, 0.00176239013671875, 0.002056121826171875, 0.002349853515625, 0.002643585205078125, 0.00293731689453125, 0.003231048583984375, 0.0035247802734375, 0.003818511962890625, 0.00411224365234375, 0.004405975341796875, 0.00469970703125, 0.004993438720703125, 0.00528717041015625, 0.005580902099609375, 0.0058746337890625, 0.006168365478515625, 0.00646209716796875, 0.006755828857421875, 0.007049560546875, 0.007343292236328125, 0.00763702392578125, 0.007930755615234375, 0.0082244873046875, 0.008518218994140625, 0.00881195068359375, 0.009105682373046875, 0.0093994140625, 0.009693145751953125, 0.00998687744140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 15.0, 18.0, 34.0, 31.0, 51.0, 49.0, 66.0, 82.0, 118.0, 108.0, 87.0, 71.0, 53.0, 52.0, 26.0, 25.0, 26.0, 21.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00011140108108520508, -0.00010846741497516632, -0.00010553374886512756, -0.0001026000827550888, -9.966641664505005e-05, -9.673275053501129e-05, -9.379908442497253e-05, -9.086541831493378e-05, -8.793175220489502e-05, -8.499808609485626e-05, -8.20644199848175e-05, -7.913075387477875e-05, -7.619708776473999e-05, -7.326342165470123e-05, -7.032975554466248e-05, -6.739608943462372e-05, -6.446242332458496e-05, -6.15287572145462e-05, -5.8595091104507446e-05, -5.566142499446869e-05, -5.272775888442993e-05, -4.9794092774391174e-05, -4.686042666435242e-05, -4.392676055431366e-05, -4.09930944442749e-05, -3.8059428334236145e-05, -3.512576222419739e-05, -3.219209611415863e-05, -2.9258430004119873e-05, -2.6324763894081116e-05, -2.339109778404236e-05, -2.04574316740036e-05, -1.7523765563964844e-05, -1.4590099453926086e-05, -1.1656433343887329e-05, -8.722767233848572e-06, -5.7891011238098145e-06, -2.855435013771057e-06, 7.82310962677002e-08, 3.0118972063064575e-06, 5.945563316345215e-06, 8.879229426383972e-06, 1.181289553642273e-05, 1.4746561646461487e-05, 1.7680227756500244e-05, 2.0613893866539e-05, 2.354755997657776e-05, 2.6481226086616516e-05, 2.9414892196655273e-05, 3.234855830669403e-05, 3.528222441673279e-05, 3.8215890526771545e-05, 4.11495566368103e-05, 4.408322274684906e-05, 4.701688885688782e-05, 4.9950554966926575e-05, 5.288422107696533e-05, 5.581788718700409e-05, 5.875155329704285e-05, 6.16852194070816e-05, 6.461888551712036e-05, 6.755255162715912e-05, 7.048621773719788e-05, 7.341988384723663e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 10.0, 14.0, 12.0, 19.0, 24.0, 63.0, 89.0, 129.0, 211.0, 364.0, 617.0, 1202.0, 2266.0, 4677.0, 10318.0, 23153.0, 64599.0, 230347.0, 457837.0, 167432.0, 49735.0, 18718.0, 8399.0, 3945.0, 1960.0, 1012.0, 545.0, 309.0, 192.0, 126.0, 78.0, 47.0, 36.0, 18.0, 17.0, 12.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0079803466796875, -0.00773388147354126, -0.0074874162673950195, -0.007240951061248779, -0.006994485855102539, -0.006748020648956299, -0.006501555442810059, -0.006255090236663818, -0.006008625030517578, -0.005762159824371338, -0.005515694618225098, -0.005269229412078857, -0.005022764205932617, -0.004776298999786377, -0.004529833793640137, -0.0042833685874938965, -0.004036903381347656, -0.003790438175201416, -0.0035439729690551758, -0.0032975077629089355, -0.0030510425567626953, -0.002804577350616455, -0.002558112144470215, -0.0023116469383239746, -0.0020651817321777344, -0.0018187165260314941, -0.001572251319885254, -0.0013257861137390137, -0.0010793209075927734, -0.0008328557014465332, -0.000586390495300293, -0.00033992528915405273, -9.34600830078125e-05, 0.00015300512313842773, 0.00039947032928466797, 0.0006459355354309082, 0.0008924007415771484, 0.0011388659477233887, 0.001385331153869629, 0.0016317963600158691, 0.0018782615661621094, 0.0021247267723083496, 0.00237119197845459, 0.00261765718460083, 0.0028641223907470703, 0.0031105875968933105, 0.0033570528030395508, 0.003603518009185791, 0.0038499832153320312, 0.0040964484214782715, 0.004342913627624512, 0.004589378833770752, 0.004835844039916992, 0.005082309246063232, 0.005328774452209473, 0.005575239658355713, 0.005821704864501953, 0.006068170070648193, 0.006314635276794434, 0.006561100482940674, 0.006807565689086914, 0.007054030895233154, 0.0073004961013793945, 0.007546961307525635, 0.007793426513671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 20.0, 17.0, 42.0, 50.0, 78.0, 91.0, 103.0, 132.0, 107.0, 99.0, 75.0, 47.0, 42.0, 24.0, 18.0, 11.0, 5.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010248303413391113, -0.009922266006469727, -0.00959622859954834, -0.009270191192626953, -0.008944153785705566, -0.00861811637878418, -0.008292078971862793, -0.007966041564941406, -0.0076400041580200195, -0.007313966751098633, -0.006987929344177246, -0.006661891937255859, -0.006335854530334473, -0.006009817123413086, -0.005683779716491699, -0.0053577423095703125, -0.005031704902648926, -0.004705667495727539, -0.004379630088806152, -0.004053592681884766, -0.003727555274963379, -0.003401517868041992, -0.0030754804611206055, -0.0027494430541992188, -0.002423405647277832, -0.0020973682403564453, -0.0017713308334350586, -0.0014452934265136719, -0.0011192560195922852, -0.0007932186126708984, -0.0004671812057495117, -0.000141143798828125, 0.00018489360809326172, 0.0005109310150146484, 0.0008369684219360352, 0.0011630058288574219, 0.0014890432357788086, 0.0018150806427001953, 0.002141118049621582, 0.0024671554565429688, 0.0027931928634643555, 0.003119230270385742, 0.003445267677307129, 0.0037713050842285156, 0.004097342491149902, 0.004423379898071289, 0.004749417304992676, 0.0050754547119140625, 0.005401492118835449, 0.005727529525756836, 0.006053566932678223, 0.006379604339599609, 0.006705641746520996, 0.007031679153442383, 0.0073577165603637695, 0.007683753967285156, 0.008009791374206543, 0.00833582878112793, 0.008661866188049316, 0.008987903594970703, 0.00931394100189209, 0.009639978408813477, 0.009966015815734863, 0.01029205322265625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 2.0, 5.0, 20.0, 41.0, 91.0, 160.0, 235.0, 212.0, 119.0, 64.0, 24.0, 16.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.24155941605567932, -0.23699802160263062, -0.2324366271495819, -0.2278752326965332, -0.2233138382434845, -0.2187524437904358, -0.21419104933738708, -0.20962965488433838, -0.20506826043128967, -0.20050686597824097, -0.19594547152519226, -0.19138407707214355, -0.18682268261909485, -0.18226128816604614, -0.17769989371299744, -0.17313849925994873, -0.16857710480690002, -0.16401571035385132, -0.1594543159008026, -0.1548929214477539, -0.1503315269947052, -0.1457701325416565, -0.1412087380886078, -0.13664734363555908, -0.13208594918251038, -0.12752455472946167, -0.12296316027641296, -0.11840176582336426, -0.11384037137031555, -0.10927897691726685, -0.10471758246421814, -0.10015618801116943, -0.09559480845928192, -0.09103341400623322, -0.08647201955318451, -0.0819106251001358, -0.0773492306470871, -0.07278783619403839, -0.06822644174098969, -0.06366504728794098, -0.05910365283489227, -0.05454225838184357, -0.04998086392879486, -0.045419469475746155, -0.04085807502269745, -0.03629668056964874, -0.03173528611660004, -0.02717389166355133, -0.022612497210502625, -0.01805110275745392, -0.013489708304405212, -0.008928313851356506, -0.0043669193983078, 0.00019447505474090576, 0.004755869507789612, 0.009317263960838318, 0.013878658413887024, 0.01844005286693573, 0.023001447319984436, 0.027562841773033142, 0.03212423622608185, 0.036685630679130554, 0.04124702513217926, 0.045808419585227966, 0.05036981403827667]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 4.0, 5.0, 8.0, 7.0, 13.0, 13.0, 11.0, 27.0, 25.0, 22.0, 38.0, 29.0, 40.0, 40.0, 42.0, 47.0, 49.0, 54.0, 43.0, 46.0, 48.0, 50.0, 45.0, 42.0, 31.0, 48.0, 22.0, 22.0, 27.0, 21.0, 12.0, 11.0, 12.0, 15.0, 7.0, 9.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07508087158203125, -0.07260803878307343, -0.0701352134346962, -0.06766238063573837, -0.06518955528736115, -0.06271672248840332, -0.060243889689445496, -0.05777106061577797, -0.05529823154211044, -0.05282540246844292, -0.05035257339477539, -0.047879740595817566, -0.04540691152215004, -0.04293408244848251, -0.04046124964952469, -0.03798842057585716, -0.035515591502189636, -0.03304276242852211, -0.030569931492209435, -0.02809710055589676, -0.025624271482229233, -0.023151442408561707, -0.02067861147224903, -0.018205780535936356, -0.01573295146226883, -0.013260121457278728, -0.010787291452288628, -0.008314461447298527, -0.005841631442308426, -0.003368801437318325, -0.0008959714323282242, 0.0015768595039844513, 0.0040496885776519775, 0.006522518582642078, 0.00899534858763218, 0.01146817859262228, 0.013941008597612381, 0.016413837671279907, 0.018886668607592583, 0.021359499543905258, 0.023832328617572784, 0.02630515769124031, 0.028777988627552986, 0.03125081956386566, 0.03372364863753319, 0.036196477711200714, 0.03866931051015854, 0.041142139583826065, 0.04361496865749359, 0.04608779773116112, 0.048560626804828644, 0.05103345960378647, 0.053506288677453995, 0.05597911775112152, 0.058451950550079346, 0.06092477962374687, 0.0633976086974144, 0.06587044149637222, 0.06834326684474945, 0.07081609964370728, 0.0732889324426651, 0.07576175779104233, 0.07823459059000015, 0.08070741593837738, 0.0831802487373352]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 15.0, 42.0, 249.0, 3045.0, 4009048.0, 179992.0, 1583.0, 204.0, 53.0, 22.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.233154296875, -0.22628021240234375, -0.2194061279296875, -0.21253204345703125, -0.205657958984375, -0.19878387451171875, -0.1919097900390625, -0.18503570556640625, -0.17816162109375, -0.17128753662109375, -0.1644134521484375, -0.15753936767578125, -0.150665283203125, -0.14379119873046875, -0.1369171142578125, -0.13004302978515625, -0.1231689453125, -0.11629486083984375, -0.1094207763671875, -0.10254669189453125, -0.095672607421875, -0.08879852294921875, -0.0819244384765625, -0.07505035400390625, -0.06817626953125, -0.06130218505859375, -0.0544281005859375, -0.04755401611328125, -0.040679931640625, -0.03380584716796875, -0.0269317626953125, -0.02005767822265625, -0.01318359375, -0.00630950927734375, 0.0005645751953125, 0.00743865966796875, 0.014312744140625, 0.02118682861328125, 0.0280609130859375, 0.03493499755859375, 0.04180908203125, 0.04868316650390625, 0.0555572509765625, 0.06243133544921875, 0.069305419921875, 0.07617950439453125, 0.0830535888671875, 0.08992767333984375, 0.0968017578125, 0.10367584228515625, 0.1105499267578125, 0.11742401123046875, 0.124298095703125, 0.13117218017578125, 0.1380462646484375, 0.14492034912109375, 0.15179443359375, 0.15866851806640625, 0.1655426025390625, 0.17241668701171875, 0.179290771484375, 0.18616485595703125, 0.1930389404296875, 0.19991302490234375, 0.206787109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 22.0, 74.0, 235.0, 346.0, 236.0, 79.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.064453125, -0.0624699592590332, -0.060486793518066406, -0.05850362777709961, -0.05652046203613281, -0.054537296295166016, -0.05255413055419922, -0.05057096481323242, -0.048587799072265625, -0.04660463333129883, -0.04462146759033203, -0.042638301849365234, -0.04065513610839844, -0.03867197036743164, -0.036688804626464844, -0.03470563888549805, -0.03272247314453125, -0.030739307403564453, -0.028756141662597656, -0.02677297592163086, -0.024789810180664062, -0.022806644439697266, -0.02082347869873047, -0.018840312957763672, -0.016857147216796875, -0.014873981475830078, -0.012890815734863281, -0.010907649993896484, -0.008924484252929688, -0.006941318511962891, -0.004958152770996094, -0.002974987030029297, -0.0009918212890625, 0.0009913444519042969, 0.0029745101928710938, 0.004957675933837891, 0.0069408416748046875, 0.008924007415771484, 0.010907173156738281, 0.012890338897705078, 0.014873504638671875, 0.016856670379638672, 0.01883983612060547, 0.020823001861572266, 0.022806167602539062, 0.02478933334350586, 0.026772499084472656, 0.028755664825439453, 0.03073883056640625, 0.03272199630737305, 0.034705162048339844, 0.03668832778930664, 0.03867149353027344, 0.040654659271240234, 0.04263782501220703, 0.04462099075317383, 0.046604156494140625, 0.04858732223510742, 0.05057048797607422, 0.052553653717041016, 0.05453681945800781, 0.05651998519897461, 0.058503150939941406, 0.0604863166809082, 0.062469482421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 11.0, 24.0, 34.0, 44.0, 67.0, 83.0, 135.0, 273.0, 529.0, 1044.0, 2064.0, 5263.0, 16146.0, 68871.0, 762525.0, 3148759.0, 146795.0, 27562.0, 8121.0, 2946.0, 1345.0, 670.0, 373.0, 177.0, 140.0, 95.0, 60.0, 30.0, 28.0, 17.0, 16.0, 12.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.021364212036132812, -0.020679473876953125, -0.019994735717773438, -0.01930999755859375, -0.018625259399414062, -0.017940521240234375, -0.017255783081054688, -0.016571044921875, -0.015886306762695312, -0.015201568603515625, -0.014516830444335938, -0.01383209228515625, -0.013147354125976562, -0.012462615966796875, -0.011777877807617188, -0.0110931396484375, -0.010408401489257812, -0.009723663330078125, -0.009038925170898438, -0.00835418701171875, -0.0076694488525390625, -0.006984710693359375, -0.0062999725341796875, -0.005615234375, -0.0049304962158203125, -0.004245758056640625, -0.0035610198974609375, -0.00287628173828125, -0.0021915435791015625, -0.001506805419921875, -0.0008220672607421875, -0.0001373291015625, 0.0005474090576171875, 0.001232147216796875, 0.0019168853759765625, 0.00260162353515625, 0.0032863616943359375, 0.003971099853515625, 0.0046558380126953125, 0.005340576171875, 0.0060253143310546875, 0.006710052490234375, 0.0073947906494140625, 0.00807952880859375, 0.008764266967773438, 0.009449005126953125, 0.010133743286132812, 0.0108184814453125, 0.011503219604492188, 0.012187957763671875, 0.012872695922851562, 0.01355743408203125, 0.014242172241210938, 0.014926910400390625, 0.015611648559570312, 0.01629638671875, 0.016981124877929688, 0.017665863037109375, 0.018350601196289062, 0.01903533935546875, 0.019720077514648438, 0.020404815673828125, 0.021089553833007812, 0.0217742919921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 12.0, 21.0, 35.0, 56.0, 100.0, 249.0, 643.0, 1607.0, 789.0, 250.0, 109.0, 65.0, 38.0, 17.0, 26.0, 13.0, 14.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020477294921875, -0.019609451293945312, -0.018741607666015625, -0.017873764038085938, -0.01700592041015625, -0.016138076782226562, -0.015270233154296875, -0.014402389526367188, -0.0135345458984375, -0.012666702270507812, -0.011798858642578125, -0.010931015014648438, -0.01006317138671875, -0.009195327758789062, -0.008327484130859375, -0.0074596405029296875, -0.006591796875, -0.0057239532470703125, -0.004856109619140625, -0.0039882659912109375, -0.00312042236328125, -0.0022525787353515625, -0.001384735107421875, -0.0005168914794921875, 0.0003509521484375, 0.0012187957763671875, 0.002086639404296875, 0.0029544830322265625, 0.00382232666015625, 0.0046901702880859375, 0.005558013916015625, 0.0064258575439453125, 0.007293701171875, 0.008161544799804688, 0.009029388427734375, 0.009897232055664062, 0.01076507568359375, 0.011632919311523438, 0.012500762939453125, 0.013368606567382812, 0.0142364501953125, 0.015104293823242188, 0.015972137451171875, 0.016839981079101562, 0.01770782470703125, 0.018575668334960938, 0.019443511962890625, 0.020311355590820312, 0.02117919921875, 0.022047042846679688, 0.022914886474609375, 0.023782730102539062, 0.02465057373046875, 0.025518417358398438, 0.026386260986328125, 0.027254104614257812, 0.0281219482421875, 0.028989791870117188, 0.029857635498046875, 0.030725479125976562, 0.03159332275390625, 0.03246116638183594, 0.033329010009765625, 0.03419685363769531, 0.035064697265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 12.0, 22.0, 69.0, 186.0, 264.0, 230.0, 126.0, 50.0, 18.0, 9.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25066709518432617, -0.2449071854352951, -0.23914729058742523, -0.23338738083839417, -0.2276274859905243, -0.22186757624149323, -0.21610766649246216, -0.21034777164459229, -0.2045878767967224, -0.19882796704769135, -0.19306807219982147, -0.1873081624507904, -0.18154826760292053, -0.17578835785388947, -0.1700284481048584, -0.16426855325698853, -0.15850864350795746, -0.1527487337589264, -0.14698883891105652, -0.14122892916202545, -0.13546903431415558, -0.1297091245651245, -0.12394922226667404, -0.11818931996822357, -0.1124294176697731, -0.10666951537132263, -0.10090961307287216, -0.09514971077442169, -0.08938980102539062, -0.08362990617752075, -0.07786999642848969, -0.07211009413003922, -0.06635017693042755, -0.06059027463197708, -0.05483037233352661, -0.04907046630978584, -0.04331056401133537, -0.0375506617128849, -0.031790755689144135, -0.026030853390693665, -0.020270951092243195, -0.01451104786247015, -0.008751144632697105, -0.002991240471601486, 0.0027686618268489838, 0.008528564125299454, 0.014288470149040222, 0.020048372447490692, 0.025808274745941162, 0.03156817704439163, 0.0373280793428421, 0.04308798536658287, 0.04884788766503334, 0.05460778996348381, 0.06036769598722458, 0.06612759828567505, 0.07188750058412552, 0.07764740288257599, 0.08340730518102646, 0.08916720747947693, 0.094927117228508, 0.10068701207637787, 0.10644692182540894, 0.1122068241238594, 0.11796672642230988]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 7.0, 13.0, 21.0, 8.0, 22.0, 33.0, 21.0, 24.0, 30.0, 38.0, 39.0, 42.0, 56.0, 47.0, 51.0, 45.0, 44.0, 44.0, 46.0, 52.0, 41.0, 22.0, 36.0, 27.0, 26.0, 18.0, 15.0, 19.0, 14.0, 14.0, 11.0, 15.0, 15.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05937594175338745, -0.057429276406764984, -0.055482614785432816, -0.05353595316410065, -0.05158928781747818, -0.04964262247085571, -0.047695960849523544, -0.045749299228191376, -0.04380263388156891, -0.04185596853494644, -0.03990930691361427, -0.037962645292282104, -0.03601597994565964, -0.03406931459903717, -0.032122652977705, -0.030175989493727684, -0.028229326009750366, -0.02628266252577305, -0.02433599904179573, -0.022389335557818413, -0.020442672073841095, -0.018496008589863777, -0.01654934510588646, -0.014602681621909142, -0.012656018137931824, -0.010709354653954506, -0.008762691169977188, -0.00681602768599987, -0.0048693642020225525, -0.0029227007180452347, -0.0009760372340679169, 0.0009706262499094009, 0.0029172897338867188, 0.0048639532178640366, 0.006810616701841354, 0.008757280185818672, 0.01070394366979599, 0.012650607153773308, 0.014597270637750626, 0.016543934121727943, 0.01849059760570526, 0.02043726108968258, 0.022383924573659897, 0.024330588057637215, 0.026277251541614532, 0.02822391502559185, 0.030170578509569168, 0.03211724013090134, 0.034063905477523804, 0.03601057082414627, 0.03795723244547844, 0.03990389406681061, 0.041850559413433075, 0.04379722476005554, 0.04574388638138771, 0.04769054800271988, 0.049637213349342346, 0.05158387869596481, 0.05353054031729698, 0.05547720193862915, 0.05742386728525162, 0.059370532631874084, 0.06131719425320625, 0.06326385587453842, 0.06521052122116089]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 7.0, 11.0, 18.0, 22.0, 24.0, 27.0, 42.0, 55.0, 70.0, 93.0, 128.0, 184.0, 246.0, 349.0, 563.0, 979.0, 2755.0, 23760.0, 590485.0, 407264.0, 16471.0, 2323.0, 851.0, 485.0, 346.0, 248.0, 172.0, 142.0, 93.0, 75.0, 38.0, 51.0, 39.0, 33.0, 12.0, 16.0, 16.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0], "bins": [-0.07342529296875, -0.07126140594482422, -0.06909751892089844, -0.06693363189697266, -0.06476974487304688, -0.0626058578491211, -0.06044197082519531, -0.05827808380126953, -0.05611419677734375, -0.05395030975341797, -0.05178642272949219, -0.049622535705566406, -0.047458648681640625, -0.045294761657714844, -0.04313087463378906, -0.04096698760986328, -0.0388031005859375, -0.03663921356201172, -0.03447532653808594, -0.032311439514160156, -0.030147552490234375, -0.027983665466308594, -0.025819778442382812, -0.02365589141845703, -0.02149200439453125, -0.01932811737060547, -0.017164230346679688, -0.015000343322753906, -0.012836456298828125, -0.010672569274902344, -0.008508682250976562, -0.006344795227050781, -0.004180908203125, -0.0020170211791992188, 0.0001468658447265625, 0.0023107528686523438, 0.004474639892578125, 0.006638526916503906, 0.008802413940429688, 0.010966300964355469, 0.01313018798828125, 0.015294075012207031, 0.017457962036132812, 0.019621849060058594, 0.021785736083984375, 0.023949623107910156, 0.026113510131835938, 0.02827739715576172, 0.0304412841796875, 0.03260517120361328, 0.03476905822753906, 0.036932945251464844, 0.039096832275390625, 0.041260719299316406, 0.04342460632324219, 0.04558849334716797, 0.04775238037109375, 0.04991626739501953, 0.05208015441894531, 0.054244041442871094, 0.056407928466796875, 0.058571815490722656, 0.06073570251464844, 0.06289958953857422, 0.0650634765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 65.0, 191.0, 350.0, 248.0, 123.0, 13.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06451416015625, -0.06254434585571289, -0.06057453155517578, -0.05860471725463867, -0.05663490295410156, -0.05466508865356445, -0.052695274353027344, -0.050725460052490234, -0.048755645751953125, -0.046785831451416016, -0.044816017150878906, -0.0428462028503418, -0.04087638854980469, -0.03890657424926758, -0.03693675994873047, -0.03496694564819336, -0.03299713134765625, -0.03102731704711914, -0.02905750274658203, -0.027087688446044922, -0.025117874145507812, -0.023148059844970703, -0.021178245544433594, -0.019208431243896484, -0.017238616943359375, -0.015268802642822266, -0.013298988342285156, -0.011329174041748047, -0.009359359741210938, -0.007389545440673828, -0.005419731140136719, -0.0034499168395996094, -0.0014801025390625, 0.0004897117614746094, 0.0024595260620117188, 0.004429340362548828, 0.0063991546630859375, 0.008368968963623047, 0.010338783264160156, 0.012308597564697266, 0.014278411865234375, 0.016248226165771484, 0.018218040466308594, 0.020187854766845703, 0.022157669067382812, 0.024127483367919922, 0.02609729766845703, 0.02806711196899414, 0.03003692626953125, 0.03200674057006836, 0.03397655487060547, 0.03594636917114258, 0.03791618347167969, 0.0398859977722168, 0.041855812072753906, 0.043825626373291016, 0.045795440673828125, 0.047765254974365234, 0.049735069274902344, 0.05170488357543945, 0.05367469787597656, 0.05564451217651367, 0.05761432647705078, 0.05958414077758789, 0.061553955078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 4.0, 6.0, 6.0, 14.0, 16.0, 30.0, 29.0, 48.0, 82.0, 139.0, 248.0, 664.0, 2066.0, 11586.0, 123904.0, 765219.0, 129001.0, 12027.0, 2161.0, 651.0, 261.0, 129.0, 73.0, 41.0, 36.0, 19.0, 30.0, 12.0, 11.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.056640625, -0.05489826202392578, -0.05315589904785156, -0.051413536071777344, -0.049671173095703125, -0.047928810119628906, -0.04618644714355469, -0.04444408416748047, -0.04270172119140625, -0.04095935821533203, -0.03921699523925781, -0.037474632263183594, -0.035732269287109375, -0.033989906311035156, -0.03224754333496094, -0.03050518035888672, -0.0287628173828125, -0.02702045440673828, -0.025278091430664062, -0.023535728454589844, -0.021793365478515625, -0.020051002502441406, -0.018308639526367188, -0.01656627655029297, -0.01482391357421875, -0.013081550598144531, -0.011339187622070312, -0.009596824645996094, -0.007854461669921875, -0.006112098693847656, -0.0043697357177734375, -0.0026273727416992188, -0.000885009765625, 0.0008573532104492188, 0.0025997161865234375, 0.004342079162597656, 0.006084442138671875, 0.007826805114746094, 0.009569168090820312, 0.011311531066894531, 0.01305389404296875, 0.014796257019042969, 0.016538619995117188, 0.018280982971191406, 0.020023345947265625, 0.021765708923339844, 0.023508071899414062, 0.02525043487548828, 0.0269927978515625, 0.02873516082763672, 0.030477523803710938, 0.032219886779785156, 0.033962249755859375, 0.035704612731933594, 0.03744697570800781, 0.03918933868408203, 0.04093170166015625, 0.04267406463623047, 0.04441642761230469, 0.046158790588378906, 0.047901153564453125, 0.049643516540527344, 0.05138587951660156, 0.05312824249267578, 0.05487060546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 11.0, 17.0, 12.0, 20.0, 13.0, 16.0, 31.0, 33.0, 36.0, 38.0, 43.0, 43.0, 48.0, 40.0, 39.0, 41.0, 42.0, 48.0, 58.0, 45.0, 36.0, 40.0, 28.0, 39.0, 24.0, 23.0, 13.0, 21.0, 15.0, 21.0, 8.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027740478515625, -0.026801586151123047, -0.025862693786621094, -0.02492380142211914, -0.023984909057617188, -0.023046016693115234, -0.02210712432861328, -0.021168231964111328, -0.020229339599609375, -0.019290447235107422, -0.01835155487060547, -0.017412662506103516, -0.016473770141601562, -0.01553487777709961, -0.014595985412597656, -0.013657093048095703, -0.01271820068359375, -0.011779308319091797, -0.010840415954589844, -0.00990152359008789, -0.008962631225585938, -0.008023738861083984, -0.007084846496582031, -0.006145954132080078, -0.005207061767578125, -0.004268169403076172, -0.0033292770385742188, -0.0023903846740722656, -0.0014514923095703125, -0.0005125999450683594, 0.00042629241943359375, 0.0013651847839355469, 0.0023040771484375, 0.003242969512939453, 0.004181861877441406, 0.005120754241943359, 0.0060596466064453125, 0.006998538970947266, 0.007937431335449219, 0.008876323699951172, 0.009815216064453125, 0.010754108428955078, 0.011693000793457031, 0.012631893157958984, 0.013570785522460938, 0.01450967788696289, 0.015448570251464844, 0.016387462615966797, 0.01732635498046875, 0.018265247344970703, 0.019204139709472656, 0.02014303207397461, 0.021081924438476562, 0.022020816802978516, 0.02295970916748047, 0.023898601531982422, 0.024837493896484375, 0.025776386260986328, 0.02671527862548828, 0.027654170989990234, 0.028593063354492188, 0.02953195571899414, 0.030470848083496094, 0.03140974044799805, 0.0323486328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 9.0, 9.0, 22.0, 33.0, 45.0, 62.0, 65.0, 119.0, 148.0, 233.0, 314.0, 506.0, 886.0, 1416.0, 2556.0, 4626.0, 9319.0, 20374.0, 48927.0, 136021.0, 357785.0, 290486.0, 102263.0, 38964.0, 16519.0, 7540.0, 3841.0, 2068.0, 1214.0, 723.0, 430.0, 331.0, 186.0, 146.0, 111.0, 58.0, 50.0, 34.0, 22.0, 15.0, 22.0, 7.0, 4.0, 8.0, 4.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00910186767578125, -0.00877523422241211, -0.008448600769042969, -0.008121967315673828, -0.0077953338623046875, -0.007468700408935547, -0.007142066955566406, -0.006815433502197266, -0.006488800048828125, -0.006162166595458984, -0.005835533142089844, -0.005508899688720703, -0.0051822662353515625, -0.004855632781982422, -0.004528999328613281, -0.004202365875244141, -0.003875732421875, -0.0035490989685058594, -0.0032224655151367188, -0.002895832061767578, -0.0025691986083984375, -0.002242565155029297, -0.0019159317016601562, -0.0015892982482910156, -0.001262664794921875, -0.0009360313415527344, -0.0006093978881835938, -0.0002827644348144531, 4.38690185546875e-05, 0.0003705024719238281, 0.0006971359252929688, 0.0010237693786621094, 0.00135040283203125, 0.0016770362854003906, 0.0020036697387695312, 0.002330303192138672, 0.0026569366455078125, 0.002983570098876953, 0.0033102035522460938, 0.0036368370056152344, 0.003963470458984375, 0.004290103912353516, 0.004616737365722656, 0.004943370819091797, 0.0052700042724609375, 0.005596637725830078, 0.005923271179199219, 0.006249904632568359, 0.0065765380859375, 0.006903171539306641, 0.007229804992675781, 0.007556438446044922, 0.007883071899414062, 0.008209705352783203, 0.008536338806152344, 0.008862972259521484, 0.009189605712890625, 0.009516239166259766, 0.009842872619628906, 0.010169506072998047, 0.010496139526367188, 0.010822772979736328, 0.011149406433105469, 0.01147603988647461, 0.01180267333984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 11.0, 6.0, 11.0, 20.0, 21.0, 33.0, 32.0, 48.0, 58.0, 75.0, 86.0, 83.0, 95.0, 64.0, 66.0, 63.0, 46.0, 30.0, 29.0, 19.0, 21.0, 13.0, 9.0, 7.0, 8.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.654594421386719e-05, -8.419528603553772e-05, -8.184462785720825e-05, -7.949396967887878e-05, -7.714331150054932e-05, -7.479265332221985e-05, -7.244199514389038e-05, -7.009133696556091e-05, -6.774067878723145e-05, -6.539002060890198e-05, -6.303936243057251e-05, -6.068870425224304e-05, -5.8338046073913574e-05, -5.5987387895584106e-05, -5.363672971725464e-05, -5.128607153892517e-05, -4.89354133605957e-05, -4.6584755182266235e-05, -4.423409700393677e-05, -4.18834388256073e-05, -3.953278064727783e-05, -3.7182122468948364e-05, -3.4831464290618896e-05, -3.248080611228943e-05, -3.013014793395996e-05, -2.7779489755630493e-05, -2.5428831577301025e-05, -2.3078173398971558e-05, -2.072751522064209e-05, -1.8376857042312622e-05, -1.6026198863983154e-05, -1.3675540685653687e-05, -1.1324882507324219e-05, -8.974224328994751e-06, -6.623566150665283e-06, -4.2729079723358154e-06, -1.9222497940063477e-06, 4.284083843231201e-07, 2.779066562652588e-06, 5.129724740982056e-06, 7.4803829193115234e-06, 9.831041097640991e-06, 1.2181699275970459e-05, 1.4532357454299927e-05, 1.6883015632629395e-05, 1.9233673810958862e-05, 2.158433198928833e-05, 2.3934990167617798e-05, 2.6285648345947266e-05, 2.8636306524276733e-05, 3.09869647026062e-05, 3.333762288093567e-05, 3.568828105926514e-05, 3.8038939237594604e-05, 4.038959741592407e-05, 4.274025559425354e-05, 4.509091377258301e-05, 4.7441571950912476e-05, 4.979223012924194e-05, 5.214288830757141e-05, 5.449354648590088e-05, 5.684420466423035e-05, 5.9194862842559814e-05, 6.154552102088928e-05, 6.389617919921875e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 11.0, 6.0, 12.0, 15.0, 20.0, 33.0, 47.0, 73.0, 102.0, 189.0, 273.0, 405.0, 739.0, 1332.0, 2660.0, 5914.0, 13455.0, 33805.0, 99478.0, 346051.0, 372799.0, 108021.0, 36357.0, 14418.0, 6116.0, 2838.0, 1457.0, 697.0, 402.0, 266.0, 178.0, 121.0, 75.0, 48.0, 46.0, 25.0, 24.0, 17.0, 7.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.01499176025390625, -0.014575719833374023, -0.014159679412841797, -0.01374363899230957, -0.013327598571777344, -0.012911558151245117, -0.01249551773071289, -0.012079477310180664, -0.011663436889648438, -0.011247396469116211, -0.010831356048583984, -0.010415315628051758, -0.009999275207519531, -0.009583234786987305, -0.009167194366455078, -0.008751153945922852, -0.008335113525390625, -0.007919073104858398, -0.007503032684326172, -0.007086992263793945, -0.006670951843261719, -0.006254911422729492, -0.005838871002197266, -0.005422830581665039, -0.0050067901611328125, -0.004590749740600586, -0.004174709320068359, -0.003758668899536133, -0.0033426284790039062, -0.0029265880584716797, -0.002510547637939453, -0.0020945072174072266, -0.001678466796875, -0.0012624263763427734, -0.0008463859558105469, -0.0004303455352783203, -1.430511474609375e-05, 0.0004017353057861328, 0.0008177757263183594, 0.001233816146850586, 0.0016498565673828125, 0.002065896987915039, 0.0024819374084472656, 0.002897977828979492, 0.0033140182495117188, 0.0037300586700439453, 0.004146099090576172, 0.0045621395111083984, 0.004978179931640625, 0.0053942203521728516, 0.005810260772705078, 0.006226301193237305, 0.006642341613769531, 0.007058382034301758, 0.007474422454833984, 0.007890462875366211, 0.008306503295898438, 0.008722543716430664, 0.00913858413696289, 0.009554624557495117, 0.009970664978027344, 0.01038670539855957, 0.010802745819091797, 0.011218786239624023, 0.01163482666015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 13.0, 15.0, 13.0, 14.0, 18.0, 28.0, 33.0, 57.0, 68.0, 88.0, 90.0, 109.0, 101.0, 85.0, 53.0, 60.0, 31.0, 25.0, 20.0, 19.0, 14.0, 11.0, 4.0, 6.0, 5.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.013248682022094727, -0.012779712677001953, -0.01231074333190918, -0.011841773986816406, -0.011372804641723633, -0.01090383529663086, -0.010434865951538086, -0.009965896606445312, -0.009496927261352539, -0.009027957916259766, -0.008558988571166992, -0.008090019226074219, -0.007621049880981445, -0.007152080535888672, -0.0066831111907958984, -0.006214141845703125, -0.0057451725006103516, -0.005276203155517578, -0.004807233810424805, -0.004338264465332031, -0.003869295120239258, -0.0034003257751464844, -0.002931356430053711, -0.0024623870849609375, -0.001993417739868164, -0.0015244483947753906, -0.0010554790496826172, -0.0005865097045898438, -0.00011754035949707031, 0.0003514289855957031, 0.0008203983306884766, 0.00128936767578125, 0.0017583370208740234, 0.002227306365966797, 0.0026962757110595703, 0.0031652450561523438, 0.003634214401245117, 0.004103183746337891, 0.004572153091430664, 0.0050411224365234375, 0.005510091781616211, 0.005979061126708984, 0.006448030471801758, 0.006916999816894531, 0.007385969161987305, 0.007854938507080078, 0.008323907852172852, 0.008792877197265625, 0.009261846542358398, 0.009730815887451172, 0.010199785232543945, 0.010668754577636719, 0.011137723922729492, 0.011606693267822266, 0.012075662612915039, 0.012544631958007812, 0.013013601303100586, 0.01348257064819336, 0.013951539993286133, 0.014420509338378906, 0.01488947868347168, 0.015358448028564453, 0.015827417373657227, 0.01629638671875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 53.0, 207.0, 413.0, 265.0, 51.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58975750207901, -0.5752612948417664, -0.5607650279998779, -0.5462688207626343, -0.5317725539207458, -0.5172763466835022, -0.5027800798416138, -0.4882838726043701, -0.4737876057624817, -0.45929136872291565, -0.4447951316833496, -0.43029889464378357, -0.41580265760421753, -0.4013064205646515, -0.38681018352508545, -0.3723139762878418, -0.35781773924827576, -0.3433215022087097, -0.3288252651691437, -0.31432902812957764, -0.2998327910900116, -0.28533655405044556, -0.2708403468132019, -0.2563440799713135, -0.24184785783290863, -0.2273516207933426, -0.21285538375377655, -0.1983591616153717, -0.18386292457580566, -0.16936668753623962, -0.15487045049667358, -0.14037421345710754, -0.1258779764175415, -0.11138173937797546, -0.09688550233840942, -0.08238927274942398, -0.06789303570985794, -0.0533967986702919, -0.03890056908130646, -0.024404332041740417, -0.009908095002174377, 0.004588140174746513, 0.019084375351667404, 0.033580608665943146, 0.048076845705509186, 0.06257308274507523, 0.07706931233406067, 0.09156554937362671, 0.10606178641319275, 0.12055802345275879, 0.13505426049232483, 0.14955049753189087, 0.1640467345714569, 0.17854297161102295, 0.1930391937494278, 0.20753543078899384, 0.22203166782855988, 0.23652790486812592, 0.25102412700653076, 0.2655203640460968, 0.28001660108566284, 0.2945128381252289, 0.3090090751647949, 0.32350531220436096, 0.338001549243927]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 6.0, 15.0, 16.0, 16.0, 16.0, 20.0, 19.0, 32.0, 42.0, 33.0, 26.0, 33.0, 43.0, 37.0, 45.0, 32.0, 43.0, 41.0, 48.0, 29.0, 44.0, 37.0, 33.0, 28.0, 25.0, 31.0, 22.0, 34.0, 34.0, 14.0, 10.0, 14.0, 12.0, 15.0, 14.0, 3.0, 5.0, 5.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09329289197921753, -0.09056613594293594, -0.08783937245607376, -0.08511261641979218, -0.08238585293292999, -0.07965909689664841, -0.07693234086036682, -0.07420557737350464, -0.07147882133722305, -0.06875206530094147, -0.06602530181407928, -0.0632985457777977, -0.060571786016225815, -0.05784502625465393, -0.055118270218372345, -0.05239151045680046, -0.04966475069522858, -0.04693799093365669, -0.04421123117208481, -0.04148447513580322, -0.03875771537423134, -0.036030955612659454, -0.03330419957637787, -0.030577439814805984, -0.0278506800532341, -0.025123920291662216, -0.02239716239273548, -0.019670404493808746, -0.016943644732236862, -0.014216885901987553, -0.011490127071738243, -0.008763369172811508, -0.006036609411239624, -0.0033098505809903145, -0.0005830917507410049, 0.0021436670795083046, 0.004870425909757614, 0.007597184740006924, 0.010323943570256233, 0.013050701469182968, 0.015777461230754852, 0.018504220992326736, 0.02123097889125347, 0.023957736790180206, 0.02668449655175209, 0.029411256313323975, 0.03213801234960556, 0.034864772111177444, 0.03759153187274933, 0.04031829163432121, 0.0430450513958931, 0.04577180743217468, 0.04849856719374657, 0.05122532695531845, 0.05395208299160004, 0.05667884275317192, 0.059405602514743805, 0.06213236227631569, 0.06485912203788757, 0.06758587807416916, 0.07031263411045074, 0.07303939759731293, 0.07576615363359451, 0.0784929096698761, 0.08121967315673828]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 10.0, 8.0, 24.0, 155.0, 2021.0, 4125488.0, 65563.0, 864.0, 105.0, 31.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26702117919921875, -0.2588958740234375, -0.25077056884765625, -0.242645263671875, -0.23451995849609375, -0.2263946533203125, -0.21826934814453125, -0.21014404296875, -0.20201873779296875, -0.1938934326171875, -0.18576812744140625, -0.177642822265625, -0.16951751708984375, -0.1613922119140625, -0.15326690673828125, -0.1451416015625, -0.13701629638671875, -0.1288909912109375, -0.12076568603515625, -0.112640380859375, -0.10451507568359375, -0.0963897705078125, -0.08826446533203125, -0.08013916015625, -0.07201385498046875, -0.0638885498046875, -0.05576324462890625, -0.047637939453125, -0.03951263427734375, -0.0313873291015625, -0.02326202392578125, -0.01513671875, -0.00701141357421875, 0.0011138916015625, 0.00923919677734375, 0.017364501953125, 0.02548980712890625, 0.0336151123046875, 0.04174041748046875, 0.04986572265625, 0.05799102783203125, 0.0661163330078125, 0.07424163818359375, 0.082366943359375, 0.09049224853515625, 0.0986175537109375, 0.10674285888671875, 0.1148681640625, 0.12299346923828125, 0.1311187744140625, 0.13924407958984375, 0.147369384765625, 0.15549468994140625, 0.1636199951171875, 0.17174530029296875, 0.17987060546875, 0.18799591064453125, 0.1961212158203125, 0.20424652099609375, 0.212371826171875, 0.22049713134765625, 0.2286224365234375, 0.23674774169921875, 0.244873046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 112.0, 231.0, 312.0, 224.0, 88.0, 15.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06519222259521484, -0.06318473815917969, -0.06117725372314453, -0.059169769287109375, -0.05716228485107422, -0.05515480041503906, -0.053147315979003906, -0.05113983154296875, -0.049132347106933594, -0.04712486267089844, -0.04511737823486328, -0.043109893798828125, -0.04110240936279297, -0.03909492492675781, -0.037087440490722656, -0.0350799560546875, -0.033072471618652344, -0.031064987182617188, -0.02905750274658203, -0.027050018310546875, -0.02504253387451172, -0.023035049438476562, -0.021027565002441406, -0.01902008056640625, -0.017012596130371094, -0.015005111694335938, -0.012997627258300781, -0.010990142822265625, -0.008982658386230469, -0.0069751739501953125, -0.004967689514160156, -0.002960205078125, -0.0009527206420898438, 0.0010547637939453125, 0.0030622482299804688, 0.005069732666015625, 0.007077217102050781, 0.009084701538085938, 0.011092185974121094, 0.01309967041015625, 0.015107154846191406, 0.017114639282226562, 0.01912212371826172, 0.021129608154296875, 0.02313709259033203, 0.025144577026367188, 0.027152061462402344, 0.0291595458984375, 0.031167030334472656, 0.03317451477050781, 0.03518199920654297, 0.037189483642578125, 0.03919696807861328, 0.04120445251464844, 0.043211936950683594, 0.04521942138671875, 0.047226905822753906, 0.04923439025878906, 0.05124187469482422, 0.053249359130859375, 0.05525684356689453, 0.05726432800292969, 0.059271812438964844, 0.061279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 16.0, 10.0, 18.0, 35.0, 59.0, 91.0, 142.0, 199.0, 382.0, 753.0, 1605.0, 4455.0, 14077.0, 58432.0, 427589.0, 3336988.0, 285386.0, 45675.0, 11502.0, 3672.0, 1436.0, 671.0, 433.0, 234.0, 139.0, 81.0, 50.0, 40.0, 30.0, 20.0, 10.0, 8.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023345947265625, -0.02257847785949707, -0.02181100845336914, -0.02104353904724121, -0.02027606964111328, -0.01950860023498535, -0.018741130828857422, -0.017973661422729492, -0.017206192016601562, -0.016438722610473633, -0.015671253204345703, -0.014903783798217773, -0.014136314392089844, -0.013368844985961914, -0.012601375579833984, -0.011833906173706055, -0.011066436767578125, -0.010298967361450195, -0.009531497955322266, -0.008764028549194336, -0.007996559143066406, -0.0072290897369384766, -0.006461620330810547, -0.005694150924682617, -0.0049266815185546875, -0.004159212112426758, -0.003391742706298828, -0.0026242733001708984, -0.0018568038940429688, -0.001089334487915039, -0.0003218650817871094, 0.0004456043243408203, 0.00121307373046875, 0.0019805431365966797, 0.0027480125427246094, 0.003515481948852539, 0.004282951354980469, 0.0050504207611083984, 0.005817890167236328, 0.006585359573364258, 0.0073528289794921875, 0.008120298385620117, 0.008887767791748047, 0.009655237197875977, 0.010422706604003906, 0.011190176010131836, 0.011957645416259766, 0.012725114822387695, 0.013492584228515625, 0.014260053634643555, 0.015027523040771484, 0.015794992446899414, 0.016562461853027344, 0.017329931259155273, 0.018097400665283203, 0.018864870071411133, 0.019632339477539062, 0.020399808883666992, 0.021167278289794922, 0.02193474769592285, 0.02270221710205078, 0.02346968650817871, 0.02423715591430664, 0.02500462532043457, 0.0257720947265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 13.0, 17.0, 33.0, 57.0, 80.0, 124.0, 245.0, 565.0, 1221.0, 888.0, 373.0, 187.0, 78.0, 64.0, 36.0, 33.0, 16.0, 13.0, 7.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176849365234375, -0.016833066940307617, -0.015981197357177734, -0.015129327774047852, -0.014277458190917969, -0.013425588607788086, -0.012573719024658203, -0.01172184944152832, -0.010869979858398438, -0.010018110275268555, -0.009166240692138672, -0.008314371109008789, -0.007462501525878906, -0.0066106319427490234, -0.005758762359619141, -0.004906892776489258, -0.004055023193359375, -0.003203153610229492, -0.0023512840270996094, -0.0014994144439697266, -0.0006475448608398438, 0.00020432472229003906, 0.0010561943054199219, 0.0019080638885498047, 0.0027599334716796875, 0.0036118030548095703, 0.004463672637939453, 0.005315542221069336, 0.006167411804199219, 0.0070192813873291016, 0.007871150970458984, 0.008723020553588867, 0.00957489013671875, 0.010426759719848633, 0.011278629302978516, 0.012130498886108398, 0.012982368469238281, 0.013834238052368164, 0.014686107635498047, 0.01553797721862793, 0.016389846801757812, 0.017241716384887695, 0.018093585968017578, 0.01894545555114746, 0.019797325134277344, 0.020649194717407227, 0.02150106430053711, 0.022352933883666992, 0.023204803466796875, 0.024056673049926758, 0.02490854263305664, 0.025760412216186523, 0.026612281799316406, 0.02746415138244629, 0.028316020965576172, 0.029167890548706055, 0.030019760131835938, 0.03087162971496582, 0.0317234992980957, 0.032575368881225586, 0.03342723846435547, 0.03427910804748535, 0.035130977630615234, 0.03598284721374512, 0.036834716796875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 21.0, 41.0, 84.0, 139.0, 186.0, 186.0, 151.0, 90.0, 43.0, 17.0, 13.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08364906907081604, -0.07913349568843842, -0.07461792975664139, -0.07010236382484436, -0.06558679044246674, -0.06107122078537941, -0.056555651128292084, -0.05204008147120476, -0.04752451181411743, -0.043008942157030106, -0.03849337249994278, -0.033977802842855453, -0.029462233185768127, -0.0249466635286808, -0.020431093871593475, -0.01591552421450615, -0.011399954557418823, -0.006884384900331497, -0.002368815243244171, 0.002146754413843155, 0.006662324070930481, 0.011177893728017807, 0.015693463385105133, 0.02020903304219246, 0.024724602699279785, 0.02924017235636711, 0.03375574201345444, 0.03827131167054176, 0.04278688132762909, 0.047302450984716415, 0.05181802064180374, 0.05633359029889107, 0.0608491450548172, 0.06536471843719482, 0.06988028436899185, 0.07439585030078888, 0.0789114236831665, 0.08342699706554413, 0.08794256299734116, 0.09245812892913818, 0.09697370231151581, 0.10148927569389343, 0.10600484162569046, 0.11052040755748749, 0.11503598093986511, 0.11955155432224274, 0.12406712025403976, 0.1285826861858368, 0.13309825956821442, 0.13761383295059204, 0.14212939143180847, 0.1466449648141861, 0.15116053819656372, 0.15567611157894135, 0.16019168496131897, 0.1647072434425354, 0.16922281682491302, 0.17373839020729065, 0.17825394868850708, 0.1827695220708847, 0.18728509545326233, 0.19180066883563995, 0.19631624221801758, 0.200831800699234, 0.20534737408161163]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 15.0, 15.0, 16.0, 11.0, 22.0, 18.0, 19.0, 24.0, 28.0, 24.0, 26.0, 35.0, 33.0, 47.0, 58.0, 51.0, 41.0, 49.0, 46.0, 45.0, 34.0, 39.0, 37.0, 53.0, 33.0, 28.0, 27.0, 23.0, 18.0, 20.0, 13.0, 12.0, 8.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.06870871782302856, -0.06682983785867691, -0.06495095789432526, -0.063072070479393, -0.06119319051504135, -0.0593143105506897, -0.057435426861047745, -0.05555654317140579, -0.05367766320705414, -0.051798783242702484, -0.04991989955306053, -0.04804101586341858, -0.046162135899066925, -0.04428325593471527, -0.04240437224507332, -0.040525488555431366, -0.03864660859107971, -0.03676772862672806, -0.034888844937086105, -0.03300996124744415, -0.0311310812830925, -0.029252199456095695, -0.027373317629098892, -0.02549443580210209, -0.023615553975105286, -0.021736672148108482, -0.01985779032111168, -0.017978908494114876, -0.016100026667118073, -0.01422114484012127, -0.012342263013124466, -0.010463381186127663, -0.00858449935913086, -0.006705617532134056, -0.004826735705137253, -0.0029478538781404495, -0.0010689720511436462, 0.000809909775853157, 0.0026887916028499603, 0.004567673429846764, 0.006446555256843567, 0.00832543708384037, 0.010204318910837173, 0.012083200737833977, 0.01396208256483078, 0.015840964391827583, 0.017719846218824387, 0.01959872804582119, 0.021477609872817993, 0.023356491699814796, 0.0252353735268116, 0.027114255353808403, 0.028993137180805206, 0.03087201900780201, 0.03275090083479881, 0.034629784524440765, 0.03650866448879242, 0.038387544453144073, 0.040266428142786026, 0.04214531183242798, 0.04402419179677963, 0.04590307176113129, 0.04778195545077324, 0.04966083914041519, 0.051539719104766846]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 2.0, 10.0, 14.0, 13.0, 29.0, 36.0, 48.0, 71.0, 99.0, 124.0, 196.0, 288.0, 437.0, 831.0, 2239.0, 14236.0, 343520.0, 656363.0, 24412.0, 3098.0, 940.0, 470.0, 330.0, 222.0, 157.0, 97.0, 64.0, 58.0, 43.0, 28.0, 18.0, 18.0, 12.0, 7.0, 6.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07373046875, -0.07101058959960938, -0.06829071044921875, -0.06557083129882812, -0.0628509521484375, -0.060131072998046875, -0.05741119384765625, -0.054691314697265625, -0.051971435546875, -0.049251556396484375, -0.04653167724609375, -0.043811798095703125, -0.0410919189453125, -0.038372039794921875, -0.03565216064453125, -0.032932281494140625, -0.03021240234375, -0.027492523193359375, -0.02477264404296875, -0.022052764892578125, -0.0193328857421875, -0.016613006591796875, -0.01389312744140625, -0.011173248291015625, -0.008453369140625, -0.005733489990234375, -0.00301361083984375, -0.000293731689453125, 0.0024261474609375, 0.005146026611328125, 0.00786590576171875, 0.010585784912109375, 0.0133056640625, 0.016025543212890625, 0.01874542236328125, 0.021465301513671875, 0.0241851806640625, 0.026905059814453125, 0.02962493896484375, 0.032344818115234375, 0.035064697265625, 0.037784576416015625, 0.04050445556640625, 0.043224334716796875, 0.0459442138671875, 0.048664093017578125, 0.05138397216796875, 0.054103851318359375, 0.05682373046875, 0.059543609619140625, 0.06226348876953125, 0.06498336791992188, 0.0677032470703125, 0.07042312622070312, 0.07314300537109375, 0.07586288452148438, 0.078582763671875, 0.08130264282226562, 0.08402252197265625, 0.08674240112304688, 0.0894622802734375, 0.09218215942382812, 0.09490203857421875, 0.09762191772460938, 0.100341796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 73.0, 205.0, 315.0, 252.0, 119.0, 23.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06360816955566406, -0.061603546142578125, -0.05959892272949219, -0.05759429931640625, -0.05558967590332031, -0.053585052490234375, -0.05158042907714844, -0.0495758056640625, -0.04757118225097656, -0.045566558837890625, -0.04356193542480469, -0.04155731201171875, -0.03955268859863281, -0.037548065185546875, -0.03554344177246094, -0.033538818359375, -0.03153419494628906, -0.029529571533203125, -0.027524948120117188, -0.02552032470703125, -0.023515701293945312, -0.021511077880859375, -0.019506454467773438, -0.0175018310546875, -0.015497207641601562, -0.013492584228515625, -0.011487960815429688, -0.00948333740234375, -0.0074787139892578125, -0.005474090576171875, -0.0034694671630859375, -0.00146484375, 0.0005397796630859375, 0.002544403076171875, 0.0045490264892578125, 0.00655364990234375, 0.008558273315429688, 0.010562896728515625, 0.012567520141601562, 0.0145721435546875, 0.016576766967773438, 0.018581390380859375, 0.020586013793945312, 0.02259063720703125, 0.024595260620117188, 0.026599884033203125, 0.028604507446289062, 0.030609130859375, 0.03261375427246094, 0.034618377685546875, 0.03662300109863281, 0.03862762451171875, 0.04063224792480469, 0.042636871337890625, 0.04464149475097656, 0.0466461181640625, 0.04865074157714844, 0.050655364990234375, 0.05265998840332031, 0.05466461181640625, 0.05666923522949219, 0.058673858642578125, 0.06067848205566406, 0.06268310546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 15.0, 11.0, 26.0, 50.0, 87.0, 142.0, 314.0, 812.0, 2184.0, 8872.0, 56849.0, 604162.0, 334731.0, 31644.0, 5819.0, 1635.0, 628.0, 265.0, 127.0, 65.0, 27.0, 20.0, 21.0, 12.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06085205078125, -0.058814048767089844, -0.05677604675292969, -0.05473804473876953, -0.052700042724609375, -0.05066204071044922, -0.04862403869628906, -0.046586036682128906, -0.04454803466796875, -0.042510032653808594, -0.04047203063964844, -0.03843402862548828, -0.036396026611328125, -0.03435802459716797, -0.03232002258300781, -0.030282020568847656, -0.0282440185546875, -0.026206016540527344, -0.024168014526367188, -0.02213001251220703, -0.020092010498046875, -0.01805400848388672, -0.016016006469726562, -0.013978004455566406, -0.01194000244140625, -0.009902000427246094, -0.007863998413085938, -0.005825996398925781, -0.003787994384765625, -0.0017499923706054688, 0.0002880096435546875, 0.0023260116577148438, 0.004364013671875, 0.006402015686035156, 0.008440017700195312, 0.010478019714355469, 0.012516021728515625, 0.014554023742675781, 0.016592025756835938, 0.018630027770996094, 0.02066802978515625, 0.022706031799316406, 0.024744033813476562, 0.02678203582763672, 0.028820037841796875, 0.03085803985595703, 0.03289604187011719, 0.034934043884277344, 0.0369720458984375, 0.039010047912597656, 0.04104804992675781, 0.04308605194091797, 0.045124053955078125, 0.04716205596923828, 0.04920005798339844, 0.051238059997558594, 0.05327606201171875, 0.055314064025878906, 0.05735206604003906, 0.05939006805419922, 0.061428070068359375, 0.06346607208251953, 0.06550407409667969, 0.06754207611083984, 0.069580078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 3.0, 5.0, 11.0, 15.0, 23.0, 23.0, 30.0, 38.0, 22.0, 40.0, 45.0, 64.0, 56.0, 64.0, 72.0, 60.0, 53.0, 42.0, 52.0, 47.0, 43.0, 37.0, 33.0, 21.0, 23.0, 17.0, 16.0, 10.0, 7.0, 3.0, 4.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05810546875, -0.056560516357421875, -0.05501556396484375, -0.053470611572265625, -0.0519256591796875, -0.050380706787109375, -0.04883575439453125, -0.047290802001953125, -0.045745849609375, -0.044200897216796875, -0.04265594482421875, -0.041110992431640625, -0.0395660400390625, -0.038021087646484375, -0.03647613525390625, -0.034931182861328125, -0.03338623046875, -0.031841278076171875, -0.03029632568359375, -0.028751373291015625, -0.0272064208984375, -0.025661468505859375, -0.02411651611328125, -0.022571563720703125, -0.021026611328125, -0.019481658935546875, -0.01793670654296875, -0.016391754150390625, -0.0148468017578125, -0.013301849365234375, -0.01175689697265625, -0.010211944580078125, -0.0086669921875, -0.007122039794921875, -0.00557708740234375, -0.004032135009765625, -0.0024871826171875, -0.000942230224609375, 0.00060272216796875, 0.002147674560546875, 0.003692626953125, 0.005237579345703125, 0.00678253173828125, 0.008327484130859375, 0.0098724365234375, 0.011417388916015625, 0.01296234130859375, 0.014507293701171875, 0.01605224609375, 0.017597198486328125, 0.01914215087890625, 0.020687103271484375, 0.0222320556640625, 0.023777008056640625, 0.02532196044921875, 0.026866912841796875, 0.028411865234375, 0.029956817626953125, 0.03150177001953125, 0.033046722412109375, 0.0345916748046875, 0.036136627197265625, 0.03768157958984375, 0.039226531982421875, 0.040771484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 13.0, 22.0, 52.0, 75.0, 121.0, 169.0, 305.0, 529.0, 848.0, 1532.0, 2950.0, 6221.0, 15693.0, 54707.0, 352222.0, 505340.0, 73350.0, 19354.0, 7335.0, 3462.0, 1776.0, 1017.0, 551.0, 348.0, 217.0, 126.0, 67.0, 48.0, 29.0, 15.0, 12.0, 16.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023673295974731445, -0.02288675308227539, -0.022100210189819336, -0.02131366729736328, -0.020527124404907227, -0.019740581512451172, -0.018954038619995117, -0.018167495727539062, -0.017380952835083008, -0.016594409942626953, -0.0158078670501709, -0.015021324157714844, -0.014234781265258789, -0.013448238372802734, -0.01266169548034668, -0.011875152587890625, -0.01108860969543457, -0.010302066802978516, -0.009515523910522461, -0.008728981018066406, -0.007942438125610352, -0.007155895233154297, -0.006369352340698242, -0.0055828094482421875, -0.004796266555786133, -0.004009723663330078, -0.0032231807708740234, -0.0024366378784179688, -0.001650094985961914, -0.0008635520935058594, -7.700920104980469e-05, 0.00070953369140625, 0.0014960765838623047, 0.0022826194763183594, 0.003069162368774414, 0.0038557052612304688, 0.0046422481536865234, 0.005428791046142578, 0.006215333938598633, 0.0070018768310546875, 0.007788419723510742, 0.008574962615966797, 0.009361505508422852, 0.010148048400878906, 0.010934591293334961, 0.011721134185791016, 0.01250767707824707, 0.013294219970703125, 0.01408076286315918, 0.014867305755615234, 0.01565384864807129, 0.016440391540527344, 0.0172269344329834, 0.018013477325439453, 0.018800020217895508, 0.019586563110351562, 0.020373106002807617, 0.021159648895263672, 0.021946191787719727, 0.02273273468017578, 0.023519277572631836, 0.02430582046508789, 0.025092363357543945, 0.02587890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 12.0, 6.0, 10.0, 16.0, 15.0, 10.0, 18.0, 32.0, 45.0, 49.0, 61.0, 70.0, 92.0, 89.0, 90.0, 63.0, 67.0, 54.0, 36.0, 40.0, 39.0, 18.0, 10.0, 16.0, 9.0, 7.0, 7.0, 7.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.014108657836914e-05, -5.79003244638443e-05, -5.565956234931946e-05, -5.341880023479462e-05, -5.1178038120269775e-05, -4.8937276005744934e-05, -4.669651389122009e-05, -4.445575177669525e-05, -4.221498966217041e-05, -3.997422754764557e-05, -3.773346543312073e-05, -3.5492703318595886e-05, -3.3251941204071045e-05, -3.1011179089546204e-05, -2.8770416975021362e-05, -2.652965486049652e-05, -2.428889274597168e-05, -2.204813063144684e-05, -1.9807368516921997e-05, -1.7566606402397156e-05, -1.5325844287872314e-05, -1.3085082173347473e-05, -1.0844320058822632e-05, -8.60355794429779e-06, -6.362795829772949e-06, -4.122033715248108e-06, -1.8812716007232666e-06, 3.594905138015747e-07, 2.600252628326416e-06, 4.841014742851257e-06, 7.081776857376099e-06, 9.32253897190094e-06, 1.1563301086425781e-05, 1.3804063200950623e-05, 1.6044825315475464e-05, 1.8285587430000305e-05, 2.0526349544525146e-05, 2.2767111659049988e-05, 2.500787377357483e-05, 2.724863588809967e-05, 2.9489398002624512e-05, 3.173016011714935e-05, 3.3970922231674194e-05, 3.6211684346199036e-05, 3.845244646072388e-05, 4.069320857524872e-05, 4.293397068977356e-05, 4.51747328042984e-05, 4.741549491882324e-05, 4.9656257033348083e-05, 5.1897019147872925e-05, 5.4137781262397766e-05, 5.637854337692261e-05, 5.861930549144745e-05, 6.086006760597229e-05, 6.310082972049713e-05, 6.534159183502197e-05, 6.758235394954681e-05, 6.982311606407166e-05, 7.20638781785965e-05, 7.430464029312134e-05, 7.654540240764618e-05, 7.878616452217102e-05, 8.102692663669586e-05, 8.32676887512207e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 11.0, 8.0, 14.0, 12.0, 16.0, 31.0, 41.0, 58.0, 96.0, 181.0, 299.0, 491.0, 1025.0, 2258.0, 4911.0, 12290.0, 34506.0, 119699.0, 532422.0, 247637.0, 59665.0, 19322.0, 7224.0, 3189.0, 1458.0, 714.0, 380.0, 229.0, 128.0, 77.0, 57.0, 30.0, 22.0, 16.0, 11.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.02006840705871582, -0.01941537857055664, -0.01876235008239746, -0.01810932159423828, -0.0174562931060791, -0.016803264617919922, -0.016150236129760742, -0.015497207641601562, -0.014844179153442383, -0.014191150665283203, -0.013538122177124023, -0.012885093688964844, -0.012232065200805664, -0.011579036712646484, -0.010926008224487305, -0.010272979736328125, -0.009619951248168945, -0.008966922760009766, -0.008313894271850586, -0.007660865783691406, -0.0070078372955322266, -0.006354808807373047, -0.005701780319213867, -0.0050487518310546875, -0.004395723342895508, -0.003742694854736328, -0.0030896663665771484, -0.0024366378784179688, -0.001783609390258789, -0.0011305809020996094, -0.0004775524139404297, 0.00017547607421875, 0.0008285045623779297, 0.0014815330505371094, 0.002134561538696289, 0.0027875900268554688, 0.0034406185150146484, 0.004093647003173828, 0.004746675491333008, 0.0053997039794921875, 0.006052732467651367, 0.006705760955810547, 0.0073587894439697266, 0.008011817932128906, 0.008664846420288086, 0.009317874908447266, 0.009970903396606445, 0.010623931884765625, 0.011276960372924805, 0.011929988861083984, 0.012583017349243164, 0.013236045837402344, 0.013889074325561523, 0.014542102813720703, 0.015195131301879883, 0.015848159790039062, 0.016501188278198242, 0.017154216766357422, 0.0178072452545166, 0.01846027374267578, 0.01911330223083496, 0.01976633071899414, 0.02041935920715332, 0.0210723876953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 12.0, 14.0, 15.0, 33.0, 34.0, 36.0, 55.0, 83.0, 103.0, 117.0, 91.0, 79.0, 74.0, 41.0, 40.0, 34.0, 20.0, 28.0, 11.0, 9.0, 9.0, 5.0, 7.0, 4.0, 7.0, 3.0, 3.0, 0.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.014934778213500977, -0.014244556427001953, -0.01355433464050293, -0.012864112854003906, -0.012173891067504883, -0.01148366928100586, -0.010793447494506836, -0.010103225708007812, -0.009413003921508789, -0.008722782135009766, -0.008032560348510742, -0.007342338562011719, -0.006652116775512695, -0.005961894989013672, -0.0052716732025146484, -0.004581451416015625, -0.0038912296295166016, -0.003201007843017578, -0.0025107860565185547, -0.0018205642700195312, -0.0011303424835205078, -0.0004401206970214844, 0.00025010108947753906, 0.0009403228759765625, 0.001630544662475586, 0.0023207664489746094, 0.003010988235473633, 0.0037012100219726562, 0.00439143180847168, 0.005081653594970703, 0.0057718753814697266, 0.00646209716796875, 0.0071523189544677734, 0.007842540740966797, 0.00853276252746582, 0.009222984313964844, 0.009913206100463867, 0.01060342788696289, 0.011293649673461914, 0.011983871459960938, 0.012674093246459961, 0.013364315032958984, 0.014054536819458008, 0.014744758605957031, 0.015434980392456055, 0.016125202178955078, 0.0168154239654541, 0.017505645751953125, 0.01819586753845215, 0.018886089324951172, 0.019576311111450195, 0.02026653289794922, 0.020956754684448242, 0.021646976470947266, 0.02233719825744629, 0.023027420043945312, 0.023717641830444336, 0.02440786361694336, 0.025098085403442383, 0.025788307189941406, 0.02647852897644043, 0.027168750762939453, 0.027858972549438477, 0.0285491943359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 21.0, 47.0, 151.0, 278.0, 275.0, 145.0, 54.0, 17.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6444089412689209, -0.6295187473297119, -0.6146285533905029, -0.599738359451294, -0.584848165512085, -0.569957971572876, -0.555067777633667, -0.540177583694458, -0.5252873301506042, -0.5103971362113953, -0.4955069422721863, -0.4806167483329773, -0.4657265245914459, -0.45083633065223694, -0.43594613671302795, -0.42105594277381897, -0.4061657786369324, -0.3912755846977234, -0.3763853907585144, -0.3614951968193054, -0.34660497307777405, -0.33171477913856506, -0.3168245851993561, -0.3019343912601471, -0.2870441675186157, -0.27215397357940674, -0.25726377964019775, -0.24237357079982758, -0.2274833768606186, -0.2125931680202484, -0.19770297408103943, -0.18281278014183044, -0.16792258620262146, -0.15303239226341248, -0.1381421834230423, -0.12325198948383331, -0.10836179554462433, -0.09347159415483475, -0.07858139276504517, -0.06369119882583618, -0.0488009974360466, -0.03391079977154732, -0.019020600244402885, -0.004130400717258453, 0.01075979694724083, 0.025649994611740112, 0.040540196001529694, 0.05543038994073868, 0.07032059133052826, 0.08521079272031784, 0.10010098665952682, 0.1149911880493164, 0.1298813819885254, 0.14477157592773438, 0.15966178476810455, 0.17455197870731354, 0.18944218754768372, 0.2043323814868927, 0.21922259032726288, 0.23411278426647186, 0.24900297820568085, 0.263893187046051, 0.27878338098526, 0.293673574924469, 0.308563768863678]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 10.0, 10.0, 16.0, 14.0, 25.0, 21.0, 25.0, 33.0, 33.0, 50.0, 37.0, 45.0, 51.0, 62.0, 51.0, 43.0, 49.0, 56.0, 67.0, 42.0, 49.0, 38.0, 42.0, 25.0, 19.0, 24.0, 21.0, 19.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2123175859451294, -0.20689621567726135, -0.2014748454093933, -0.19605349004268646, -0.19063211977481842, -0.18521074950695038, -0.17978939414024353, -0.1743680238723755, -0.16894665360450745, -0.1635252833366394, -0.15810391306877136, -0.15268255770206451, -0.14726118743419647, -0.14183981716632843, -0.13641846179962158, -0.13099709153175354, -0.1255757212638855, -0.12015435099601746, -0.11473298817873001, -0.10931162536144257, -0.10389025509357452, -0.09846888482570648, -0.09304752200841904, -0.08762615919113159, -0.08220478892326355, -0.07678341865539551, -0.07136205583810806, -0.06594069302082062, -0.060519322752952576, -0.05509795621037483, -0.04967658966779709, -0.044255223125219345, -0.0388338565826416, -0.03341249004006386, -0.027991123497486115, -0.02256975695490837, -0.017148390412330627, -0.011727023869752884, -0.00630565732717514, -0.0008842907845973969, 0.004537075757980347, 0.00995844230055809, 0.015379808843135834, 0.020801175385713577, 0.02622254192829132, 0.031643908470869064, 0.03706527501344681, 0.04248664155602455, 0.047908008098602295, 0.05332937464118004, 0.05875074118375778, 0.06417210400104523, 0.06959347426891327, 0.07501484453678131, 0.08043620735406876, 0.0858575701713562, 0.09127894043922424, 0.09670031070709229, 0.10212167352437973, 0.10754303634166718, 0.11296440660953522, 0.11838577687740326, 0.1238071396946907, 0.12922850251197815, 0.1346498727798462]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 7.0, 16.0, 32.0, 162.0, 1028.0, 5436.0, 82677.0, 4078399.0, 23119.0, 2445.0, 719.0, 119.0, 47.0, 30.0, 14.0, 14.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11102294921875, -0.10769462585449219, -0.10436630249023438, -0.10103797912597656, -0.09770965576171875, -0.09438133239746094, -0.09105300903320312, -0.08772468566894531, -0.0843963623046875, -0.08106803894042969, -0.07773971557617188, -0.07441139221191406, -0.07108306884765625, -0.06775474548339844, -0.06442642211914062, -0.06109809875488281, -0.057769775390625, -0.05444145202636719, -0.051113128662109375, -0.04778480529785156, -0.04445648193359375, -0.04112815856933594, -0.037799835205078125, -0.03447151184082031, -0.0311431884765625, -0.027814865112304688, -0.024486541748046875, -0.021158218383789062, -0.01782989501953125, -0.014501571655273438, -0.011173248291015625, -0.007844924926757812, -0.0045166015625, -0.0011882781982421875, 0.002140045166015625, 0.0054683685302734375, 0.00879669189453125, 0.012125015258789062, 0.015453338623046875, 0.018781661987304688, 0.0221099853515625, 0.025438308715820312, 0.028766632080078125, 0.03209495544433594, 0.03542327880859375, 0.03875160217285156, 0.042079925537109375, 0.04540824890136719, 0.048736572265625, 0.05206489562988281, 0.055393218994140625, 0.05872154235839844, 0.06204986572265625, 0.06537818908691406, 0.06870651245117188, 0.07203483581542969, 0.0753631591796875, 0.07869148254394531, 0.08201980590820312, 0.08534812927246094, 0.08867645263671875, 0.09200477600097656, 0.09533309936523438, 0.09866142272949219, 0.10198974609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 13.0, 62.0, 172.0, 269.0, 272.0, 149.0, 54.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.0664663314819336, -0.06445121765136719, -0.06243610382080078, -0.060420989990234375, -0.05840587615966797, -0.05639076232910156, -0.054375648498535156, -0.05236053466796875, -0.050345420837402344, -0.04833030700683594, -0.04631519317626953, -0.044300079345703125, -0.04228496551513672, -0.04026985168457031, -0.038254737854003906, -0.0362396240234375, -0.034224510192871094, -0.03220939636230469, -0.03019428253173828, -0.028179168701171875, -0.02616405487060547, -0.024148941040039062, -0.022133827209472656, -0.02011871337890625, -0.018103599548339844, -0.016088485717773438, -0.014073371887207031, -0.012058258056640625, -0.010043144226074219, -0.008028030395507812, -0.006012916564941406, -0.003997802734375, -0.0019826889038085938, 3.24249267578125e-05, 0.0020475387573242188, 0.004062652587890625, 0.006077766418457031, 0.008092880249023438, 0.010107994079589844, 0.01212310791015625, 0.014138221740722656, 0.016153335571289062, 0.01816844940185547, 0.020183563232421875, 0.02219867706298828, 0.024213790893554688, 0.026228904724121094, 0.0282440185546875, 0.030259132385253906, 0.03227424621582031, 0.03428936004638672, 0.036304473876953125, 0.03831958770751953, 0.04033470153808594, 0.042349815368652344, 0.04436492919921875, 0.046380043029785156, 0.04839515686035156, 0.05041027069091797, 0.052425384521484375, 0.05444049835205078, 0.05645561218261719, 0.058470726013183594, 0.06048583984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 19.0, 35.0, 45.0, 73.0, 117.0, 292.0, 733.0, 2148.0, 9092.0, 72680.0, 3216072.0, 847756.0, 36649.0, 5876.0, 1546.0, 578.0, 245.0, 125.0, 65.0, 40.0, 25.0, 16.0, 11.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040802001953125, -0.03909158706665039, -0.03738117218017578, -0.03567075729370117, -0.03396034240722656, -0.03224992752075195, -0.030539512634277344, -0.028829097747802734, -0.027118682861328125, -0.025408267974853516, -0.023697853088378906, -0.021987438201904297, -0.020277023315429688, -0.018566608428955078, -0.01685619354248047, -0.01514577865600586, -0.01343536376953125, -0.01172494888305664, -0.010014533996582031, -0.008304119110107422, -0.0065937042236328125, -0.004883289337158203, -0.0031728744506835938, -0.0014624595642089844, 0.000247955322265625, 0.0019583702087402344, 0.0036687850952148438, 0.005379199981689453, 0.0070896148681640625, 0.008800029754638672, 0.010510444641113281, 0.01222085952758789, 0.0139312744140625, 0.01564168930053711, 0.01735210418701172, 0.019062519073486328, 0.020772933959960938, 0.022483348846435547, 0.024193763732910156, 0.025904178619384766, 0.027614593505859375, 0.029325008392333984, 0.031035423278808594, 0.0327458381652832, 0.03445625305175781, 0.03616666793823242, 0.03787708282470703, 0.03958749771118164, 0.04129791259765625, 0.04300832748413086, 0.04471874237060547, 0.04642915725708008, 0.04813957214355469, 0.0498499870300293, 0.051560401916503906, 0.053270816802978516, 0.054981231689453125, 0.056691646575927734, 0.058402061462402344, 0.06011247634887695, 0.06182289123535156, 0.06353330612182617, 0.06524372100830078, 0.06695413589477539, 0.06866455078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 7.0, 14.0, 16.0, 20.0, 38.0, 68.0, 109.0, 205.0, 442.0, 976.0, 1132.0, 481.0, 222.0, 133.0, 81.0, 53.0, 21.0, 20.0, 9.0, 12.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020751953125, -0.01960277557373047, -0.018453598022460938, -0.017304420471191406, -0.016155242919921875, -0.015006065368652344, -0.013856887817382812, -0.012707710266113281, -0.01155853271484375, -0.010409355163574219, -0.009260177612304688, -0.008111000061035156, -0.006961822509765625, -0.005812644958496094, -0.0046634674072265625, -0.0035142898559570312, -0.0023651123046875, -0.0012159347534179688, -6.67572021484375e-05, 0.0010824203491210938, 0.002231597900390625, 0.0033807754516601562, 0.0045299530029296875, 0.005679130554199219, 0.00682830810546875, 0.007977485656738281, 0.009126663208007812, 0.010275840759277344, 0.011425018310546875, 0.012574195861816406, 0.013723373413085938, 0.014872550964355469, 0.016021728515625, 0.01717090606689453, 0.018320083618164062, 0.019469261169433594, 0.020618438720703125, 0.021767616271972656, 0.022916793823242188, 0.02406597137451172, 0.02521514892578125, 0.02636432647705078, 0.027513504028320312, 0.028662681579589844, 0.029811859130859375, 0.030961036682128906, 0.03211021423339844, 0.03325939178466797, 0.0344085693359375, 0.03555774688720703, 0.03670692443847656, 0.037856101989746094, 0.039005279541015625, 0.040154457092285156, 0.04130363464355469, 0.04245281219482422, 0.04360198974609375, 0.04475116729736328, 0.04590034484863281, 0.047049522399902344, 0.048198699951171875, 0.049347877502441406, 0.05049705505371094, 0.05164623260498047, 0.05279541015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 6.0, 23.0, 48.0, 102.0, 169.0, 220.0, 180.0, 108.0, 63.0, 42.0, 15.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26920008659362793, -0.2613925039768219, -0.25358492136001587, -0.24577733874320984, -0.23796974122524261, -0.23016215860843658, -0.22235457599163055, -0.21454699337482452, -0.2067394107580185, -0.19893182814121246, -0.19112424552440643, -0.1833166480064392, -0.17550906538963318, -0.16770148277282715, -0.15989390015602112, -0.1520863175392151, -0.14427873492240906, -0.13647115230560303, -0.128663569688797, -0.12085597962141037, -0.11304839700460434, -0.10524080693721771, -0.09743322432041168, -0.08962564170360565, -0.08181804418563843, -0.0740104615688324, -0.06620287150144577, -0.05839528888463974, -0.05058770626783371, -0.04278011992573738, -0.03497253358364105, -0.027164950966835022, -0.01935736835002899, -0.011549783870577812, -0.003742198459804058, 0.004065386950969696, 0.011872971430420876, 0.019680555909872055, 0.027488142251968384, 0.035295724868774414, 0.04310331121087074, 0.05091089755296707, 0.0587184801697731, 0.06652607023715973, 0.07433365285396576, 0.08214123547077179, 0.08994881808757782, 0.09775640070438385, 0.10556399077177048, 0.11337157338857651, 0.12117916345596313, 0.12898674607276917, 0.1367943286895752, 0.14460191130638123, 0.15240949392318726, 0.1602170765399933, 0.1680246740579605, 0.17583225667476654, 0.18363983929157257, 0.1914474368095398, 0.19925501942634583, 0.20706260204315186, 0.21487018465995789, 0.22267776727676392, 0.23048534989356995]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 7.0, 12.0, 16.0, 10.0, 12.0, 10.0, 22.0, 22.0, 28.0, 27.0, 34.0, 32.0, 39.0, 41.0, 59.0, 38.0, 51.0, 50.0, 35.0, 36.0, 51.0, 36.0, 40.0, 37.0, 36.0, 22.0, 30.0, 25.0, 19.0, 19.0, 19.0, 16.0, 14.0, 8.0, 12.0, 2.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07784855365753174, -0.07550067454576492, -0.07315279543399811, -0.0708049088716507, -0.06845702975988388, -0.06610915064811707, -0.06376126408576965, -0.06141338497400284, -0.05906550586223602, -0.05671762675046921, -0.054369743913412094, -0.05202186107635498, -0.049673981964588165, -0.04732610285282135, -0.044978220015764236, -0.04263033717870712, -0.04028245806694031, -0.03793457895517349, -0.03558669611811638, -0.033238813281059265, -0.03089093416929245, -0.028543053194880486, -0.02619517222046852, -0.023847291246056557, -0.021499410271644592, -0.019151529297232628, -0.016803648322820663, -0.014455767348408699, -0.012107886373996735, -0.00976000539958477, -0.007412124425172806, -0.005064243450760841, -0.002716362476348877, -0.00036848150193691254, 0.001979399472475052, 0.004327280446887016, 0.006675161421298981, 0.009023042395710945, 0.01137092337012291, 0.013718804344534874, 0.01606668531894684, 0.018414566293358803, 0.020762447267770767, 0.02311032824218273, 0.025458209216594696, 0.02780609019100666, 0.030153971165418625, 0.03250185400247574, 0.034849733114242554, 0.03719761222600937, 0.03954549506306648, 0.041893377900123596, 0.04424125701189041, 0.04658913612365723, 0.04893701896071434, 0.051284901797771454, 0.05363278090953827, 0.055980660021305084, 0.0583285428583622, 0.06067642569541931, 0.06302430480718613, 0.06537218391895294, 0.06772007048130035, 0.07006794959306717, 0.07241582870483398]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 7.0, 5.0, 6.0, 12.0, 14.0, 13.0, 20.0, 19.0, 25.0, 46.0, 56.0, 63.0, 97.0, 118.0, 151.0, 255.0, 356.0, 624.0, 1271.0, 4342.0, 27039.0, 470384.0, 506842.0, 29136.0, 4422.0, 1331.0, 631.0, 331.0, 246.0, 176.0, 144.0, 95.0, 87.0, 48.0, 29.0, 26.0, 29.0, 17.0, 8.0, 8.0, 10.0, 7.0, 6.0, 1.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.08741950988769531, -0.08450698852539062, -0.08159446716308594, -0.07868194580078125, -0.07576942443847656, -0.07285690307617188, -0.06994438171386719, -0.0670318603515625, -0.06411933898925781, -0.061206817626953125, -0.05829429626464844, -0.05538177490234375, -0.05246925354003906, -0.049556732177734375, -0.04664421081542969, -0.043731689453125, -0.04081916809082031, -0.037906646728515625, -0.03499412536621094, -0.03208160400390625, -0.029169082641601562, -0.026256561279296875, -0.023344039916992188, -0.0204315185546875, -0.017518997192382812, -0.014606475830078125, -0.011693954467773438, -0.00878143310546875, -0.0058689117431640625, -0.002956390380859375, -4.38690185546875e-05, 0.00286865234375, 0.0057811737060546875, 0.008693695068359375, 0.011606216430664062, 0.01451873779296875, 0.017431259155273438, 0.020343780517578125, 0.023256301879882812, 0.0261688232421875, 0.029081344604492188, 0.031993865966796875, 0.03490638732910156, 0.03781890869140625, 0.04073143005371094, 0.043643951416015625, 0.04655647277832031, 0.049468994140625, 0.05238151550292969, 0.055294036865234375, 0.05820655822753906, 0.06111907958984375, 0.06403160095214844, 0.06694412231445312, 0.06985664367675781, 0.0727691650390625, 0.07568168640136719, 0.07859420776367188, 0.08150672912597656, 0.08441925048828125, 0.08733177185058594, 0.09024429321289062, 0.09315681457519531, 0.0960693359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 36.0, 122.0, 257.0, 280.0, 199.0, 79.0, 18.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.0635833740234375, -0.061553955078125, -0.0595245361328125, -0.0574951171875, -0.0554656982421875, -0.053436279296875, -0.0514068603515625, -0.04937744140625, -0.0473480224609375, -0.045318603515625, -0.0432891845703125, -0.041259765625, -0.0392303466796875, -0.037200927734375, -0.0351715087890625, -0.03314208984375, -0.0311126708984375, -0.029083251953125, -0.0270538330078125, -0.0250244140625, -0.0229949951171875, -0.020965576171875, -0.0189361572265625, -0.01690673828125, -0.0148773193359375, -0.012847900390625, -0.0108184814453125, -0.0087890625, -0.0067596435546875, -0.004730224609375, -0.0027008056640625, -0.00067138671875, 0.0013580322265625, 0.003387451171875, 0.0054168701171875, 0.0074462890625, 0.0094757080078125, 0.011505126953125, 0.0135345458984375, 0.01556396484375, 0.0175933837890625, 0.019622802734375, 0.0216522216796875, 0.023681640625, 0.0257110595703125, 0.027740478515625, 0.0297698974609375, 0.03179931640625, 0.0338287353515625, 0.035858154296875, 0.0378875732421875, 0.0399169921875, 0.0419464111328125, 0.043975830078125, 0.0460052490234375, 0.04803466796875, 0.0500640869140625, 0.052093505859375, 0.0541229248046875, 0.05615234375, 0.0581817626953125, 0.060211181640625, 0.0622406005859375, 0.06427001953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 10.0, 11.0, 20.0, 27.0, 27.0, 36.0, 71.0, 80.0, 164.0, 258.0, 528.0, 1123.0, 2765.0, 7903.0, 29241.0, 180646.0, 660421.0, 130453.0, 23337.0, 6813.0, 2408.0, 1030.0, 509.0, 269.0, 125.0, 83.0, 50.0, 37.0, 33.0, 13.0, 21.0, 12.0, 5.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06275653839111328, -0.06069374084472656, -0.058630943298339844, -0.056568145751953125, -0.054505348205566406, -0.05244255065917969, -0.05037975311279297, -0.04831695556640625, -0.04625415802001953, -0.04419136047363281, -0.042128562927246094, -0.040065765380859375, -0.038002967834472656, -0.03594017028808594, -0.03387737274169922, -0.0318145751953125, -0.02975177764892578, -0.027688980102539062, -0.025626182556152344, -0.023563385009765625, -0.021500587463378906, -0.019437789916992188, -0.01737499237060547, -0.01531219482421875, -0.013249397277832031, -0.011186599731445312, -0.009123802185058594, -0.007061004638671875, -0.004998207092285156, -0.0029354095458984375, -0.0008726119995117188, 0.001190185546875, 0.0032529830932617188, 0.0053157806396484375, 0.007378578186035156, 0.009441375732421875, 0.011504173278808594, 0.013566970825195312, 0.01562976837158203, 0.01769256591796875, 0.01975536346435547, 0.021818161010742188, 0.023880958557128906, 0.025943756103515625, 0.028006553649902344, 0.030069351196289062, 0.03213214874267578, 0.0341949462890625, 0.03625774383544922, 0.03832054138183594, 0.040383338928222656, 0.042446136474609375, 0.044508934020996094, 0.04657173156738281, 0.04863452911376953, 0.05069732666015625, 0.05276012420654297, 0.05482292175292969, 0.056885719299316406, 0.058948516845703125, 0.061011314392089844, 0.06307411193847656, 0.06513690948486328, 0.06719970703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 8.0, 18.0, 17.0, 23.0, 23.0, 44.0, 45.0, 64.0, 56.0, 75.0, 85.0, 81.0, 74.0, 69.0, 53.0, 55.0, 36.0, 28.0, 33.0, 25.0, 22.0, 14.0, 6.0, 11.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07574462890625, -0.0736093521118164, -0.07147407531738281, -0.06933879852294922, -0.06720352172851562, -0.06506824493408203, -0.06293296813964844, -0.060797691345214844, -0.05866241455078125, -0.056527137756347656, -0.05439186096191406, -0.05225658416748047, -0.050121307373046875, -0.04798603057861328, -0.04585075378417969, -0.043715476989746094, -0.0415802001953125, -0.039444923400878906, -0.03730964660644531, -0.03517436981201172, -0.033039093017578125, -0.03090381622314453, -0.028768539428710938, -0.026633262634277344, -0.02449798583984375, -0.022362709045410156, -0.020227432250976562, -0.01809215545654297, -0.015956878662109375, -0.013821601867675781, -0.011686325073242188, -0.009551048278808594, -0.007415771484375, -0.005280494689941406, -0.0031452178955078125, -0.0010099411010742188, 0.001125335693359375, 0.0032606124877929688, 0.0053958892822265625, 0.007531166076660156, 0.00966644287109375, 0.011801719665527344, 0.013936996459960938, 0.01607227325439453, 0.018207550048828125, 0.02034282684326172, 0.022478103637695312, 0.024613380432128906, 0.0267486572265625, 0.028883934020996094, 0.031019210815429688, 0.03315448760986328, 0.035289764404296875, 0.03742504119873047, 0.03956031799316406, 0.041695594787597656, 0.04383087158203125, 0.045966148376464844, 0.04810142517089844, 0.05023670196533203, 0.052371978759765625, 0.05450725555419922, 0.05664253234863281, 0.058777809143066406, 0.0609130859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 7.0, 12.0, 12.0, 11.0, 22.0, 23.0, 43.0, 47.0, 104.0, 123.0, 191.0, 307.0, 453.0, 764.0, 1214.0, 2145.0, 3689.0, 7085.0, 15204.0, 39846.0, 197014.0, 616290.0, 110158.0, 28067.0, 11822.0, 6001.0, 3150.0, 1837.0, 1046.0, 611.0, 439.0, 262.0, 157.0, 111.0, 78.0, 63.0, 41.0, 27.0, 12.0, 20.0, 11.0, 8.0, 12.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0338134765625, -0.03273487091064453, -0.03165626525878906, -0.030577659606933594, -0.029499053955078125, -0.028420448303222656, -0.027341842651367188, -0.02626323699951172, -0.02518463134765625, -0.02410602569580078, -0.023027420043945312, -0.021948814392089844, -0.020870208740234375, -0.019791603088378906, -0.018712997436523438, -0.01763439178466797, -0.0165557861328125, -0.015477180480957031, -0.014398574829101562, -0.013319969177246094, -0.012241363525390625, -0.011162757873535156, -0.010084152221679688, -0.009005546569824219, -0.00792694091796875, -0.006848335266113281, -0.0057697296142578125, -0.004691123962402344, -0.003612518310546875, -0.0025339126586914062, -0.0014553070068359375, -0.00037670135498046875, 0.000701904296875, 0.0017805099487304688, 0.0028591156005859375, 0.003937721252441406, 0.005016326904296875, 0.006094932556152344, 0.0071735382080078125, 0.008252143859863281, 0.00933074951171875, 0.010409355163574219, 0.011487960815429688, 0.012566566467285156, 0.013645172119140625, 0.014723777770996094, 0.015802383422851562, 0.01688098907470703, 0.0179595947265625, 0.01903820037841797, 0.020116806030273438, 0.021195411682128906, 0.022274017333984375, 0.023352622985839844, 0.024431228637695312, 0.02550983428955078, 0.02658843994140625, 0.02766704559326172, 0.028745651245117188, 0.029824256896972656, 0.030902862548828125, 0.031981468200683594, 0.03306007385253906, 0.03413867950439453, 0.03521728515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 10.0, 16.0, 15.0, 20.0, 27.0, 38.0, 53.0, 102.0, 133.0, 131.0, 124.0, 81.0, 59.0, 37.0, 35.0, 14.0, 17.0, 12.0, 5.0, 3.0, 2.0, 10.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0001157522201538086, -0.00011227652430534363, -0.00010880082845687866, -0.0001053251326084137, -0.00010184943675994873, -9.837374091148376e-05, -9.48980450630188e-05, -9.142234921455383e-05, -8.794665336608887e-05, -8.44709575176239e-05, -8.099526166915894e-05, -7.751956582069397e-05, -7.4043869972229e-05, -7.056817412376404e-05, -6.709247827529907e-05, -6.36167824268341e-05, -6.014108657836914e-05, -5.6665390729904175e-05, -5.318969488143921e-05, -4.971399903297424e-05, -4.623830318450928e-05, -4.276260733604431e-05, -3.9286911487579346e-05, -3.581121563911438e-05, -3.2335519790649414e-05, -2.8859823942184448e-05, -2.5384128093719482e-05, -2.1908432245254517e-05, -1.843273639678955e-05, -1.4957040548324585e-05, -1.1481344699859619e-05, -8.005648851394653e-06, -4.5299530029296875e-06, -1.0542571544647217e-06, 2.421438694000244e-06, 5.89713454246521e-06, 9.372830390930176e-06, 1.2848526239395142e-05, 1.6324222087860107e-05, 1.9799917936325073e-05, 2.327561378479004e-05, 2.6751309633255005e-05, 3.022700548171997e-05, 3.3702701330184937e-05, 3.71783971786499e-05, 4.065409302711487e-05, 4.4129788875579834e-05, 4.76054847240448e-05, 5.1081180572509766e-05, 5.455687642097473e-05, 5.80325722694397e-05, 6.150826811790466e-05, 6.498396396636963e-05, 6.84596598148346e-05, 7.193535566329956e-05, 7.541105151176453e-05, 7.888674736022949e-05, 8.236244320869446e-05, 8.583813905715942e-05, 8.931383490562439e-05, 9.278953075408936e-05, 9.626522660255432e-05, 9.974092245101929e-05, 0.00010321661829948425, 0.00010669231414794922]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 17.0, 9.0, 13.0, 19.0, 27.0, 46.0, 63.0, 110.0, 175.0, 292.0, 510.0, 896.0, 1631.0, 3054.0, 6403.0, 14139.0, 36953.0, 134264.0, 570816.0, 198034.0, 48151.0, 17447.0, 7570.0, 3589.0, 1922.0, 984.0, 558.0, 305.0, 209.0, 113.0, 63.0, 47.0, 27.0, 22.0, 14.0, 11.0, 14.0, 9.0, 3.0, 2.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.032318115234375, -0.031327247619628906, -0.030336380004882812, -0.02934551239013672, -0.028354644775390625, -0.02736377716064453, -0.026372909545898438, -0.025382041931152344, -0.02439117431640625, -0.023400306701660156, -0.022409439086914062, -0.02141857147216797, -0.020427703857421875, -0.01943683624267578, -0.018445968627929688, -0.017455101013183594, -0.0164642333984375, -0.015473365783691406, -0.014482498168945312, -0.013491630554199219, -0.012500762939453125, -0.011509895324707031, -0.010519027709960938, -0.009528160095214844, -0.00853729248046875, -0.007546424865722656, -0.0065555572509765625, -0.005564689636230469, -0.004573822021484375, -0.0035829544067382812, -0.0025920867919921875, -0.0016012191772460938, -0.0006103515625, 0.00038051605224609375, 0.0013713836669921875, 0.0023622512817382812, 0.003353118896484375, 0.004343986511230469, 0.0053348541259765625, 0.006325721740722656, 0.00731658935546875, 0.008307456970214844, 0.009298324584960938, 0.010289192199707031, 0.011280059814453125, 0.012270927429199219, 0.013261795043945312, 0.014252662658691406, 0.0152435302734375, 0.016234397888183594, 0.017225265502929688, 0.01821613311767578, 0.019207000732421875, 0.02019786834716797, 0.021188735961914062, 0.022179603576660156, 0.02317047119140625, 0.024161338806152344, 0.025152206420898438, 0.02614307403564453, 0.027133941650390625, 0.02812480926513672, 0.029115676879882812, 0.030106544494628906, 0.031097412109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 9.0, 11.0, 13.0, 27.0, 28.0, 62.0, 85.0, 124.0, 141.0, 144.0, 105.0, 71.0, 50.0, 31.0, 19.0, 16.0, 12.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265655517578125, -0.02535223960876465, -0.024138927459716797, -0.022925615310668945, -0.021712303161621094, -0.020498991012573242, -0.01928567886352539, -0.01807236671447754, -0.016859054565429688, -0.015645742416381836, -0.014432430267333984, -0.013219118118286133, -0.012005805969238281, -0.01079249382019043, -0.009579181671142578, -0.008365869522094727, -0.007152557373046875, -0.0059392452239990234, -0.004725933074951172, -0.0035126209259033203, -0.0022993087768554688, -0.0010859966278076172, 0.00012731552124023438, 0.001340627670288086, 0.0025539398193359375, 0.003767251968383789, 0.004980564117431641, 0.006193876266479492, 0.007407188415527344, 0.008620500564575195, 0.009833812713623047, 0.011047124862670898, 0.01226043701171875, 0.013473749160766602, 0.014687061309814453, 0.015900373458862305, 0.017113685607910156, 0.018326997756958008, 0.01954030990600586, 0.02075362205505371, 0.021966934204101562, 0.023180246353149414, 0.024393558502197266, 0.025606870651245117, 0.02682018280029297, 0.02803349494934082, 0.029246807098388672, 0.030460119247436523, 0.031673431396484375, 0.03288674354553223, 0.03410005569458008, 0.03531336784362793, 0.03652667999267578, 0.03773999214172363, 0.038953304290771484, 0.040166616439819336, 0.04137992858886719, 0.04259324073791504, 0.04380655288696289, 0.04501986503601074, 0.046233177185058594, 0.047446489334106445, 0.0486598014831543, 0.04987311363220215, 0.05108642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 57.0, 165.0, 240.0, 243.0, 140.0, 54.0, 22.0, 14.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6857501864433289, -0.6677188873291016, -0.6496875286102295, -0.6316562294960022, -0.6136248707771301, -0.5955935716629028, -0.5775622129440308, -0.5595309138298035, -0.5414996147155762, -0.5234683156013489, -0.5054369568824768, -0.4874056279659271, -0.46937429904937744, -0.45134299993515015, -0.43331167101860046, -0.4152803421020508, -0.3972489833831787, -0.37921765446662903, -0.36118632555007935, -0.34315499663352966, -0.32512366771698, -0.3070923686027527, -0.289061039686203, -0.2710297107696533, -0.25299838185310364, -0.23496705293655396, -0.21693572402000427, -0.19890441000461578, -0.1808730810880661, -0.16284175217151642, -0.14481043815612793, -0.12677910923957825, -0.10874775052070618, -0.0907164216041565, -0.07268510013818741, -0.054653774946928024, -0.03662244975566864, -0.018591120839118958, -0.0005597993731498718, 0.017471522092819214, 0.035502851009368896, 0.05353417620062828, 0.07156550139188766, 0.08959682285785675, 0.10762815177440643, 0.12565948069095612, 0.1436907947063446, 0.1617221236228943, 0.17975345253944397, 0.19778478145599365, 0.21581611037254333, 0.23384742438793182, 0.2518787384033203, 0.2699100971221924, 0.2879413962364197, 0.30597272515296936, 0.32400405406951904, 0.3420353829860687, 0.3600667119026184, 0.3780980408191681, 0.3961293697357178, 0.41416066884994507, 0.43219199776649475, 0.45022332668304443, 0.4682546555995941]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 10.0, 10.0, 8.0, 19.0, 16.0, 32.0, 38.0, 38.0, 35.0, 44.0, 42.0, 45.0, 49.0, 59.0, 44.0, 41.0, 47.0, 54.0, 47.0, 50.0, 40.0, 31.0, 27.0, 35.0, 24.0, 30.0, 15.0, 14.0, 21.0, 7.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2079530954360962, -0.2026481330394745, -0.19734317064285278, -0.19203820824623108, -0.18673324584960938, -0.18142828345298767, -0.17612332105636597, -0.17081835865974426, -0.16551339626312256, -0.16020843386650085, -0.15490347146987915, -0.14959850907325745, -0.14429354667663574, -0.13898858428001404, -0.13368362188339233, -0.12837865948677063, -0.12307369709014893, -0.11776873469352722, -0.11246377229690552, -0.10715880990028381, -0.10185384750366211, -0.0965488851070404, -0.0912439227104187, -0.085938960313797, -0.08063399791717529, -0.07532903552055359, -0.07002407312393188, -0.06471911072731018, -0.05941414833068848, -0.05410918593406677, -0.04880422353744507, -0.043499261140823364, -0.03819429874420166, -0.032889336347579956, -0.027584373950958252, -0.022279411554336548, -0.016974449157714844, -0.01166948676109314, -0.0063645243644714355, -0.0010595619678497314, 0.004245400428771973, 0.009550362825393677, 0.01485532522201538, 0.020160287618637085, 0.02546525001525879, 0.030770212411880493, 0.0360751748085022, 0.0413801372051239, 0.046685099601745605, 0.05199006199836731, 0.057295024394989014, 0.06259998679161072, 0.06790494918823242, 0.07320991158485413, 0.07851487398147583, 0.08381983637809753, 0.08912479877471924, 0.09442976117134094, 0.09973472356796265, 0.10503968596458435, 0.11034464836120605, 0.11564961075782776, 0.12095457315444946, 0.12625953555107117, 0.13156449794769287]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 12.0, 29.0, 56.0, 281.0, 6266.0, 3995236.0, 190022.0, 2030.0, 217.0, 60.0, 28.0, 15.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21142578125, -0.2049884796142578, -0.19855117797851562, -0.19211387634277344, -0.18567657470703125, -0.17923927307128906, -0.17280197143554688, -0.1663646697998047, -0.1599273681640625, -0.1534900665283203, -0.14705276489257812, -0.14061546325683594, -0.13417816162109375, -0.12774085998535156, -0.12130355834960938, -0.11486625671386719, -0.108428955078125, -0.10199165344238281, -0.09555435180664062, -0.08911705017089844, -0.08267974853515625, -0.07624244689941406, -0.06980514526367188, -0.06336784362792969, -0.0569305419921875, -0.05049324035644531, -0.044055938720703125, -0.03761863708496094, -0.03118133544921875, -0.024744033813476562, -0.018306732177734375, -0.011869430541992188, -0.00543212890625, 0.0010051727294921875, 0.007442474365234375, 0.013879776000976562, 0.02031707763671875, 0.026754379272460938, 0.033191680908203125, 0.03962898254394531, 0.0460662841796875, 0.05250358581542969, 0.058940887451171875, 0.06537818908691406, 0.07181549072265625, 0.07825279235839844, 0.08469009399414062, 0.09112739562988281, 0.097564697265625, 0.10400199890136719, 0.11043930053710938, 0.11687660217285156, 0.12331390380859375, 0.12975120544433594, 0.13618850708007812, 0.1426258087158203, 0.1490631103515625, 0.1555004119873047, 0.16193771362304688, 0.16837501525878906, 0.17481231689453125, 0.18124961853027344, 0.18768692016601562, 0.1941242218017578, 0.2005615234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 28.0, 78.0, 145.0, 263.0, 222.0, 169.0, 69.0, 17.0, 12.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06427001953125, -0.06232309341430664, -0.06037616729736328, -0.05842924118041992, -0.05648231506347656, -0.0545353889465332, -0.052588462829589844, -0.050641536712646484, -0.048694610595703125, -0.046747684478759766, -0.044800758361816406, -0.04285383224487305, -0.04090690612792969, -0.03895998001098633, -0.03701305389404297, -0.03506612777709961, -0.03311920166015625, -0.03117227554321289, -0.02922534942626953, -0.027278423309326172, -0.025331497192382812, -0.023384571075439453, -0.021437644958496094, -0.019490718841552734, -0.017543792724609375, -0.015596866607666016, -0.013649940490722656, -0.011703014373779297, -0.009756088256835938, -0.007809162139892578, -0.005862236022949219, -0.003915309906005859, -0.0019683837890625, -2.1457672119140625e-05, 0.0019254684448242188, 0.003872394561767578, 0.0058193206787109375, 0.007766246795654297, 0.009713172912597656, 0.011660099029541016, 0.013607025146484375, 0.015553951263427734, 0.017500877380371094, 0.019447803497314453, 0.021394729614257812, 0.023341655731201172, 0.02528858184814453, 0.02723550796508789, 0.02918243408203125, 0.03112936019897461, 0.03307628631591797, 0.03502321243286133, 0.03697013854980469, 0.03891706466674805, 0.040863990783691406, 0.042810916900634766, 0.044757843017578125, 0.046704769134521484, 0.048651695251464844, 0.0505986213684082, 0.05254554748535156, 0.05449247360229492, 0.05643939971923828, 0.05838632583618164, 0.060333251953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 6.0, 6.0, 3.0, 11.0, 22.0, 32.0, 47.0, 58.0, 115.0, 207.0, 402.0, 723.0, 1529.0, 3472.0, 8619.0, 25737.0, 110515.0, 1891349.0, 1996565.0, 113306.0, 25977.0, 8797.0, 3489.0, 1542.0, 828.0, 375.0, 214.0, 127.0, 76.0, 45.0, 26.0, 22.0, 14.0, 13.0, 11.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0555419921875, -0.05399942398071289, -0.05245685577392578, -0.05091428756713867, -0.04937171936035156, -0.04782915115356445, -0.046286582946777344, -0.044744014739990234, -0.043201446533203125, -0.041658878326416016, -0.040116310119628906, -0.0385737419128418, -0.03703117370605469, -0.03548860549926758, -0.03394603729248047, -0.03240346908569336, -0.03086090087890625, -0.02931833267211914, -0.02777576446533203, -0.026233196258544922, -0.024690628051757812, -0.023148059844970703, -0.021605491638183594, -0.020062923431396484, -0.018520355224609375, -0.016977787017822266, -0.015435218811035156, -0.013892650604248047, -0.012350082397460938, -0.010807514190673828, -0.009264945983886719, -0.007722377777099609, -0.0061798095703125, -0.004637241363525391, -0.0030946731567382812, -0.0015521049499511719, -9.5367431640625e-06, 0.0015330314636230469, 0.0030755996704101562, 0.004618167877197266, 0.006160736083984375, 0.007703304290771484, 0.009245872497558594, 0.010788440704345703, 0.012331008911132812, 0.013873577117919922, 0.015416145324707031, 0.01695871353149414, 0.01850128173828125, 0.02004384994506836, 0.02158641815185547, 0.023128986358642578, 0.024671554565429688, 0.026214122772216797, 0.027756690979003906, 0.029299259185791016, 0.030841827392578125, 0.032384395599365234, 0.033926963806152344, 0.03546953201293945, 0.03701210021972656, 0.03855466842651367, 0.04009723663330078, 0.04163980484008789, 0.043182373046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 16.0, 22.0, 28.0, 42.0, 59.0, 104.0, 143.0, 237.0, 475.0, 1034.0, 944.0, 353.0, 204.0, 113.0, 80.0, 42.0, 38.0, 32.0, 18.0, 19.0, 12.0, 9.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03314208984375, -0.03186225891113281, -0.030582427978515625, -0.029302597045898438, -0.02802276611328125, -0.026742935180664062, -0.025463104248046875, -0.024183273315429688, -0.0229034423828125, -0.021623611450195312, -0.020343780517578125, -0.019063949584960938, -0.01778411865234375, -0.016504287719726562, -0.015224456787109375, -0.013944625854492188, -0.012664794921875, -0.011384963989257812, -0.010105133056640625, -0.008825302124023438, -0.00754547119140625, -0.0062656402587890625, -0.004985809326171875, -0.0037059783935546875, -0.0024261474609375, -0.0011463165283203125, 0.000133514404296875, 0.0014133453369140625, 0.00269317626953125, 0.0039730072021484375, 0.005252838134765625, 0.0065326690673828125, 0.0078125, 0.009092330932617188, 0.010372161865234375, 0.011651992797851562, 0.01293182373046875, 0.014211654663085938, 0.015491485595703125, 0.016771316528320312, 0.0180511474609375, 0.019330978393554688, 0.020610809326171875, 0.021890640258789062, 0.02317047119140625, 0.024450302124023438, 0.025730133056640625, 0.027009963989257812, 0.028289794921875, 0.029569625854492188, 0.030849456787109375, 0.03212928771972656, 0.03340911865234375, 0.03468894958496094, 0.035968780517578125, 0.03724861145019531, 0.0385284423828125, 0.03980827331542969, 0.041088104248046875, 0.04236793518066406, 0.04364776611328125, 0.04492759704589844, 0.046207427978515625, 0.04748725891113281, 0.04876708984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 5.0, 16.0, 59.0, 122.0, 250.0, 277.0, 177.0, 59.0, 19.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40764015913009644, -0.39084571599960327, -0.3740512728691101, -0.35725682973861694, -0.3404623866081238, -0.3236679434776306, -0.30687350034713745, -0.2900790572166443, -0.2732846140861511, -0.25649017095565796, -0.2396957278251648, -0.22290128469467163, -0.20610684156417847, -0.1893123984336853, -0.17251795530319214, -0.15572351217269897, -0.1389290690422058, -0.12213462591171265, -0.10534018278121948, -0.08854573965072632, -0.07175129652023315, -0.05495685338973999, -0.038162410259246826, -0.021367967128753662, -0.004573523998260498, 0.012220919132232666, 0.02901536226272583, 0.045809805393218994, 0.06260424852371216, 0.07939869165420532, 0.09619313478469849, 0.11298757791519165, 0.1297820806503296, 0.14657652378082275, 0.16337096691131592, 0.18016541004180908, 0.19695985317230225, 0.2137542963027954, 0.23054873943328857, 0.24734318256378174, 0.2641376256942749, 0.28093206882476807, 0.29772651195526123, 0.3145209550857544, 0.33131539821624756, 0.3481098413467407, 0.3649042844772339, 0.38169872760772705, 0.3984931707382202, 0.4152876138687134, 0.43208205699920654, 0.4488765001296997, 0.46567094326019287, 0.48246538639068604, 0.4992598295211792, 0.5160542726516724, 0.5328487157821655, 0.5496431589126587, 0.5664376020431519, 0.583232045173645, 0.6000264883041382, 0.6168209314346313, 0.6336153745651245, 0.6504098176956177, 0.6672042608261108]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 11.0, 8.0, 11.0, 13.0, 15.0, 19.0, 29.0, 33.0, 38.0, 42.0, 47.0, 54.0, 56.0, 59.0, 43.0, 51.0, 51.0, 44.0, 52.0, 45.0, 54.0, 39.0, 46.0, 25.0, 25.0, 26.0, 17.0, 12.0, 9.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13766473531723022, -0.13339976966381073, -0.12913478910923004, -0.12486982345581055, -0.12060485035181046, -0.11633987724781036, -0.11207491159439087, -0.10780993849039078, -0.10354496538639069, -0.0992799922823906, -0.0950150191783905, -0.09075005352497101, -0.08648508042097092, -0.08222010731697083, -0.07795514166355133, -0.07369016855955124, -0.06942519545555115, -0.06516022235155106, -0.06089525297284126, -0.05663028359413147, -0.05236531049013138, -0.04810033738613129, -0.043835368007421494, -0.0395703986287117, -0.03530542552471161, -0.031040454283356667, -0.026775483042001724, -0.022510511800646782, -0.01824554055929184, -0.013980569317936897, -0.009715598076581955, -0.005450626835227013, -0.0011856555938720703, 0.003079315647482872, 0.007344286888837814, 0.011609258130192757, 0.0158742293715477, 0.02013920061290264, 0.024404171854257584, 0.028669143095612526, 0.03293411433696747, 0.03719908744096756, 0.04146405681967735, 0.045729026198387146, 0.04999399930238724, 0.05425897240638733, 0.05852394178509712, 0.06278891116380692, 0.067053884267807, 0.0713188573718071, 0.07558383047580719, 0.07984879612922668, 0.08411376923322678, 0.08837874233722687, 0.09264370799064636, 0.09690868109464645, 0.10117365419864655, 0.10543862730264664, 0.10970360040664673, 0.11396856606006622, 0.11823353916406631, 0.1224985122680664, 0.1267634779214859, 0.1310284584760666, 0.13529342412948608]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 2.0, 8.0, 13.0, 13.0, 10.0, 14.0, 17.0, 32.0, 42.0, 64.0, 59.0, 75.0, 120.0, 176.0, 230.0, 304.0, 441.0, 729.0, 1792.0, 9417.0, 97134.0, 709832.0, 205619.0, 16990.0, 2637.0, 917.0, 524.0, 333.0, 258.0, 178.0, 122.0, 109.0, 78.0, 61.0, 39.0, 35.0, 21.0, 23.0, 21.0, 13.0, 13.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.117919921875, -0.11430740356445312, -0.11069488525390625, -0.10708236694335938, -0.1034698486328125, -0.09985733032226562, -0.09624481201171875, -0.09263229370117188, -0.089019775390625, -0.08540725708007812, -0.08179473876953125, -0.07818222045898438, -0.0745697021484375, -0.07095718383789062, -0.06734466552734375, -0.06373214721679688, -0.06011962890625, -0.056507110595703125, -0.05289459228515625, -0.049282073974609375, -0.0456695556640625, -0.042057037353515625, -0.03844451904296875, -0.034832000732421875, -0.031219482421875, -0.027606964111328125, -0.02399444580078125, -0.020381927490234375, -0.0167694091796875, -0.013156890869140625, -0.00954437255859375, -0.005931854248046875, -0.0023193359375, 0.001293182373046875, 0.00490570068359375, 0.008518218994140625, 0.0121307373046875, 0.015743255615234375, 0.01935577392578125, 0.022968292236328125, 0.026580810546875, 0.030193328857421875, 0.03380584716796875, 0.037418365478515625, 0.0410308837890625, 0.044643402099609375, 0.04825592041015625, 0.051868438720703125, 0.05548095703125, 0.059093475341796875, 0.06270599365234375, 0.06631851196289062, 0.0699310302734375, 0.07354354858398438, 0.07715606689453125, 0.08076858520507812, 0.084381103515625, 0.08799362182617188, 0.09160614013671875, 0.09521865844726562, 0.0988311767578125, 0.10244369506835938, 0.10605621337890625, 0.10966873168945312, 0.11328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 33.0, 82.0, 198.0, 251.0, 231.0, 134.0, 57.0, 7.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06656837463378906, -0.06447219848632812, -0.06237602233886719, -0.06027984619140625, -0.05818367004394531, -0.056087493896484375, -0.05399131774902344, -0.0518951416015625, -0.04979896545410156, -0.047702789306640625, -0.04560661315917969, -0.04351043701171875, -0.04141426086425781, -0.039318084716796875, -0.03722190856933594, -0.035125732421875, -0.03302955627441406, -0.030933380126953125, -0.028837203979492188, -0.02674102783203125, -0.024644851684570312, -0.022548675537109375, -0.020452499389648438, -0.0183563232421875, -0.016260147094726562, -0.014163970947265625, -0.012067794799804688, -0.00997161865234375, -0.007875442504882812, -0.005779266357421875, -0.0036830902099609375, -0.0015869140625, 0.0005092620849609375, 0.002605438232421875, 0.0047016143798828125, 0.00679779052734375, 0.008893966674804688, 0.010990142822265625, 0.013086318969726562, 0.0151824951171875, 0.017278671264648438, 0.019374847412109375, 0.021471023559570312, 0.02356719970703125, 0.025663375854492188, 0.027759552001953125, 0.029855728149414062, 0.031951904296875, 0.03404808044433594, 0.036144256591796875, 0.03824043273925781, 0.04033660888671875, 0.04243278503417969, 0.044528961181640625, 0.04662513732910156, 0.0487213134765625, 0.05081748962402344, 0.052913665771484375, 0.05500984191894531, 0.05710601806640625, 0.05920219421386719, 0.061298370361328125, 0.06339454650878906, 0.06549072265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 12.0, 12.0, 20.0, 31.0, 40.0, 61.0, 91.0, 154.0, 213.0, 401.0, 735.0, 1366.0, 2800.0, 5605.0, 13214.0, 32553.0, 90004.0, 256386.0, 379784.0, 167105.0, 58191.0, 21849.0, 9233.0, 4183.0, 2013.0, 1029.0, 570.0, 336.0, 217.0, 116.0, 70.0, 51.0, 31.0, 20.0, 11.0, 13.0, 5.0, 7.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.046234130859375, -0.0447077751159668, -0.043181419372558594, -0.04165506362915039, -0.04012870788574219, -0.038602352142333984, -0.03707599639892578, -0.03554964065551758, -0.034023284912109375, -0.03249692916870117, -0.03097057342529297, -0.029444217681884766, -0.027917861938476562, -0.02639150619506836, -0.024865150451660156, -0.023338794708251953, -0.02181243896484375, -0.020286083221435547, -0.018759727478027344, -0.01723337173461914, -0.015707015991210938, -0.014180660247802734, -0.012654304504394531, -0.011127948760986328, -0.009601593017578125, -0.008075237274169922, -0.006548881530761719, -0.005022525787353516, -0.0034961700439453125, -0.0019698143005371094, -0.00044345855712890625, 0.0010828971862792969, 0.0026092529296875, 0.004135608673095703, 0.005661964416503906, 0.007188320159912109, 0.008714675903320312, 0.010241031646728516, 0.011767387390136719, 0.013293743133544922, 0.014820098876953125, 0.016346454620361328, 0.01787281036376953, 0.019399166107177734, 0.020925521850585938, 0.02245187759399414, 0.023978233337402344, 0.025504589080810547, 0.02703094482421875, 0.028557300567626953, 0.030083656311035156, 0.03161001205444336, 0.03313636779785156, 0.034662723541259766, 0.03618907928466797, 0.03771543502807617, 0.039241790771484375, 0.04076814651489258, 0.04229450225830078, 0.043820858001708984, 0.04534721374511719, 0.04687356948852539, 0.048399925231933594, 0.0499262809753418, 0.05145263671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 5.0, 6.0, 2.0, 12.0, 15.0, 13.0, 13.0, 17.0, 30.0, 29.0, 19.0, 39.0, 43.0, 32.0, 46.0, 45.0, 45.0, 64.0, 47.0, 45.0, 44.0, 52.0, 45.0, 49.0, 41.0, 18.0, 20.0, 28.0, 21.0, 22.0, 9.0, 14.0, 12.0, 12.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.06365966796875, -0.061914920806884766, -0.06017017364501953, -0.0584254264831543, -0.05668067932128906, -0.05493593215942383, -0.053191184997558594, -0.05144643783569336, -0.049701690673828125, -0.04795694351196289, -0.046212196350097656, -0.04446744918823242, -0.04272270202636719, -0.04097795486450195, -0.03923320770263672, -0.037488460540771484, -0.03574371337890625, -0.033998966217041016, -0.03225421905517578, -0.030509471893310547, -0.028764724731445312, -0.027019977569580078, -0.025275230407714844, -0.02353048324584961, -0.021785736083984375, -0.02004098892211914, -0.018296241760253906, -0.016551494598388672, -0.014806747436523438, -0.013062000274658203, -0.011317253112792969, -0.009572505950927734, -0.0078277587890625, -0.006083011627197266, -0.004338264465332031, -0.002593517303466797, -0.0008487701416015625, 0.0008959770202636719, 0.0026407241821289062, 0.004385471343994141, 0.006130218505859375, 0.00787496566772461, 0.009619712829589844, 0.011364459991455078, 0.013109207153320312, 0.014853954315185547, 0.01659870147705078, 0.018343448638916016, 0.02008819580078125, 0.021832942962646484, 0.02357769012451172, 0.025322437286376953, 0.027067184448242188, 0.028811931610107422, 0.030556678771972656, 0.03230142593383789, 0.034046173095703125, 0.03579092025756836, 0.037535667419433594, 0.03928041458129883, 0.04102516174316406, 0.0427699089050293, 0.04451465606689453, 0.046259403228759766, 0.048004150390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 10.0, 10.0, 16.0, 38.0, 37.0, 38.0, 67.0, 127.0, 165.0, 278.0, 403.0, 660.0, 1092.0, 1791.0, 2958.0, 4959.0, 9104.0, 17958.0, 41065.0, 124373.0, 421920.0, 283575.0, 77785.0, 29042.0, 13567.0, 7134.0, 4019.0, 2372.0, 1466.0, 928.0, 564.0, 356.0, 217.0, 142.0, 116.0, 53.0, 49.0, 25.0, 18.0, 14.0, 12.0, 5.0, 10.0, 6.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0312042236328125, -0.03022313117980957, -0.02924203872680664, -0.02826094627380371, -0.02727985382080078, -0.02629876136779785, -0.025317668914794922, -0.024336576461791992, -0.023355484008789062, -0.022374391555786133, -0.021393299102783203, -0.020412206649780273, -0.019431114196777344, -0.018450021743774414, -0.017468929290771484, -0.016487836837768555, -0.015506744384765625, -0.014525651931762695, -0.013544559478759766, -0.012563467025756836, -0.011582374572753906, -0.010601282119750977, -0.009620189666748047, -0.008639097213745117, -0.0076580047607421875, -0.006676912307739258, -0.005695819854736328, -0.0047147274017333984, -0.0037336349487304688, -0.002752542495727539, -0.0017714500427246094, -0.0007903575897216797, 0.00019073486328125, 0.0011718273162841797, 0.0021529197692871094, 0.003134012222290039, 0.004115104675292969, 0.0050961971282958984, 0.006077289581298828, 0.007058382034301758, 0.008039474487304688, 0.009020566940307617, 0.010001659393310547, 0.010982751846313477, 0.011963844299316406, 0.012944936752319336, 0.013926029205322266, 0.014907121658325195, 0.015888214111328125, 0.016869306564331055, 0.017850399017333984, 0.018831491470336914, 0.019812583923339844, 0.020793676376342773, 0.021774768829345703, 0.022755861282348633, 0.023736953735351562, 0.024718046188354492, 0.025699138641357422, 0.02668023109436035, 0.02766132354736328, 0.02864241600036621, 0.02962350845336914, 0.03060460090637207, 0.031585693359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 15.0, 7.0, 10.0, 8.0, 25.0, 18.0, 30.0, 24.0, 28.0, 41.0, 64.0, 70.0, 75.0, 65.0, 69.0, 72.0, 60.0, 51.0, 38.0, 40.0, 26.0, 18.0, 21.0, 15.0, 23.0, 11.0, 9.0, 5.0, 5.0, 3.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.94044104218483e-05, -5.765445530414581e-05, -5.590450018644333e-05, -5.4154545068740845e-05, -5.240458995103836e-05, -5.0654634833335876e-05, -4.890467971563339e-05, -4.715472459793091e-05, -4.5404769480228424e-05, -4.365481436252594e-05, -4.1904859244823456e-05, -4.015490412712097e-05, -3.840494900941849e-05, -3.6654993891716003e-05, -3.490503877401352e-05, -3.3155083656311035e-05, -3.140512853860855e-05, -2.9655173420906067e-05, -2.7905218303203583e-05, -2.61552631855011e-05, -2.4405308067798615e-05, -2.265535295009613e-05, -2.0905397832393646e-05, -1.9155442714691162e-05, -1.7405487596988678e-05, -1.5655532479286194e-05, -1.390557736158371e-05, -1.2155622243881226e-05, -1.0405667126178741e-05, -8.655712008476257e-06, -6.905756890773773e-06, -5.155801773071289e-06, -3.405846655368805e-06, -1.6558915376663208e-06, 9.406358003616333e-08, 1.8440186977386475e-06, 3.5939738154411316e-06, 5.343928933143616e-06, 7.0938840508461e-06, 8.843839168548584e-06, 1.0593794286251068e-05, 1.2343749403953552e-05, 1.4093704521656036e-05, 1.584365963935852e-05, 1.7593614757061005e-05, 1.934356987476349e-05, 2.1093524992465973e-05, 2.2843480110168457e-05, 2.459343522787094e-05, 2.6343390345573425e-05, 2.809334546327591e-05, 2.9843300580978394e-05, 3.159325569868088e-05, 3.334321081638336e-05, 3.5093165934085846e-05, 3.684312105178833e-05, 3.8593076169490814e-05, 4.03430312871933e-05, 4.209298640489578e-05, 4.3842941522598267e-05, 4.559289664030075e-05, 4.7342851758003235e-05, 4.909280687570572e-05, 5.08427619934082e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 4.0, 4.0, 6.0, 12.0, 15.0, 12.0, 25.0, 35.0, 61.0, 92.0, 150.0, 251.0, 477.0, 890.0, 1598.0, 3085.0, 6175.0, 14714.0, 40575.0, 139522.0, 478903.0, 255429.0, 66606.0, 21999.0, 9042.0, 4178.0, 2073.0, 1138.0, 609.0, 356.0, 220.0, 99.0, 61.0, 42.0, 30.0, 25.0, 5.0, 7.0, 8.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0380859375, -0.03698873519897461, -0.03589153289794922, -0.03479433059692383, -0.03369712829589844, -0.03259992599487305, -0.031502723693847656, -0.030405521392822266, -0.029308319091796875, -0.028211116790771484, -0.027113914489746094, -0.026016712188720703, -0.024919509887695312, -0.023822307586669922, -0.02272510528564453, -0.02162790298461914, -0.02053070068359375, -0.01943349838256836, -0.01833629608154297, -0.017239093780517578, -0.016141891479492188, -0.015044689178466797, -0.013947486877441406, -0.012850284576416016, -0.011753082275390625, -0.010655879974365234, -0.009558677673339844, -0.008461475372314453, -0.0073642730712890625, -0.006267070770263672, -0.005169868469238281, -0.004072666168212891, -0.0029754638671875, -0.0018782615661621094, -0.0007810592651367188, 0.0003161430358886719, 0.0014133453369140625, 0.002510547637939453, 0.0036077499389648438, 0.004704952239990234, 0.005802154541015625, 0.006899356842041016, 0.007996559143066406, 0.009093761444091797, 0.010190963745117188, 0.011288166046142578, 0.012385368347167969, 0.01348257064819336, 0.01457977294921875, 0.01567697525024414, 0.01677417755126953, 0.017871379852294922, 0.018968582153320312, 0.020065784454345703, 0.021162986755371094, 0.022260189056396484, 0.023357391357421875, 0.024454593658447266, 0.025551795959472656, 0.026648998260498047, 0.027746200561523438, 0.028843402862548828, 0.02994060516357422, 0.03103780746459961, 0.032135009765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 3.0, 6.0, 13.0, 10.0, 10.0, 13.0, 18.0, 38.0, 21.0, 35.0, 32.0, 55.0, 72.0, 83.0, 92.0, 113.0, 73.0, 49.0, 51.0, 32.0, 25.0, 21.0, 21.0, 12.0, 10.0, 11.0, 11.0, 13.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0289764404296875, -0.02806711196899414, -0.02715778350830078, -0.026248455047607422, -0.025339126586914062, -0.024429798126220703, -0.023520469665527344, -0.022611141204833984, -0.021701812744140625, -0.020792484283447266, -0.019883155822753906, -0.018973827362060547, -0.018064498901367188, -0.017155170440673828, -0.01624584197998047, -0.01533651351928711, -0.01442718505859375, -0.01351785659790039, -0.012608528137207031, -0.011699199676513672, -0.010789871215820312, -0.009880542755126953, -0.008971214294433594, -0.008061885833740234, -0.007152557373046875, -0.006243228912353516, -0.005333900451660156, -0.004424571990966797, -0.0035152435302734375, -0.002605915069580078, -0.0016965866088867188, -0.0007872581481933594, 0.0001220703125, 0.0010313987731933594, 0.0019407272338867188, 0.002850055694580078, 0.0037593841552734375, 0.004668712615966797, 0.005578041076660156, 0.006487369537353516, 0.007396697998046875, 0.008306026458740234, 0.009215354919433594, 0.010124683380126953, 0.011034011840820312, 0.011943340301513672, 0.012852668762207031, 0.01376199722290039, 0.01467132568359375, 0.01558065414428711, 0.01648998260498047, 0.017399311065673828, 0.018308639526367188, 0.019217967987060547, 0.020127296447753906, 0.021036624908447266, 0.021945953369140625, 0.022855281829833984, 0.023764610290527344, 0.024673938751220703, 0.025583267211914062, 0.026492595672607422, 0.02740192413330078, 0.02831125259399414, 0.0292205810546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 9.0, 17.0, 39.0, 71.0, 122.0, 157.0, 205.0, 139.0, 120.0, 60.0, 27.0, 16.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5905942916870117, -0.5747577548027039, -0.5589211583137512, -0.5430846214294434, -0.5272480249404907, -0.5114114880561829, -0.4955749213695526, -0.47973835468292236, -0.4639017879962921, -0.44806522130966187, -0.4322286546230316, -0.41639208793640137, -0.4005555510520935, -0.38471895456314087, -0.368882417678833, -0.35304585099220276, -0.3372092843055725, -0.32137271761894226, -0.305536150932312, -0.28969958424568176, -0.2738630175590515, -0.25802648067474365, -0.2421899139881134, -0.22635334730148315, -0.2105167806148529, -0.19468021392822266, -0.1788436472415924, -0.16300709545612335, -0.1471705287694931, -0.13133396208286285, -0.1154974028468132, -0.09966084361076355, -0.08382433652877808, -0.06798776984214783, -0.052151210606098175, -0.036314647644758224, -0.020478084683418274, -0.004641517996788025, 0.011195041239261627, 0.02703160047531128, 0.04286816716194153, 0.05870473012328148, 0.07454129308462143, 0.09037785232067108, 0.10621441900730133, 0.12205098569393158, 0.13788753747940063, 0.15372410416603088, 0.16956067085266113, 0.18539723753929138, 0.20123380422592163, 0.21707035601139069, 0.23290692269802094, 0.24874348938465118, 0.26458004117012024, 0.2804166078567505, 0.29625317454338074, 0.312089741230011, 0.32792630791664124, 0.3437628746032715, 0.35959941148757935, 0.375436007976532, 0.39127254486083984, 0.4071091115474701, 0.42294567823410034]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 13.0, 8.0, 16.0, 12.0, 18.0, 23.0, 26.0, 44.0, 25.0, 46.0, 52.0, 51.0, 44.0, 50.0, 56.0, 46.0, 54.0, 42.0, 40.0, 49.0, 30.0, 32.0, 41.0, 37.0, 27.0, 20.0, 20.0, 13.0, 14.0, 10.0, 8.0, 2.0, 3.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.23809468746185303, -0.23166514933109283, -0.22523559629917145, -0.21880605816841125, -0.21237650513648987, -0.20594696700572968, -0.19951742887496948, -0.1930878758430481, -0.1866583377122879, -0.1802287995815277, -0.17379924654960632, -0.16736970841884613, -0.16094017028808594, -0.15451061725616455, -0.14808107912540436, -0.14165154099464417, -0.13522198796272278, -0.12879244983196259, -0.1223628968000412, -0.115933358669281, -0.10950381308794022, -0.10307426750659943, -0.09664472937583923, -0.09021518379449844, -0.08378563821315765, -0.07735609263181686, -0.07092654705047607, -0.06449700891971588, -0.05806746333837509, -0.0516379177570343, -0.04520837590098381, -0.03877883404493332, -0.03234928846359253, -0.02591974474489689, -0.019490201026201248, -0.013060657307505608, -0.006631113588809967, -0.00020156800746917725, 0.006227973848581314, 0.012657515704631805, 0.019087061285972595, 0.025516605004668236, 0.031946148723363876, 0.03837569057941437, 0.04480523616075516, 0.05123478174209595, 0.05766432359814644, 0.06409386545419693, 0.07052341103553772, 0.07695295661687851, 0.0833825021982193, 0.08981204032897949, 0.09624158591032028, 0.10267113149166107, 0.10910066962242126, 0.11553021520376205, 0.12195976078510284, 0.12838929891586304, 0.13481885194778442, 0.14124839007854462, 0.1476779282093048, 0.1541074812412262, 0.1605370193719864, 0.16696655750274658, 0.17339611053466797]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 13.0, 38.0, 118.0, 707.0, 12676.0, 3952871.0, 223890.0, 3506.0, 266.0, 104.0, 37.0, 17.0, 7.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.187744140625, -0.1820220947265625, -0.176300048828125, -0.1705780029296875, -0.16485595703125, -0.1591339111328125, -0.153411865234375, -0.1476898193359375, -0.1419677734375, -0.1362457275390625, -0.130523681640625, -0.1248016357421875, -0.11907958984375, -0.1133575439453125, -0.107635498046875, -0.1019134521484375, -0.09619140625, -0.0904693603515625, -0.084747314453125, -0.0790252685546875, -0.07330322265625, -0.0675811767578125, -0.061859130859375, -0.0561370849609375, -0.0504150390625, -0.0446929931640625, -0.038970947265625, -0.0332489013671875, -0.02752685546875, -0.0218048095703125, -0.016082763671875, -0.0103607177734375, -0.004638671875, 0.0010833740234375, 0.006805419921875, 0.0125274658203125, 0.01824951171875, 0.0239715576171875, 0.029693603515625, 0.0354156494140625, 0.0411376953125, 0.0468597412109375, 0.052581787109375, 0.0583038330078125, 0.06402587890625, 0.0697479248046875, 0.075469970703125, 0.0811920166015625, 0.0869140625, 0.0926361083984375, 0.098358154296875, 0.1040802001953125, 0.10980224609375, 0.1155242919921875, 0.121246337890625, 0.1269683837890625, 0.1326904296875, 0.1384124755859375, 0.144134521484375, 0.1498565673828125, 0.15557861328125, 0.1613006591796875, 0.167022705078125, 0.1727447509765625, 0.178466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 24.0, 62.0, 99.0, 177.0, 209.0, 174.0, 148.0, 70.0, 25.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06283092498779297, -0.06078147888183594, -0.058732032775878906, -0.056682586669921875, -0.054633140563964844, -0.05258369445800781, -0.05053424835205078, -0.04848480224609375, -0.04643535614013672, -0.04438591003417969, -0.042336463928222656, -0.040287017822265625, -0.038237571716308594, -0.03618812561035156, -0.03413867950439453, -0.0320892333984375, -0.03003978729248047, -0.027990341186523438, -0.025940895080566406, -0.023891448974609375, -0.021842002868652344, -0.019792556762695312, -0.01774311065673828, -0.01569366455078125, -0.013644218444824219, -0.011594772338867188, -0.009545326232910156, -0.007495880126953125, -0.005446434020996094, -0.0033969879150390625, -0.0013475418090820312, 0.000701904296875, 0.0027513504028320312, 0.0048007965087890625, 0.006850242614746094, 0.008899688720703125, 0.010949134826660156, 0.012998580932617188, 0.015048027038574219, 0.01709747314453125, 0.01914691925048828, 0.021196365356445312, 0.023245811462402344, 0.025295257568359375, 0.027344703674316406, 0.029394149780273438, 0.03144359588623047, 0.0334930419921875, 0.03554248809814453, 0.03759193420410156, 0.039641380310058594, 0.041690826416015625, 0.043740272521972656, 0.04578971862792969, 0.04783916473388672, 0.04988861083984375, 0.05193805694580078, 0.05398750305175781, 0.056036949157714844, 0.058086395263671875, 0.060135841369628906, 0.06218528747558594, 0.06423473358154297, 0.0662841796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 15.0, 26.0, 27.0, 67.0, 121.0, 201.0, 420.0, 941.0, 2171.0, 6124.0, 22284.0, 133848.0, 3365117.0, 592344.0, 52362.0, 11719.0, 3760.0, 1450.0, 618.0, 301.0, 162.0, 73.0, 34.0, 39.0, 18.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0916748046875, -0.08953094482421875, -0.0873870849609375, -0.08524322509765625, -0.083099365234375, -0.08095550537109375, -0.0788116455078125, -0.07666778564453125, -0.07452392578125, -0.07238006591796875, -0.0702362060546875, -0.06809234619140625, -0.065948486328125, -0.06380462646484375, -0.0616607666015625, -0.05951690673828125, -0.057373046875, -0.05522918701171875, -0.0530853271484375, -0.05094146728515625, -0.048797607421875, -0.04665374755859375, -0.0445098876953125, -0.04236602783203125, -0.04022216796875, -0.03807830810546875, -0.0359344482421875, -0.03379058837890625, -0.031646728515625, -0.02950286865234375, -0.0273590087890625, -0.02521514892578125, -0.0230712890625, -0.02092742919921875, -0.0187835693359375, -0.01663970947265625, -0.014495849609375, -0.01235198974609375, -0.0102081298828125, -0.00806427001953125, -0.00592041015625, -0.00377655029296875, -0.0016326904296875, 0.00051116943359375, 0.002655029296875, 0.00479888916015625, 0.0069427490234375, 0.00908660888671875, 0.01123046875, 0.01337432861328125, 0.0155181884765625, 0.01766204833984375, 0.019805908203125, 0.02194976806640625, 0.0240936279296875, 0.02623748779296875, 0.02838134765625, 0.03052520751953125, 0.0326690673828125, 0.03481292724609375, 0.036956787109375, 0.03910064697265625, 0.0412445068359375, 0.04338836669921875, 0.0455322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 7.0, 14.0, 19.0, 15.0, 26.0, 30.0, 41.0, 69.0, 92.0, 135.0, 168.0, 328.0, 606.0, 919.0, 618.0, 309.0, 185.0, 116.0, 83.0, 60.0, 51.0, 36.0, 31.0, 19.0, 16.0, 9.0, 16.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028594970703125, -0.02755451202392578, -0.026514053344726562, -0.025473594665527344, -0.024433135986328125, -0.023392677307128906, -0.022352218627929688, -0.02131175994873047, -0.02027130126953125, -0.01923084259033203, -0.018190383911132812, -0.017149925231933594, -0.016109466552734375, -0.015069007873535156, -0.014028549194335938, -0.012988090515136719, -0.0119476318359375, -0.010907173156738281, -0.009866714477539062, -0.008826255798339844, -0.007785797119140625, -0.006745338439941406, -0.0057048797607421875, -0.004664421081542969, -0.00362396240234375, -0.0025835037231445312, -0.0015430450439453125, -0.0005025863647460938, 0.000537872314453125, 0.0015783309936523438, 0.0026187896728515625, 0.0036592483520507812, 0.00469970703125, 0.005740165710449219, 0.0067806243896484375, 0.007821083068847656, 0.008861541748046875, 0.009902000427246094, 0.010942459106445312, 0.011982917785644531, 0.01302337646484375, 0.014063835144042969, 0.015104293823242188, 0.016144752502441406, 0.017185211181640625, 0.018225669860839844, 0.019266128540039062, 0.02030658721923828, 0.0213470458984375, 0.02238750457763672, 0.023427963256835938, 0.024468421936035156, 0.025508880615234375, 0.026549339294433594, 0.027589797973632812, 0.02863025665283203, 0.02967071533203125, 0.03071117401123047, 0.03175163269042969, 0.032792091369628906, 0.033832550048828125, 0.034873008728027344, 0.03591346740722656, 0.03695392608642578, 0.037994384765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 21.0, 54.0, 136.0, 212.0, 249.0, 179.0, 80.0, 34.0, 13.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318085253238678, -0.30235299468040466, -0.28662076592445374, -0.2708885073661804, -0.2551562786102295, -0.23942402005195618, -0.22369176149368286, -0.20795951783657074, -0.19222727417945862, -0.1764950305223465, -0.16076278686523438, -0.14503052830696106, -0.12929828464984894, -0.11356604099273682, -0.0978337898850441, -0.08210153877735138, -0.06636929512023926, -0.05063704773783684, -0.03490480035543442, -0.019172552973031998, -0.0034403055906295776, 0.012291938066482544, 0.028024189174175262, 0.04375644028186798, 0.0594886839389801, 0.07522092759609222, 0.09095317870378494, 0.10668542981147766, 0.12241767346858978, 0.1381499171257019, 0.15388217568397522, 0.16961441934108734, 0.18534666299819946, 0.20107890665531158, 0.2168111503124237, 0.23254340887069702, 0.24827565252780914, 0.26400789618492126, 0.2797401547431946, 0.2954723834991455, 0.3112046420574188, 0.32693690061569214, 0.34266912937164307, 0.3584013879299164, 0.3741336464881897, 0.3898658752441406, 0.40559813380241394, 0.42133039236068726, 0.4370626211166382, 0.4527948796749115, 0.4685271084308624, 0.48425936698913574, 0.49999159574508667, 0.5157238245010376, 0.5314561128616333, 0.5471883416175842, 0.5629205703735352, 0.5786527991294861, 0.5943850874900818, 0.6101173162460327, 0.6258495450019836, 0.6415817737579346, 0.6573140621185303, 0.6730462908744812, 0.6887785792350769]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 13.0, 15.0, 16.0, 18.0, 24.0, 20.0, 29.0, 35.0, 32.0, 38.0, 48.0, 29.0, 47.0, 47.0, 46.0, 50.0, 50.0, 46.0, 38.0, 36.0, 41.0, 32.0, 28.0, 33.0, 24.0, 32.0, 13.0, 16.0, 17.0, 16.0, 17.0, 7.0, 10.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11295676231384277, -0.10939712077379227, -0.10583748668432236, -0.10227784514427185, -0.09871821105480194, -0.09515856951475143, -0.09159892797470093, -0.08803929388523102, -0.08447965234518051, -0.08092001080513, -0.0773603767156601, -0.07380073517560959, -0.07024109363555908, -0.06668145954608917, -0.06312181800603867, -0.05956218019127846, -0.05600254237651825, -0.05244290456175804, -0.04888326674699783, -0.04532362520694733, -0.04176398739218712, -0.03820434957742691, -0.034644708037376404, -0.031085070222616196, -0.027525432407855988, -0.02396579459309578, -0.020406154915690422, -0.016846515238285065, -0.013286877423524857, -0.009727239608764648, -0.006167599931359291, -0.0026079602539539337, 0.0009516775608062744, 0.004511316306889057, 0.00807095505297184, 0.011630593799054623, 0.015190232545137405, 0.018749870359897614, 0.02230951003730297, 0.025869149714708328, 0.029428787529468536, 0.032988425344228745, 0.03654806315898895, 0.04010770469903946, 0.04366734251379967, 0.047226980328559875, 0.05078662186861038, 0.05434625968337059, 0.0579058974981308, 0.061465535312891006, 0.06502517312765121, 0.06858481466770172, 0.07214444875717163, 0.07570409029722214, 0.07926373183727264, 0.08282336592674255, 0.08638300746679306, 0.08994264900684357, 0.09350228309631348, 0.09706192463636398, 0.10062156617641449, 0.1041812002658844, 0.1077408418059349, 0.11130048334598541, 0.11486011743545532]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 12.0, 9.0, 17.0, 33.0, 32.0, 55.0, 102.0, 127.0, 176.0, 316.0, 531.0, 1289.0, 4942.0, 36577.0, 429914.0, 518924.0, 46547.0, 5989.0, 1470.0, 581.0, 287.0, 199.0, 139.0, 84.0, 59.0, 41.0, 25.0, 17.0, 9.0, 12.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15074539184570312, -0.14572906494140625, -0.14071273803710938, -0.1356964111328125, -0.13068008422851562, -0.12566375732421875, -0.12064743041992188, -0.115631103515625, -0.11061477661132812, -0.10559844970703125, -0.10058212280273438, -0.0955657958984375, -0.09054946899414062, -0.08553314208984375, -0.08051681518554688, -0.07550048828125, -0.07048416137695312, -0.06546783447265625, -0.060451507568359375, -0.0554351806640625, -0.050418853759765625, -0.04540252685546875, -0.040386199951171875, -0.035369873046875, -0.030353546142578125, -0.02533721923828125, -0.020320892333984375, -0.0153045654296875, -0.010288238525390625, -0.00527191162109375, -0.000255584716796875, 0.0047607421875, 0.009777069091796875, 0.01479339599609375, 0.019809722900390625, 0.0248260498046875, 0.029842376708984375, 0.03485870361328125, 0.039875030517578125, 0.044891357421875, 0.049907684326171875, 0.05492401123046875, 0.059940338134765625, 0.0649566650390625, 0.06997299194335938, 0.07498931884765625, 0.08000564575195312, 0.08502197265625, 0.09003829956054688, 0.09505462646484375, 0.10007095336914062, 0.1050872802734375, 0.11010360717773438, 0.11511993408203125, 0.12013626098632812, 0.125152587890625, 0.13016891479492188, 0.13518524169921875, 0.14020156860351562, 0.1452178955078125, 0.15023422241210938, 0.15525054931640625, 0.16026687622070312, 0.165283203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 19.0, 61.0, 121.0, 175.0, 210.0, 177.0, 132.0, 65.0, 26.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06501293182373047, -0.06288719177246094, -0.060761451721191406, -0.058635711669921875, -0.056509971618652344, -0.05438423156738281, -0.05225849151611328, -0.05013275146484375, -0.04800701141357422, -0.04588127136230469, -0.043755531311035156, -0.041629791259765625, -0.039504051208496094, -0.03737831115722656, -0.03525257110595703, -0.0331268310546875, -0.03100109100341797, -0.028875350952148438, -0.026749610900878906, -0.024623870849609375, -0.022498130798339844, -0.020372390747070312, -0.01824665069580078, -0.01612091064453125, -0.013995170593261719, -0.011869430541992188, -0.009743690490722656, -0.007617950439453125, -0.005492210388183594, -0.0033664703369140625, -0.0012407302856445312, 0.000885009765625, 0.0030107498168945312, 0.0051364898681640625, 0.007262229919433594, 0.009387969970703125, 0.011513710021972656, 0.013639450073242188, 0.01576519012451172, 0.01789093017578125, 0.02001667022705078, 0.022142410278320312, 0.024268150329589844, 0.026393890380859375, 0.028519630432128906, 0.030645370483398438, 0.03277111053466797, 0.0348968505859375, 0.03702259063720703, 0.03914833068847656, 0.041274070739746094, 0.043399810791015625, 0.045525550842285156, 0.04765129089355469, 0.04977703094482422, 0.05190277099609375, 0.05402851104736328, 0.05615425109863281, 0.058279991149902344, 0.060405731201171875, 0.0625314712524414, 0.06465721130371094, 0.06678295135498047, 0.06890869140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 25.0, 39.0, 68.0, 92.0, 146.0, 278.0, 448.0, 733.0, 1327.0, 2709.0, 5755.0, 12298.0, 29794.0, 76892.0, 206185.0, 371099.0, 208605.0, 78028.0, 30032.0, 12503.0, 5513.0, 2668.0, 1444.0, 723.0, 460.0, 258.0, 148.0, 96.0, 46.0, 34.0, 29.0, 14.0, 14.0, 6.0, 11.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.055428504943847656, -0.05348396301269531, -0.05153942108154297, -0.049594879150390625, -0.04765033721923828, -0.04570579528808594, -0.043761253356933594, -0.04181671142578125, -0.039872169494628906, -0.03792762756347656, -0.03598308563232422, -0.034038543701171875, -0.03209400177001953, -0.030149459838867188, -0.028204917907714844, -0.0262603759765625, -0.024315834045410156, -0.022371292114257812, -0.02042675018310547, -0.018482208251953125, -0.01653766632080078, -0.014593124389648438, -0.012648582458496094, -0.01070404052734375, -0.008759498596191406, -0.0068149566650390625, -0.004870414733886719, -0.002925872802734375, -0.0009813308715820312, 0.0009632110595703125, 0.0029077529907226562, 0.004852294921875, 0.006796836853027344, 0.008741378784179688, 0.010685920715332031, 0.012630462646484375, 0.014575004577636719, 0.016519546508789062, 0.018464088439941406, 0.02040863037109375, 0.022353172302246094, 0.024297714233398438, 0.02624225616455078, 0.028186798095703125, 0.03013134002685547, 0.03207588195800781, 0.034020423889160156, 0.0359649658203125, 0.037909507751464844, 0.03985404968261719, 0.04179859161376953, 0.043743133544921875, 0.04568767547607422, 0.04763221740722656, 0.049576759338378906, 0.05152130126953125, 0.053465843200683594, 0.05541038513183594, 0.05735492706298828, 0.059299468994140625, 0.06124401092529297, 0.06318855285644531, 0.06513309478759766, 0.06707763671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 7.0, 7.0, 4.0, 9.0, 11.0, 14.0, 16.0, 12.0, 26.0, 29.0, 37.0, 31.0, 44.0, 47.0, 47.0, 56.0, 61.0, 49.0, 61.0, 51.0, 56.0, 51.0, 49.0, 42.0, 41.0, 29.0, 32.0, 24.0, 16.0, 8.0, 5.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07361507415771484, -0.07130241394042969, -0.06898975372314453, -0.06667709350585938, -0.06436443328857422, -0.06205177307128906, -0.059739112854003906, -0.05742645263671875, -0.055113792419433594, -0.05280113220214844, -0.05048847198486328, -0.048175811767578125, -0.04586315155029297, -0.04355049133300781, -0.041237831115722656, -0.0389251708984375, -0.036612510681152344, -0.03429985046386719, -0.03198719024658203, -0.029674530029296875, -0.02736186981201172, -0.025049209594726562, -0.022736549377441406, -0.02042388916015625, -0.018111228942871094, -0.015798568725585938, -0.013485908508300781, -0.011173248291015625, -0.008860588073730469, -0.0065479278564453125, -0.004235267639160156, -0.001922607421875, 0.00039005279541015625, 0.0027027130126953125, 0.005015373229980469, 0.007328033447265625, 0.009640693664550781, 0.011953353881835938, 0.014266014099121094, 0.01657867431640625, 0.018891334533691406, 0.021203994750976562, 0.02351665496826172, 0.025829315185546875, 0.02814197540283203, 0.030454635620117188, 0.032767295837402344, 0.0350799560546875, 0.037392616271972656, 0.03970527648925781, 0.04201793670654297, 0.044330596923828125, 0.04664325714111328, 0.04895591735839844, 0.051268577575683594, 0.05358123779296875, 0.055893898010253906, 0.05820655822753906, 0.06051921844482422, 0.06283187866210938, 0.06514453887939453, 0.06745719909667969, 0.06976985931396484, 0.07208251953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 2.0, 9.0, 7.0, 7.0, 3.0, 6.0, 13.0, 18.0, 29.0, 27.0, 42.0, 72.0, 86.0, 142.0, 187.0, 309.0, 408.0, 538.0, 788.0, 1224.0, 1730.0, 2882.0, 4990.0, 11957.0, 44965.0, 313607.0, 550845.0, 79754.0, 17562.0, 6541.0, 3310.0, 2008.0, 1294.0, 925.0, 659.0, 472.0, 329.0, 240.0, 159.0, 107.0, 89.0, 61.0, 38.0, 33.0, 26.0, 20.0, 13.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.08270263671875, -0.08013153076171875, -0.0775604248046875, -0.07498931884765625, -0.072418212890625, -0.06984710693359375, -0.0672760009765625, -0.06470489501953125, -0.0621337890625, -0.05956268310546875, -0.0569915771484375, -0.05442047119140625, -0.051849365234375, -0.04927825927734375, -0.0467071533203125, -0.04413604736328125, -0.04156494140625, -0.03899383544921875, -0.0364227294921875, -0.03385162353515625, -0.031280517578125, -0.02870941162109375, -0.0261383056640625, -0.02356719970703125, -0.02099609375, -0.01842498779296875, -0.0158538818359375, -0.01328277587890625, -0.010711669921875, -0.00814056396484375, -0.0055694580078125, -0.00299835205078125, -0.00042724609375, 0.00214385986328125, 0.0047149658203125, 0.00728607177734375, 0.009857177734375, 0.01242828369140625, 0.0149993896484375, 0.01757049560546875, 0.0201416015625, 0.02271270751953125, 0.0252838134765625, 0.02785491943359375, 0.030426025390625, 0.03299713134765625, 0.0355682373046875, 0.03813934326171875, 0.04071044921875, 0.04328155517578125, 0.0458526611328125, 0.04842376708984375, 0.050994873046875, 0.05356597900390625, 0.0561370849609375, 0.05870819091796875, 0.061279296875, 0.06385040283203125, 0.0664215087890625, 0.06899261474609375, 0.071563720703125, 0.07413482666015625, 0.0767059326171875, 0.07927703857421875, 0.08184814453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 12.0, 17.0, 19.0, 26.0, 30.0, 44.0, 53.0, 96.0, 120.0, 138.0, 104.0, 88.0, 48.0, 37.0, 40.0, 33.0, 17.0, 12.0, 14.0, 9.0, 6.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011986494064331055, -0.00011617504060268402, -0.0001124851405620575, -0.00010879524052143097, -0.00010510534048080444, -0.00010141544044017792, -9.772554039955139e-05, -9.403564035892487e-05, -9.034574031829834e-05, -8.665584027767181e-05, -8.296594023704529e-05, -7.927604019641876e-05, -7.558614015579224e-05, -7.189624011516571e-05, -6.820634007453918e-05, -6.451644003391266e-05, -6.082653999328613e-05, -5.713663995265961e-05, -5.344673991203308e-05, -4.9756839871406555e-05, -4.606693983078003e-05, -4.2377039790153503e-05, -3.868713974952698e-05, -3.499723970890045e-05, -3.1307339668273926e-05, -2.76174396276474e-05, -2.3927539587020874e-05, -2.0237639546394348e-05, -1.6547739505767822e-05, -1.2857839465141296e-05, -9.16793942451477e-06, -5.478039383888245e-06, -1.7881393432617188e-06, 1.9017606973648071e-06, 5.591660737991333e-06, 9.281560778617859e-06, 1.2971460819244385e-05, 1.666136085987091e-05, 2.0351260900497437e-05, 2.4041160941123962e-05, 2.7731060981750488e-05, 3.1420961022377014e-05, 3.511086106300354e-05, 3.8800761103630066e-05, 4.249066114425659e-05, 4.618056118488312e-05, 4.9870461225509644e-05, 5.356036126613617e-05, 5.7250261306762695e-05, 6.094016134738922e-05, 6.463006138801575e-05, 6.831996142864227e-05, 7.20098614692688e-05, 7.569976150989532e-05, 7.938966155052185e-05, 8.307956159114838e-05, 8.67694616317749e-05, 9.045936167240143e-05, 9.414926171302795e-05, 9.783916175365448e-05, 0.000101529061794281, 0.00010521896183490753, 0.00010890886187553406, 0.00011259876191616058, 0.00011628866195678711]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 12.0, 16.0, 33.0, 39.0, 73.0, 93.0, 112.0, 192.0, 257.0, 431.0, 670.0, 1194.0, 1980.0, 4070.0, 10047.0, 37383.0, 262210.0, 606419.0, 92273.0, 18075.0, 6130.0, 2881.0, 1570.0, 889.0, 524.0, 327.0, 202.0, 133.0, 95.0, 61.0, 37.0, 32.0, 16.0, 16.0, 17.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08015632629394531, -0.07767105102539062, -0.07518577575683594, -0.07270050048828125, -0.07021522521972656, -0.06772994995117188, -0.06524467468261719, -0.0627593994140625, -0.06027412414550781, -0.057788848876953125, -0.05530357360839844, -0.05281829833984375, -0.05033302307128906, -0.047847747802734375, -0.04536247253417969, -0.042877197265625, -0.04039192199707031, -0.037906646728515625, -0.03542137145996094, -0.03293609619140625, -0.030450820922851562, -0.027965545654296875, -0.025480270385742188, -0.0229949951171875, -0.020509719848632812, -0.018024444580078125, -0.015539169311523438, -0.01305389404296875, -0.010568618774414062, -0.008083343505859375, -0.0055980682373046875, -0.00311279296875, -0.0006275177001953125, 0.001857757568359375, 0.0043430328369140625, 0.00682830810546875, 0.009313583374023438, 0.011798858642578125, 0.014284133911132812, 0.0167694091796875, 0.019254684448242188, 0.021739959716796875, 0.024225234985351562, 0.02671051025390625, 0.029195785522460938, 0.031681060791015625, 0.03416633605957031, 0.036651611328125, 0.03913688659667969, 0.041622161865234375, 0.04410743713378906, 0.04659271240234375, 0.04907798767089844, 0.051563262939453125, 0.05404853820800781, 0.0565338134765625, 0.05901908874511719, 0.061504364013671875, 0.06398963928222656, 0.06647491455078125, 0.06896018981933594, 0.07144546508789062, 0.07393074035644531, 0.076416015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 11.0, 9.0, 11.0, 6.0, 19.0, 25.0, 44.0, 39.0, 73.0, 79.0, 113.0, 102.0, 116.0, 100.0, 65.0, 60.0, 38.0, 23.0, 14.0, 14.0, 11.0, 8.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0596923828125, -0.057801246643066406, -0.05591011047363281, -0.05401897430419922, -0.052127838134765625, -0.05023670196533203, -0.04834556579589844, -0.046454429626464844, -0.04456329345703125, -0.042672157287597656, -0.04078102111816406, -0.03888988494873047, -0.036998748779296875, -0.03510761260986328, -0.03321647644042969, -0.031325340270996094, -0.0294342041015625, -0.027543067932128906, -0.025651931762695312, -0.02376079559326172, -0.021869659423828125, -0.01997852325439453, -0.018087387084960938, -0.016196250915527344, -0.01430511474609375, -0.012413978576660156, -0.010522842407226562, -0.008631706237792969, -0.006740570068359375, -0.004849433898925781, -0.0029582977294921875, -0.0010671615600585938, 0.000823974609375, 0.0027151107788085938, 0.0046062469482421875, 0.006497383117675781, 0.008388519287109375, 0.010279655456542969, 0.012170791625976562, 0.014061927795410156, 0.01595306396484375, 0.017844200134277344, 0.019735336303710938, 0.02162647247314453, 0.023517608642578125, 0.02540874481201172, 0.027299880981445312, 0.029191017150878906, 0.0310821533203125, 0.032973289489746094, 0.03486442565917969, 0.03675556182861328, 0.038646697998046875, 0.04053783416748047, 0.04242897033691406, 0.044320106506347656, 0.04621124267578125, 0.048102378845214844, 0.04999351501464844, 0.05188465118408203, 0.053775787353515625, 0.05566692352294922, 0.05755805969238281, 0.059449195861816406, 0.06134033203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 20.0, 55.0, 119.0, 223.0, 268.0, 161.0, 76.0, 29.0, 14.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.948332667350769, -0.9133965969085693, -0.8784605264663696, -0.8435244560241699, -0.8085883855819702, -0.7736523151397705, -0.7387163043022156, -0.7037802338600159, -0.6688441634178162, -0.6339080929756165, -0.5989720225334167, -0.564035952091217, -0.5290999412536621, -0.49416384100914, -0.4592278003692627, -0.424291729927063, -0.3893556594848633, -0.3544195890426636, -0.31948351860046387, -0.28454747796058655, -0.24961140751838684, -0.21467533707618713, -0.17973928153514862, -0.1448032259941101, -0.1098671555519104, -0.07493109256029129, -0.03999502956867218, -0.00505896657705307, 0.02987709641456604, 0.06481316685676575, 0.09974922239780426, 0.13468527793884277, 0.16962134838104248, 0.2045574188232422, 0.2394934743642807, 0.2744295299053192, 0.3093656003475189, 0.34430167078971863, 0.37923771142959595, 0.41417378187179565, 0.44910985231399536, 0.48404592275619507, 0.5189819931983948, 0.5539180636405945, 0.5888540744781494, 0.6237901449203491, 0.6587262153625488, 0.6936622858047485, 0.7285983562469482, 0.763534426689148, 0.7984704971313477, 0.8334065675735474, 0.8683426380157471, 0.9032787084579468, 0.9382147192955017, 0.9731507897377014, 1.008086919784546, 1.0430229902267456, 1.0779590606689453, 1.112895131111145, 1.1478312015533447, 1.1827672719955444, 1.2177033424377441, 1.2526392936706543, 1.287575364112854]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 3.0, 8.0, 9.0, 10.0, 10.0, 15.0, 15.0, 23.0, 25.0, 37.0, 35.0, 29.0, 44.0, 33.0, 49.0, 39.0, 43.0, 44.0, 34.0, 47.0, 52.0, 53.0, 40.0, 39.0, 35.0, 26.0, 27.0, 28.0, 28.0, 26.0, 16.0, 22.0, 8.0, 12.0, 8.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0], "bins": [-0.287497341632843, -0.28001266717910767, -0.2725279927253723, -0.26504331827163696, -0.2575586438179016, -0.25007396936416626, -0.2425892949104309, -0.23510462045669556, -0.2276199460029602, -0.22013527154922485, -0.2126505970954895, -0.20516592264175415, -0.1976812481880188, -0.19019657373428345, -0.1827118992805481, -0.17522722482681274, -0.1677425503730774, -0.16025787591934204, -0.1527732014656067, -0.14528852701187134, -0.137803852558136, -0.13031917810440063, -0.12283450365066528, -0.11534982919692993, -0.10786515474319458, -0.10038048028945923, -0.09289580583572388, -0.08541113138198853, -0.07792645692825317, -0.07044178247451782, -0.06295710802078247, -0.05547243356704712, -0.04798775911331177, -0.040503084659576416, -0.033018410205841064, -0.025533735752105713, -0.01804906129837036, -0.01056438684463501, -0.003079712390899658, 0.004404962062835693, 0.011889636516571045, 0.019374310970306396, 0.026858985424041748, 0.0343436598777771, 0.04182833433151245, 0.0493130087852478, 0.056797683238983154, 0.0642823576927185, 0.07176703214645386, 0.07925170660018921, 0.08673638105392456, 0.09422105550765991, 0.10170572996139526, 0.10919040441513062, 0.11667507886886597, 0.12415975332260132, 0.13164442777633667, 0.13912910223007202, 0.14661377668380737, 0.15409845113754272, 0.16158312559127808, 0.16906780004501343, 0.17655247449874878, 0.18403714895248413, 0.19152182340621948]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 17.0, 44.0, 161.0, 1124.0, 19784.0, 3951692.0, 216467.0, 4419.0, 413.0, 93.0, 37.0, 11.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2325439453125, -0.22522544860839844, -0.21790695190429688, -0.2105884552001953, -0.20326995849609375, -0.1959514617919922, -0.18863296508789062, -0.18131446838378906, -0.1739959716796875, -0.16667747497558594, -0.15935897827148438, -0.1520404815673828, -0.14472198486328125, -0.1374034881591797, -0.13008499145507812, -0.12276649475097656, -0.115447998046875, -0.10812950134277344, -0.10081100463867188, -0.09349250793457031, -0.08617401123046875, -0.07885551452636719, -0.07153701782226562, -0.06421852111816406, -0.0569000244140625, -0.04958152770996094, -0.042263031005859375, -0.03494453430175781, -0.02762603759765625, -0.020307540893554688, -0.012989044189453125, -0.0056705474853515625, 0.00164794921875, 0.008966445922851562, 0.016284942626953125, 0.023603439331054688, 0.03092193603515625, 0.03824043273925781, 0.045558929443359375, 0.05287742614746094, 0.0601959228515625, 0.06751441955566406, 0.07483291625976562, 0.08215141296386719, 0.08946990966796875, 0.09678840637207031, 0.10410690307617188, 0.11142539978027344, 0.118743896484375, 0.12606239318847656, 0.13338088989257812, 0.1406993865966797, 0.14801788330078125, 0.1553363800048828, 0.16265487670898438, 0.16997337341308594, 0.1772918701171875, 0.18461036682128906, 0.19192886352539062, 0.1992473602294922, 0.20656585693359375, 0.2138843536376953, 0.22120285034179688, 0.22852134704589844, 0.23583984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 18.0, 28.0, 59.0, 113.0, 134.0, 155.0, 165.0, 132.0, 89.0, 70.0, 22.0, 12.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.06089496612548828, -0.05886268615722656, -0.056830406188964844, -0.054798126220703125, -0.052765846252441406, -0.05073356628417969, -0.04870128631591797, -0.04666900634765625, -0.04463672637939453, -0.04260444641113281, -0.040572166442871094, -0.038539886474609375, -0.036507606506347656, -0.03447532653808594, -0.03244304656982422, -0.0304107666015625, -0.02837848663330078, -0.026346206665039062, -0.024313926696777344, -0.022281646728515625, -0.020249366760253906, -0.018217086791992188, -0.01618480682373047, -0.01415252685546875, -0.012120246887207031, -0.010087966918945312, -0.008055686950683594, -0.006023406982421875, -0.003991127014160156, -0.0019588470458984375, 7.343292236328125e-05, 0.002105712890625, 0.004137992858886719, 0.0061702728271484375, 0.008202552795410156, 0.010234832763671875, 0.012267112731933594, 0.014299392700195312, 0.01633167266845703, 0.01836395263671875, 0.02039623260498047, 0.022428512573242188, 0.024460792541503906, 0.026493072509765625, 0.028525352478027344, 0.030557632446289062, 0.03258991241455078, 0.0346221923828125, 0.03665447235107422, 0.03868675231933594, 0.040719032287597656, 0.042751312255859375, 0.044783592224121094, 0.04681587219238281, 0.04884815216064453, 0.05088043212890625, 0.05291271209716797, 0.05494499206542969, 0.056977272033691406, 0.059009552001953125, 0.061041831970214844, 0.06307411193847656, 0.06510639190673828, 0.067138671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 6.0, 10.0, 10.0, 25.0, 27.0, 49.0, 61.0, 103.0, 158.0, 217.0, 379.0, 670.0, 1064.0, 1917.0, 3576.0, 7529.0, 17953.0, 53296.0, 230219.0, 2826805.0, 878900.0, 115007.0, 32363.0, 12153.0, 5396.0, 2701.0, 1434.0, 907.0, 477.0, 337.0, 210.0, 101.0, 85.0, 54.0, 39.0, 14.0, 10.0, 10.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.05586385726928711, -0.05398845672607422, -0.05211305618286133, -0.05023765563964844, -0.04836225509643555, -0.046486854553222656, -0.044611454010009766, -0.042736053466796875, -0.040860652923583984, -0.038985252380371094, -0.0371098518371582, -0.03523445129394531, -0.03335905075073242, -0.03148365020751953, -0.02960824966430664, -0.02773284912109375, -0.02585744857788086, -0.02398204803466797, -0.022106647491455078, -0.020231246948242188, -0.018355846405029297, -0.016480445861816406, -0.014605045318603516, -0.012729644775390625, -0.010854244232177734, -0.008978843688964844, -0.007103443145751953, -0.0052280426025390625, -0.003352642059326172, -0.0014772415161132812, 0.0003981590270996094, 0.0022735595703125, 0.004148960113525391, 0.006024360656738281, 0.007899761199951172, 0.009775161743164062, 0.011650562286376953, 0.013525962829589844, 0.015401363372802734, 0.017276763916015625, 0.019152164459228516, 0.021027565002441406, 0.022902965545654297, 0.024778366088867188, 0.026653766632080078, 0.02852916717529297, 0.03040456771850586, 0.03227996826171875, 0.03415536880493164, 0.03603076934814453, 0.03790616989135742, 0.03978157043457031, 0.0416569709777832, 0.043532371520996094, 0.045407772064208984, 0.047283172607421875, 0.049158573150634766, 0.051033973693847656, 0.05290937423706055, 0.05478477478027344, 0.05666017532348633, 0.05853557586669922, 0.06041097640991211, 0.062286376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 12.0, 14.0, 13.0, 28.0, 33.0, 54.0, 55.0, 107.0, 137.0, 191.0, 352.0, 710.0, 1037.0, 532.0, 266.0, 170.0, 89.0, 67.0, 52.0, 35.0, 27.0, 19.0, 14.0, 9.0, 7.0, 5.0, 6.0, 9.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.05963134765625, -0.05798530578613281, -0.056339263916015625, -0.05469322204589844, -0.05304718017578125, -0.05140113830566406, -0.049755096435546875, -0.04810905456542969, -0.0464630126953125, -0.04481697082519531, -0.043170928955078125, -0.04152488708496094, -0.03987884521484375, -0.03823280334472656, -0.036586761474609375, -0.03494071960449219, -0.033294677734375, -0.03164863586425781, -0.030002593994140625, -0.028356552124023438, -0.02671051025390625, -0.025064468383789062, -0.023418426513671875, -0.021772384643554688, -0.0201263427734375, -0.018480300903320312, -0.016834259033203125, -0.015188217163085938, -0.01354217529296875, -0.011896133422851562, -0.010250091552734375, -0.008604049682617188, -0.0069580078125, -0.0053119659423828125, -0.003665924072265625, -0.0020198822021484375, -0.00037384033203125, 0.0012722015380859375, 0.002918243408203125, 0.0045642852783203125, 0.0062103271484375, 0.007856369018554688, 0.009502410888671875, 0.011148452758789062, 0.01279449462890625, 0.014440536499023438, 0.016086578369140625, 0.017732620239257812, 0.019378662109375, 0.021024703979492188, 0.022670745849609375, 0.024316787719726562, 0.02596282958984375, 0.027608871459960938, 0.029254913330078125, 0.030900955200195312, 0.0325469970703125, 0.03419303894042969, 0.035839080810546875, 0.03748512268066406, 0.03913116455078125, 0.04077720642089844, 0.042423248291015625, 0.04406929016113281, 0.04571533203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 20.0, 22.0, 40.0, 54.0, 112.0, 154.0, 179.0, 167.0, 100.0, 54.0, 41.0, 26.0, 13.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2858421802520752, -0.27044135332107544, -0.25504055619239807, -0.23963972926139832, -0.22423893213272095, -0.2088381052017212, -0.19343729317188263, -0.17803648114204407, -0.1626356691122055, -0.14723485708236694, -0.13183404505252838, -0.11643322557210922, -0.10103241354227066, -0.0856316015124321, -0.07023078203201294, -0.05482997000217438, -0.039429157972335815, -0.024028344079852104, -0.008627530187368393, 0.0067732855677604675, 0.02217409759759903, 0.03757490962743759, 0.05297572910785675, 0.06837654113769531, 0.08377735316753387, 0.09917816519737244, 0.114578977227211, 0.12997978925704956, 0.14538061618804932, 0.16078141331672668, 0.17618224024772644, 0.191583052277565, 0.20698386430740356, 0.22238467633724213, 0.2377854883670807, 0.25318631529808044, 0.2685871124267578, 0.28398793935775757, 0.2993887662887573, 0.3147895634174347, 0.33019036054611206, 0.3455911874771118, 0.3609919846057892, 0.37639281153678894, 0.3917936086654663, 0.40719443559646606, 0.4225952625274658, 0.4379960596561432, 0.45339688658714294, 0.4687977135181427, 0.48419851064682007, 0.4995993375778198, 0.5150001645088196, 0.5304009318351746, 0.5458017587661743, 0.5612025856971741, 0.5766034126281738, 0.5920042395591736, 0.6074050664901733, 0.6228058338165283, 0.6382066607475281, 0.6536074876785278, 0.6690083146095276, 0.6844091415405273, 0.6998099088668823]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 13.0, 7.0, 4.0, 12.0, 9.0, 8.0, 14.0, 13.0, 22.0, 23.0, 20.0, 30.0, 38.0, 37.0, 31.0, 24.0, 33.0, 43.0, 42.0, 52.0, 40.0, 42.0, 40.0, 44.0, 41.0, 44.0, 39.0, 29.0, 29.0, 29.0, 23.0, 27.0, 16.0, 17.0, 14.0, 8.0, 5.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.14816880226135254, -0.143440380692482, -0.13871195912361145, -0.1339835524559021, -0.12925513088703156, -0.12452670931816101, -0.11979828774929047, -0.11506986618041992, -0.11034145206212997, -0.10561303049325943, -0.10088461637496948, -0.09615619480609894, -0.0914277732372284, -0.08669935911893845, -0.0819709375500679, -0.07724252343177795, -0.07251410186290741, -0.06778568029403687, -0.06305726617574692, -0.05832884460687637, -0.05360042676329613, -0.04887200891971588, -0.04414358735084534, -0.03941516950726509, -0.034686751663684845, -0.0299583338201046, -0.025229914113879204, -0.02050149440765381, -0.015773076564073563, -0.011044658720493317, -0.0063162390142679214, -0.0015878193080425262, 0.0031405985355377197, 0.00786901731044054, 0.012597436085343361, 0.017325855791568756, 0.022054273635149002, 0.026782691478729248, 0.03151111304759979, 0.03623953089118004, 0.040967948734760284, 0.04569636657834053, 0.050424784421920776, 0.05515320599079132, 0.05988162383437157, 0.06461004167795181, 0.06933846324682236, 0.0740668773651123, 0.07879529893398285, 0.0835237205028534, 0.08825213462114334, 0.09298055619001389, 0.09770897030830383, 0.10243739187717438, 0.10716581344604492, 0.11189423501491547, 0.11662264913320541, 0.12135107070207596, 0.1260794848203659, 0.13080790638923645, 0.135536327958107, 0.14026474952697754, 0.1449931561946869, 0.14972157776355743, 0.15444999933242798]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 5.0, 11.0, 15.0, 14.0, 24.0, 40.0, 53.0, 89.0, 120.0, 212.0, 347.0, 787.0, 1967.0, 7122.0, 33543.0, 178853.0, 545100.0, 225151.0, 42159.0, 8865.0, 2259.0, 797.0, 390.0, 214.0, 119.0, 92.0, 57.0, 52.0, 27.0, 23.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148681640625, -0.14381790161132812, -0.13895416259765625, -0.13409042358398438, -0.1292266845703125, -0.12436294555664062, -0.11949920654296875, -0.11463546752929688, -0.109771728515625, -0.10490798950195312, -0.10004425048828125, -0.09518051147460938, -0.0903167724609375, -0.08545303344726562, -0.08058929443359375, -0.07572555541992188, -0.07086181640625, -0.06599807739257812, -0.06113433837890625, -0.056270599365234375, -0.0514068603515625, -0.046543121337890625, -0.04167938232421875, -0.036815643310546875, -0.031951904296875, -0.027088165283203125, -0.02222442626953125, -0.017360687255859375, -0.0124969482421875, -0.007633209228515625, -0.00276947021484375, 0.002094268798828125, 0.0069580078125, 0.011821746826171875, 0.01668548583984375, 0.021549224853515625, 0.0264129638671875, 0.031276702880859375, 0.03614044189453125, 0.041004180908203125, 0.045867919921875, 0.050731658935546875, 0.05559539794921875, 0.060459136962890625, 0.0653228759765625, 0.07018661499023438, 0.07505035400390625, 0.07991409301757812, 0.08477783203125, 0.08964157104492188, 0.09450531005859375, 0.09936904907226562, 0.1042327880859375, 0.10909652709960938, 0.11396026611328125, 0.11882400512695312, 0.123687744140625, 0.12855148315429688, 0.13341522216796875, 0.13827896118164062, 0.1431427001953125, 0.14800643920898438, 0.15287017822265625, 0.15773391723632812, 0.16259765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 12.0, 24.0, 54.0, 72.0, 101.0, 164.0, 147.0, 150.0, 122.0, 70.0, 49.0, 21.0, 9.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06494808197021484, -0.06281852722167969, -0.06068897247314453, -0.058559417724609375, -0.05642986297607422, -0.05430030822753906, -0.052170753479003906, -0.05004119873046875, -0.047911643981933594, -0.04578208923339844, -0.04365253448486328, -0.041522979736328125, -0.03939342498779297, -0.03726387023925781, -0.035134315490722656, -0.0330047607421875, -0.030875205993652344, -0.028745651245117188, -0.02661609649658203, -0.024486541748046875, -0.02235698699951172, -0.020227432250976562, -0.018097877502441406, -0.01596832275390625, -0.013838768005371094, -0.011709213256835938, -0.009579658508300781, -0.007450103759765625, -0.005320549011230469, -0.0031909942626953125, -0.0010614395141601562, 0.001068115234375, 0.0031976699829101562, 0.0053272247314453125, 0.007456779479980469, 0.009586334228515625, 0.011715888977050781, 0.013845443725585938, 0.015974998474121094, 0.01810455322265625, 0.020234107971191406, 0.022363662719726562, 0.02449321746826172, 0.026622772216796875, 0.02875232696533203, 0.030881881713867188, 0.033011436462402344, 0.0351409912109375, 0.037270545959472656, 0.03940010070800781, 0.04152965545654297, 0.043659210205078125, 0.04578876495361328, 0.04791831970214844, 0.050047874450683594, 0.05217742919921875, 0.054306983947753906, 0.05643653869628906, 0.05856609344482422, 0.060695648193359375, 0.06282520294189453, 0.06495475769042969, 0.06708431243896484, 0.0692138671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 7.0, 11.0, 11.0, 22.0, 18.0, 26.0, 44.0, 80.0, 117.0, 192.0, 306.0, 572.0, 1165.0, 2445.0, 5255.0, 12223.0, 31256.0, 82182.0, 217071.0, 361491.0, 205557.0, 76972.0, 29877.0, 11834.0, 5066.0, 2228.0, 1120.0, 570.0, 326.0, 188.0, 100.0, 63.0, 30.0, 44.0, 26.0, 16.0, 8.0, 6.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07563400268554688, -0.07277679443359375, -0.06991958618164062, -0.0670623779296875, -0.06420516967773438, -0.06134796142578125, -0.058490753173828125, -0.055633544921875, -0.052776336669921875, -0.04991912841796875, -0.047061920166015625, -0.0442047119140625, -0.041347503662109375, -0.03849029541015625, -0.035633087158203125, -0.03277587890625, -0.029918670654296875, -0.02706146240234375, -0.024204254150390625, -0.0213470458984375, -0.018489837646484375, -0.01563262939453125, -0.012775421142578125, -0.009918212890625, -0.007061004638671875, -0.00420379638671875, -0.001346588134765625, 0.0015106201171875, 0.004367828369140625, 0.00722503662109375, 0.010082244873046875, 0.012939453125, 0.015796661376953125, 0.01865386962890625, 0.021511077880859375, 0.0243682861328125, 0.027225494384765625, 0.03008270263671875, 0.032939910888671875, 0.035797119140625, 0.038654327392578125, 0.04151153564453125, 0.044368743896484375, 0.0472259521484375, 0.050083160400390625, 0.05294036865234375, 0.055797576904296875, 0.05865478515625, 0.061511993408203125, 0.06436920166015625, 0.06722640991210938, 0.0700836181640625, 0.07294082641601562, 0.07579803466796875, 0.07865524291992188, 0.081512451171875, 0.08436965942382812, 0.08722686767578125, 0.09008407592773438, 0.0929412841796875, 0.09579849243164062, 0.09865570068359375, 0.10151290893554688, 0.1043701171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 6.0, 6.0, 5.0, 9.0, 8.0, 12.0, 10.0, 16.0, 16.0, 30.0, 25.0, 26.0, 27.0, 41.0, 32.0, 46.0, 28.0, 36.0, 33.0, 42.0, 51.0, 46.0, 42.0, 40.0, 30.0, 36.0, 31.0, 36.0, 28.0, 24.0, 24.0, 24.0, 16.0, 15.0, 14.0, 15.0, 12.0, 11.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.08294677734375, -0.08051300048828125, -0.0780792236328125, -0.07564544677734375, -0.073211669921875, -0.07077789306640625, -0.0683441162109375, -0.06591033935546875, -0.0634765625, -0.06104278564453125, -0.0586090087890625, -0.05617523193359375, -0.053741455078125, -0.05130767822265625, -0.0488739013671875, -0.04644012451171875, -0.04400634765625, -0.04157257080078125, -0.0391387939453125, -0.03670501708984375, -0.034271240234375, -0.03183746337890625, -0.0294036865234375, -0.02696990966796875, -0.0245361328125, -0.02210235595703125, -0.0196685791015625, -0.01723480224609375, -0.014801025390625, -0.01236724853515625, -0.0099334716796875, -0.00749969482421875, -0.00506591796875, -0.00263214111328125, -0.0001983642578125, 0.00223541259765625, 0.004669189453125, 0.00710296630859375, 0.0095367431640625, 0.01197052001953125, 0.014404296875, 0.01683807373046875, 0.0192718505859375, 0.02170562744140625, 0.024139404296875, 0.02657318115234375, 0.0290069580078125, 0.03144073486328125, 0.03387451171875, 0.03630828857421875, 0.0387420654296875, 0.04117584228515625, 0.043609619140625, 0.04604339599609375, 0.0484771728515625, 0.05091094970703125, 0.0533447265625, 0.05577850341796875, 0.0582122802734375, 0.06064605712890625, 0.063079833984375, 0.06551361083984375, 0.0679473876953125, 0.07038116455078125, 0.07281494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 7.0, 8.0, 18.0, 21.0, 30.0, 41.0, 48.0, 84.0, 99.0, 150.0, 219.0, 320.0, 482.0, 740.0, 1316.0, 2404.0, 5063.0, 13187.0, 59825.0, 734139.0, 190998.0, 23908.0, 7589.0, 3276.0, 1717.0, 971.0, 630.0, 376.0, 259.0, 174.0, 121.0, 93.0, 81.0, 44.0, 33.0, 23.0, 19.0, 9.0, 4.0, 11.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.15937042236328125, -0.1538238525390625, -0.14827728271484375, -0.142730712890625, -0.13718414306640625, -0.1316375732421875, -0.12609100341796875, -0.12054443359375, -0.11499786376953125, -0.1094512939453125, -0.10390472412109375, -0.098358154296875, -0.09281158447265625, -0.0872650146484375, -0.08171844482421875, -0.076171875, -0.07062530517578125, -0.0650787353515625, -0.05953216552734375, -0.053985595703125, -0.04843902587890625, -0.0428924560546875, -0.03734588623046875, -0.03179931640625, -0.02625274658203125, -0.0207061767578125, -0.01515960693359375, -0.009613037109375, -0.00406646728515625, 0.0014801025390625, 0.00702667236328125, 0.0125732421875, 0.01811981201171875, 0.0236663818359375, 0.02921295166015625, 0.034759521484375, 0.04030609130859375, 0.0458526611328125, 0.05139923095703125, 0.05694580078125, 0.06249237060546875, 0.0680389404296875, 0.07358551025390625, 0.079132080078125, 0.08467864990234375, 0.0902252197265625, 0.09577178955078125, 0.101318359375, 0.10686492919921875, 0.1124114990234375, 0.11795806884765625, 0.123504638671875, 0.12905120849609375, 0.1345977783203125, 0.14014434814453125, 0.14569091796875, 0.15123748779296875, 0.1567840576171875, 0.16233062744140625, 0.167877197265625, 0.17342376708984375, 0.1789703369140625, 0.18451690673828125, 0.1900634765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 10.0, 8.0, 15.0, 13.0, 20.0, 21.0, 44.0, 51.0, 75.0, 101.0, 115.0, 112.0, 103.0, 86.0, 50.0, 57.0, 28.0, 21.0, 16.0, 17.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.790327072143555e-05, -7.561221718788147e-05, -7.332116365432739e-05, -7.103011012077332e-05, -6.873905658721924e-05, -6.644800305366516e-05, -6.415694952011108e-05, -6.186589598655701e-05, -5.957484245300293e-05, -5.728378891944885e-05, -5.4992735385894775e-05, -5.27016818523407e-05, -5.041062831878662e-05, -4.8119574785232544e-05, -4.582852125167847e-05, -4.353746771812439e-05, -4.124641418457031e-05, -3.8955360651016235e-05, -3.666430711746216e-05, -3.437325358390808e-05, -3.2082200050354004e-05, -2.9791146516799927e-05, -2.750009298324585e-05, -2.5209039449691772e-05, -2.2917985916137695e-05, -2.0626932382583618e-05, -1.833587884902954e-05, -1.6044825315475464e-05, -1.3753771781921387e-05, -1.146271824836731e-05, -9.171664714813232e-06, -6.880611181259155e-06, -4.589557647705078e-06, -2.298504114151001e-06, -7.450580596923828e-09, 2.2836029529571533e-06, 4.5746564865112305e-06, 6.865710020065308e-06, 9.156763553619385e-06, 1.1447817087173462e-05, 1.3738870620727539e-05, 1.6029924154281616e-05, 1.8320977687835693e-05, 2.061203122138977e-05, 2.2903084754943848e-05, 2.5194138288497925e-05, 2.7485191822052002e-05, 2.977624535560608e-05, 3.2067298889160156e-05, 3.4358352422714233e-05, 3.664940595626831e-05, 3.894045948982239e-05, 4.1231513023376465e-05, 4.352256655693054e-05, 4.581362009048462e-05, 4.8104673624038696e-05, 5.0395727157592773e-05, 5.268678069114685e-05, 5.497783422470093e-05, 5.7268887758255005e-05, 5.955994129180908e-05, 6.185099482536316e-05, 6.414204835891724e-05, 6.643310189247131e-05, 6.872415542602539e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 12.0, 13.0, 13.0, 19.0, 31.0, 42.0, 59.0, 118.0, 156.0, 255.0, 451.0, 702.0, 1185.0, 2169.0, 3966.0, 8623.0, 34676.0, 698073.0, 262989.0, 20540.0, 6647.0, 3289.0, 1789.0, 1098.0, 628.0, 383.0, 230.0, 133.0, 107.0, 43.0, 36.0, 18.0, 16.0, 8.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.22036170959472656, -0.21403884887695312, -0.2077159881591797, -0.20139312744140625, -0.1950702667236328, -0.18874740600585938, -0.18242454528808594, -0.1761016845703125, -0.16977882385253906, -0.16345596313476562, -0.1571331024169922, -0.15081024169921875, -0.1444873809814453, -0.13816452026367188, -0.13184165954589844, -0.125518798828125, -0.11919593811035156, -0.11287307739257812, -0.10655021667480469, -0.10022735595703125, -0.09390449523925781, -0.08758163452148438, -0.08125877380371094, -0.0749359130859375, -0.06861305236816406, -0.062290191650390625, -0.05596733093261719, -0.04964447021484375, -0.04332160949707031, -0.036998748779296875, -0.030675888061523438, -0.02435302734375, -0.018030166625976562, -0.011707305908203125, -0.0053844451904296875, 0.00093841552734375, 0.0072612762451171875, 0.013584136962890625, 0.019906997680664062, 0.0262298583984375, 0.03255271911621094, 0.038875579833984375, 0.04519844055175781, 0.05152130126953125, 0.05784416198730469, 0.06416702270507812, 0.07048988342285156, 0.076812744140625, 0.08313560485839844, 0.08945846557617188, 0.09578132629394531, 0.10210418701171875, 0.10842704772949219, 0.11474990844726562, 0.12107276916503906, 0.1273956298828125, 0.13371849060058594, 0.14004135131835938, 0.1463642120361328, 0.15268707275390625, 0.1590099334716797, 0.16533279418945312, 0.17165565490722656, 0.177978515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 12.0, 17.0, 23.0, 29.0, 70.0, 113.0, 228.0, 200.0, 123.0, 61.0, 32.0, 17.0, 11.0, 11.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1905517578125, -0.18566226959228516, -0.1807727813720703, -0.17588329315185547, -0.17099380493164062, -0.16610431671142578, -0.16121482849121094, -0.1563253402709961, -0.15143585205078125, -0.1465463638305664, -0.14165687561035156, -0.13676738739013672, -0.13187789916992188, -0.12698841094970703, -0.12209892272949219, -0.11720943450927734, -0.1123199462890625, -0.10743045806884766, -0.10254096984863281, -0.09765148162841797, -0.09276199340820312, -0.08787250518798828, -0.08298301696777344, -0.0780935287475586, -0.07320404052734375, -0.0683145523071289, -0.06342506408691406, -0.05853557586669922, -0.053646087646484375, -0.04875659942626953, -0.04386711120605469, -0.038977622985839844, -0.034088134765625, -0.029198646545410156, -0.024309158325195312, -0.01941967010498047, -0.014530181884765625, -0.009640693664550781, -0.0047512054443359375, 0.00013828277587890625, 0.00502777099609375, 0.009917259216308594, 0.014806747436523438, 0.01969623565673828, 0.024585723876953125, 0.02947521209716797, 0.03436470031738281, 0.039254188537597656, 0.0441436767578125, 0.049033164978027344, 0.05392265319824219, 0.05881214141845703, 0.06370162963867188, 0.06859111785888672, 0.07348060607910156, 0.0783700942993164, 0.08325958251953125, 0.0881490707397461, 0.09303855895996094, 0.09792804718017578, 0.10281753540039062, 0.10770702362060547, 0.11259651184082031, 0.11748600006103516, 0.12237548828125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 11.0, 17.0, 25.0, 29.0, 74.0, 134.0, 167.0, 168.0, 128.0, 86.0, 49.0, 26.0, 26.0, 18.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2190868854522705, -1.1799559593200684, -1.1408249139785767, -1.1016939878463745, -1.0625630617141724, -1.0234320163726807, -0.9843010902404785, -0.9451701045036316, -0.9060391187667847, -0.8669081330299377, -0.8277772068977356, -0.7886462211608887, -0.7495152354240417, -0.7103842496871948, -0.6712533235549927, -0.6321223378181458, -0.5929914116859436, -0.5538604259490967, -0.5147294998168945, -0.4755985140800476, -0.4364675283432007, -0.39733657240867615, -0.3582056164741516, -0.3190746307373047, -0.27994367480278015, -0.24081270396709442, -0.2016817331314087, -0.16255077719688416, -0.12341980636119843, -0.0842888355255127, -0.04515787959098816, -0.006026893854141235, 0.0331040620803833, 0.07223503291606903, 0.11136599630117416, 0.1504969596862793, 0.18962793052196503, 0.22875890135765076, 0.2678898572921753, 0.3070208430290222, 0.34615179896354675, 0.3852827548980713, 0.4244137406349182, 0.46354469656944275, 0.5026756525039673, 0.5418066382408142, 0.5809376239776611, 0.6200685501098633, 0.6591995358467102, 0.6983305215835571, 0.7374614477157593, 0.7765924334526062, 0.8157234191894531, 0.8548543453216553, 0.8939853310585022, 0.9331163167953491, 0.9722472429275513, 1.0113781690597534, 1.0505092144012451, 1.0896401405334473, 1.1287710666656494, 1.1679021120071411, 1.2070330381393433, 1.246164083480835, 1.285295009613037]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 5.0, 7.0, 17.0, 10.0, 16.0, 14.0, 29.0, 27.0, 25.0, 37.0, 37.0, 43.0, 38.0, 35.0, 53.0, 32.0, 57.0, 45.0, 53.0, 42.0, 52.0, 38.0, 48.0, 31.0, 44.0, 29.0, 35.0, 18.0, 15.0, 17.0, 9.0, 8.0, 6.0, 8.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4381658434867859, -0.42410337924957275, -0.41004088521003723, -0.3959784209728241, -0.38191595673561096, -0.36785346269607544, -0.3537909984588623, -0.33972853422164917, -0.32566606998443604, -0.3116036057472229, -0.2975411117076874, -0.28347864747047424, -0.2694161832332611, -0.2553536891937256, -0.24129122495651245, -0.22722876071929932, -0.213166281580925, -0.19910380244255066, -0.18504133820533752, -0.1709788590669632, -0.15691639482975006, -0.14285391569137573, -0.1287914514541626, -0.11472897231578827, -0.10066650062799454, -0.0866040289402008, -0.07254155725240707, -0.058479081839323044, -0.04441661015152931, -0.030354134738445282, -0.01629166305065155, -0.0022291913628578186, 0.011833280324935913, 0.025895752012729645, 0.039958223700523376, 0.05402069911360741, 0.06808316707611084, 0.08214564621448517, 0.0962081179022789, 0.11027058959007263, 0.12433306127786636, 0.1383955329656601, 0.15245801210403442, 0.16652047634124756, 0.1805829554796219, 0.19464543461799622, 0.20870789885520935, 0.22277036309242249, 0.23683284223079681, 0.25089532136917114, 0.2649577856063843, 0.2790202498435974, 0.29308274388313293, 0.30714520812034607, 0.3212076723575592, 0.3352701663970947, 0.34933263063430786, 0.363395094871521, 0.3774575889110565, 0.39152005314826965, 0.4055825173854828, 0.4196450114250183, 0.43370747566223145, 0.4477699398994446, 0.4618324041366577]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 10.0, 10.0, 13.0, 28.0, 30.0, 40.0, 78.0, 123.0, 222.0, 417.0, 703.0, 1236.0, 2474.0, 5489.0, 14510.0, 46171.0, 301789.0, 3350145.0, 392775.0, 50868.0, 15512.0, 5937.0, 2629.0, 1352.0, 706.0, 399.0, 223.0, 146.0, 83.0, 50.0, 25.0, 30.0, 15.0, 13.0, 9.0, 11.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12084770202636719, -0.11724472045898438, -0.11364173889160156, -0.11003875732421875, -0.10643577575683594, -0.10283279418945312, -0.09922981262207031, -0.0956268310546875, -0.09202384948730469, -0.08842086791992188, -0.08481788635253906, -0.08121490478515625, -0.07761192321777344, -0.07400894165039062, -0.07040596008300781, -0.066802978515625, -0.06319999694824219, -0.059597015380859375, -0.05599403381347656, -0.05239105224609375, -0.04878807067871094, -0.045185089111328125, -0.04158210754394531, -0.0379791259765625, -0.03437614440917969, -0.030773162841796875, -0.027170181274414062, -0.02356719970703125, -0.019964218139648438, -0.016361236572265625, -0.012758255004882812, -0.0091552734375, -0.0055522918701171875, -0.001949310302734375, 0.0016536712646484375, 0.00525665283203125, 0.008859634399414062, 0.012462615966796875, 0.016065597534179688, 0.0196685791015625, 0.023271560668945312, 0.026874542236328125, 0.030477523803710938, 0.03408050537109375, 0.03768348693847656, 0.041286468505859375, 0.04488945007324219, 0.048492431640625, 0.05209541320800781, 0.055698394775390625, 0.05930137634277344, 0.06290435791015625, 0.06650733947753906, 0.07011032104492188, 0.07371330261230469, 0.0773162841796875, 0.08091926574707031, 0.08452224731445312, 0.08812522888183594, 0.09172821044921875, 0.09533119201660156, 0.09893417358398438, 0.10253715515136719, 0.10614013671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 14.0, 23.0, 35.0, 58.0, 57.0, 100.0, 92.0, 101.0, 117.0, 104.0, 72.0, 92.0, 49.0, 33.0, 20.0, 13.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0626220703125, -0.060461997985839844, -0.05830192565917969, -0.05614185333251953, -0.053981781005859375, -0.05182170867919922, -0.04966163635253906, -0.047501564025878906, -0.04534149169921875, -0.043181419372558594, -0.04102134704589844, -0.03886127471923828, -0.036701202392578125, -0.03454113006591797, -0.03238105773925781, -0.030220985412597656, -0.0280609130859375, -0.025900840759277344, -0.023740768432617188, -0.02158069610595703, -0.019420623779296875, -0.01726055145263672, -0.015100479125976562, -0.012940406799316406, -0.01078033447265625, -0.008620262145996094, -0.0064601898193359375, -0.004300117492675781, -0.002140045166015625, 2.002716064453125e-05, 0.0021800994873046875, 0.004340171813964844, 0.006500244140625, 0.008660316467285156, 0.010820388793945312, 0.012980461120605469, 0.015140533447265625, 0.01730060577392578, 0.019460678100585938, 0.021620750427246094, 0.02378082275390625, 0.025940895080566406, 0.028100967407226562, 0.03026103973388672, 0.032421112060546875, 0.03458118438720703, 0.03674125671386719, 0.038901329040527344, 0.0410614013671875, 0.043221473693847656, 0.04538154602050781, 0.04754161834716797, 0.049701690673828125, 0.05186176300048828, 0.05402183532714844, 0.056181907653808594, 0.05834197998046875, 0.060502052307128906, 0.06266212463378906, 0.06482219696044922, 0.06698226928710938, 0.06914234161376953, 0.07130241394042969, 0.07346248626708984, 0.07562255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 12.0, 9.0, 22.0, 22.0, 39.0, 72.0, 76.0, 114.0, 208.0, 307.0, 531.0, 769.0, 1304.0, 2333.0, 4450.0, 8441.0, 18219.0, 44727.0, 137475.0, 749511.0, 2719995.0, 356378.0, 88681.0, 31928.0, 13739.0, 6590.0, 3472.0, 1905.0, 1090.0, 655.0, 405.0, 282.0, 170.0, 120.0, 70.0, 44.0, 42.0, 25.0, 16.0, 11.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.072998046875, -0.07066726684570312, -0.06833648681640625, -0.06600570678710938, -0.0636749267578125, -0.061344146728515625, -0.05901336669921875, -0.056682586669921875, -0.054351806640625, -0.052021026611328125, -0.04969024658203125, -0.047359466552734375, -0.0450286865234375, -0.042697906494140625, -0.04036712646484375, -0.038036346435546875, -0.03570556640625, -0.033374786376953125, -0.03104400634765625, -0.028713226318359375, -0.0263824462890625, -0.024051666259765625, -0.02172088623046875, -0.019390106201171875, -0.017059326171875, -0.014728546142578125, -0.01239776611328125, -0.010066986083984375, -0.0077362060546875, -0.005405426025390625, -0.00307464599609375, -0.000743865966796875, 0.0015869140625, 0.003917694091796875, 0.00624847412109375, 0.008579254150390625, 0.0109100341796875, 0.013240814208984375, 0.01557159423828125, 0.017902374267578125, 0.020233154296875, 0.022563934326171875, 0.02489471435546875, 0.027225494384765625, 0.0295562744140625, 0.031887054443359375, 0.03421783447265625, 0.036548614501953125, 0.03887939453125, 0.041210174560546875, 0.04354095458984375, 0.045871734619140625, 0.0482025146484375, 0.050533294677734375, 0.05286407470703125, 0.055194854736328125, 0.057525634765625, 0.059856414794921875, 0.06218719482421875, 0.06451797485351562, 0.0668487548828125, 0.06917953491210938, 0.07151031494140625, 0.07384109497070312, 0.076171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 16.0, 11.0, 31.0, 15.0, 28.0, 48.0, 71.0, 127.0, 170.0, 278.0, 500.0, 948.0, 762.0, 361.0, 209.0, 158.0, 85.0, 61.0, 49.0, 35.0, 19.0, 9.0, 16.0, 7.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08953857421875, -0.08687877655029297, -0.08421897888183594, -0.0815591812133789, -0.07889938354492188, -0.07623958587646484, -0.07357978820800781, -0.07091999053955078, -0.06826019287109375, -0.06560039520263672, -0.06294059753417969, -0.060280799865722656, -0.057621002197265625, -0.054961204528808594, -0.05230140686035156, -0.04964160919189453, -0.0469818115234375, -0.04432201385498047, -0.04166221618652344, -0.039002418518066406, -0.036342620849609375, -0.033682823181152344, -0.031023025512695312, -0.02836322784423828, -0.02570343017578125, -0.02304363250732422, -0.020383834838867188, -0.017724037170410156, -0.015064239501953125, -0.012404441833496094, -0.009744644165039062, -0.007084846496582031, -0.004425048828125, -0.0017652511596679688, 0.0008945465087890625, 0.0035543441772460938, 0.006214141845703125, 0.008873939514160156, 0.011533737182617188, 0.014193534851074219, 0.01685333251953125, 0.01951313018798828, 0.022172927856445312, 0.024832725524902344, 0.027492523193359375, 0.030152320861816406, 0.03281211853027344, 0.03547191619873047, 0.0381317138671875, 0.04079151153564453, 0.04345130920410156, 0.046111106872558594, 0.048770904541015625, 0.051430702209472656, 0.05409049987792969, 0.05675029754638672, 0.05941009521484375, 0.06206989288330078, 0.06472969055175781, 0.06738948822021484, 0.07004928588867188, 0.0727090835571289, 0.07536888122558594, 0.07802867889404297, 0.0806884765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 14.0, 16.0, 37.0, 50.0, 101.0, 139.0, 145.0, 141.0, 114.0, 96.0, 54.0, 45.0, 13.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3961721658706665, -0.3748897612094879, -0.3536073565483093, -0.33232492208480835, -0.31104251742362976, -0.28976011276245117, -0.2684776782989502, -0.2471952736377716, -0.22591286897659302, -0.20463046431541443, -0.18334804475307465, -0.16206562519073486, -0.14078322052955627, -0.11950080841779709, -0.0982183963060379, -0.07693597674369812, -0.05565357208251953, -0.034371159970760345, -0.01308874785900116, 0.008193664252758026, 0.029476076364517212, 0.0507584884762764, 0.07204090058803558, 0.09332332015037537, 0.11460572481155396, 0.13588812947273254, 0.15717054903507233, 0.1784529685974121, 0.1997353732585907, 0.2210177779197693, 0.24230019748210907, 0.26358261704444885, 0.28486502170562744, 0.30614742636680603, 0.3274298310279846, 0.3487122654914856, 0.3699946701526642, 0.3912770748138428, 0.41255950927734375, 0.43384191393852234, 0.4551243185997009, 0.4764067232608795, 0.4976891279220581, 0.5189715623855591, 0.5402539968490601, 0.5615363717079163, 0.5828188061714172, 0.6041011810302734, 0.6253836154937744, 0.6466660499572754, 0.6679484248161316, 0.6892308592796326, 0.7105132341384888, 0.7317956686019897, 0.7530781030654907, 0.7743605375289917, 0.7956429123878479, 0.8169253468513489, 0.8382077217102051, 0.859490156173706, 0.880772590637207, 0.9020549654960632, 0.9233373999595642, 0.9446197748184204, 0.9659022092819214]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 7.0, 6.0, 3.0, 9.0, 9.0, 12.0, 19.0, 16.0, 14.0, 19.0, 15.0, 26.0, 18.0, 30.0, 34.0, 32.0, 25.0, 37.0, 52.0, 35.0, 35.0, 35.0, 48.0, 34.0, 39.0, 39.0, 30.0, 30.0, 23.0, 41.0, 31.0, 17.0, 27.0, 23.0, 16.0, 14.0, 17.0, 10.0, 14.0, 15.0, 8.0, 14.0, 8.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2591901421546936, -0.2510605454444885, -0.24293096363544464, -0.23480138182640076, -0.22667178511619568, -0.2185421884059906, -0.21041260659694672, -0.20228302478790283, -0.19415342807769775, -0.18602383136749268, -0.1778942495584488, -0.1697646677494049, -0.16163507103919983, -0.15350547432899475, -0.14537589251995087, -0.13724631071090698, -0.1291167140007019, -0.12098712474107742, -0.11285753548145294, -0.10472794622182846, -0.09659835696220398, -0.0884687677025795, -0.08033917844295502, -0.07220958918333054, -0.06407999992370605, -0.055950410664081573, -0.04782082140445709, -0.03969123214483261, -0.03156164288520813, -0.02343205362558365, -0.015302464365959167, -0.007172875106334686, 0.0009567141532897949, 0.009086303412914276, 0.017215892672538757, 0.02534548193216324, 0.03347507119178772, 0.0416046604514122, 0.04973424971103668, 0.05786383897066116, 0.06599342823028564, 0.07412301748991013, 0.0822526067495346, 0.09038219600915909, 0.09851178526878357, 0.10664137452840805, 0.11477096378803253, 0.12290055304765701, 0.1310301423072815, 0.13915973901748657, 0.14728932082653046, 0.15541890263557434, 0.16354849934577942, 0.1716780960559845, 0.17980767786502838, 0.18793725967407227, 0.19606685638427734, 0.20419645309448242, 0.2123260349035263, 0.2204556167125702, 0.22858521342277527, 0.23671481013298035, 0.24484439194202423, 0.2529739737510681, 0.2611035704612732]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 11.0, 22.0, 24.0, 38.0, 57.0, 89.0, 109.0, 182.0, 296.0, 435.0, 721.0, 1312.0, 2334.0, 4275.0, 8317.0, 17161.0, 38034.0, 90467.0, 214113.0, 323316.0, 196723.0, 82490.0, 34922.0, 16001.0, 7782.0, 3937.0, 2209.0, 1300.0, 630.0, 426.0, 303.0, 165.0, 105.0, 83.0, 45.0, 35.0, 25.0, 18.0, 16.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09210205078125, -0.0891733169555664, -0.08624458312988281, -0.08331584930419922, -0.08038711547851562, -0.07745838165283203, -0.07452964782714844, -0.07160091400146484, -0.06867218017578125, -0.06574344635009766, -0.06281471252441406, -0.05988597869873047, -0.056957244873046875, -0.05402851104736328, -0.05109977722167969, -0.048171043395996094, -0.0452423095703125, -0.042313575744628906, -0.03938484191894531, -0.03645610809326172, -0.033527374267578125, -0.03059864044189453, -0.027669906616210938, -0.024741172790527344, -0.02181243896484375, -0.018883705139160156, -0.015954971313476562, -0.013026237487792969, -0.010097503662109375, -0.007168769836425781, -0.0042400360107421875, -0.0013113021850585938, 0.001617431640625, 0.004546165466308594, 0.0074748992919921875, 0.010403633117675781, 0.013332366943359375, 0.01626110076904297, 0.019189834594726562, 0.022118568420410156, 0.02504730224609375, 0.027976036071777344, 0.030904769897460938, 0.03383350372314453, 0.036762237548828125, 0.03969097137451172, 0.04261970520019531, 0.045548439025878906, 0.0484771728515625, 0.051405906677246094, 0.05433464050292969, 0.05726337432861328, 0.060192108154296875, 0.06312084197998047, 0.06604957580566406, 0.06897830963134766, 0.07190704345703125, 0.07483577728271484, 0.07776451110839844, 0.08069324493408203, 0.08362197875976562, 0.08655071258544922, 0.08947944641113281, 0.0924081802368164, 0.0953369140625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 7.0, 14.0, 16.0, 18.0, 27.0, 44.0, 60.0, 62.0, 76.0, 91.0, 78.0, 98.0, 76.0, 82.0, 66.0, 58.0, 47.0, 33.0, 21.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06295585632324219, -0.060848236083984375, -0.05874061584472656, -0.05663299560546875, -0.05452537536621094, -0.052417755126953125, -0.05031013488769531, -0.0482025146484375, -0.04609489440917969, -0.043987274169921875, -0.04187965393066406, -0.03977203369140625, -0.03766441345214844, -0.035556793212890625, -0.03344917297363281, -0.031341552734375, -0.029233932495117188, -0.027126312255859375, -0.025018692016601562, -0.02291107177734375, -0.020803451538085938, -0.018695831298828125, -0.016588211059570312, -0.0144805908203125, -0.012372970581054688, -0.010265350341796875, -0.008157730102539062, -0.00605010986328125, -0.0039424896240234375, -0.001834869384765625, 0.0002727508544921875, 0.00238037109375, 0.0044879913330078125, 0.006595611572265625, 0.008703231811523438, 0.01081085205078125, 0.012918472290039062, 0.015026092529296875, 0.017133712768554688, 0.0192413330078125, 0.021348953247070312, 0.023456573486328125, 0.025564193725585938, 0.02767181396484375, 0.029779434204101562, 0.031887054443359375, 0.03399467468261719, 0.036102294921875, 0.03820991516113281, 0.040317535400390625, 0.04242515563964844, 0.04453277587890625, 0.04664039611816406, 0.048748016357421875, 0.05085563659667969, 0.0529632568359375, 0.05507087707519531, 0.057178497314453125, 0.05928611755371094, 0.06139373779296875, 0.06350135803222656, 0.06560897827148438, 0.06771659851074219, 0.06982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 7.0, 3.0, 11.0, 16.0, 24.0, 35.0, 53.0, 81.0, 166.0, 278.0, 431.0, 882.0, 1529.0, 3039.0, 6012.0, 13174.0, 31323.0, 85516.0, 266210.0, 396849.0, 153110.0, 51491.0, 20064.0, 8897.0, 4358.0, 2250.0, 1150.0, 609.0, 391.0, 221.0, 130.0, 93.0, 50.0, 32.0, 23.0, 11.0, 8.0, 12.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10385513305664062, -0.10053253173828125, -0.09720993041992188, -0.0938873291015625, -0.09056472778320312, -0.08724212646484375, -0.08391952514648438, -0.080596923828125, -0.07727432250976562, -0.07395172119140625, -0.07062911987304688, -0.0673065185546875, -0.06398391723632812, -0.06066131591796875, -0.057338714599609375, -0.05401611328125, -0.050693511962890625, -0.04737091064453125, -0.044048309326171875, -0.0407257080078125, -0.037403106689453125, -0.03408050537109375, -0.030757904052734375, -0.027435302734375, -0.024112701416015625, -0.02079010009765625, -0.017467498779296875, -0.0141448974609375, -0.010822296142578125, -0.00749969482421875, -0.004177093505859375, -0.0008544921875, 0.002468109130859375, 0.00579071044921875, 0.009113311767578125, 0.0124359130859375, 0.015758514404296875, 0.01908111572265625, 0.022403717041015625, 0.025726318359375, 0.029048919677734375, 0.03237152099609375, 0.035694122314453125, 0.0390167236328125, 0.042339324951171875, 0.04566192626953125, 0.048984527587890625, 0.05230712890625, 0.055629730224609375, 0.05895233154296875, 0.062274932861328125, 0.0655975341796875, 0.06892013549804688, 0.07224273681640625, 0.07556533813476562, 0.078887939453125, 0.08221054077148438, 0.08553314208984375, 0.08885574340820312, 0.0921783447265625, 0.09550094604492188, 0.09882354736328125, 0.10214614868164062, 0.10546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 9.0, 9.0, 8.0, 14.0, 11.0, 18.0, 19.0, 27.0, 40.0, 44.0, 42.0, 58.0, 43.0, 71.0, 56.0, 60.0, 70.0, 52.0, 52.0, 52.0, 47.0, 35.0, 26.0, 16.0, 23.0, 19.0, 15.0, 11.0, 9.0, 9.0, 6.0, 2.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15755748748779297, -0.15312767028808594, -0.1486978530883789, -0.14426803588867188, -0.13983821868896484, -0.1354084014892578, -0.13097858428955078, -0.12654876708984375, -0.12211894989013672, -0.11768913269042969, -0.11325931549072266, -0.10882949829101562, -0.1043996810913086, -0.09996986389160156, -0.09554004669189453, -0.0911102294921875, -0.08668041229248047, -0.08225059509277344, -0.0778207778930664, -0.07339096069335938, -0.06896114349365234, -0.06453132629394531, -0.06010150909423828, -0.05567169189453125, -0.05124187469482422, -0.04681205749511719, -0.042382240295410156, -0.037952423095703125, -0.033522605895996094, -0.029092788696289062, -0.02466297149658203, -0.020233154296875, -0.01580333709716797, -0.011373519897460938, -0.006943702697753906, -0.002513885498046875, 0.0019159317016601562, 0.0063457489013671875, 0.010775566101074219, 0.01520538330078125, 0.01963520050048828, 0.024065017700195312, 0.028494834899902344, 0.032924652099609375, 0.037354469299316406, 0.04178428649902344, 0.04621410369873047, 0.0506439208984375, 0.05507373809814453, 0.05950355529785156, 0.0639333724975586, 0.06836318969726562, 0.07279300689697266, 0.07722282409667969, 0.08165264129638672, 0.08608245849609375, 0.09051227569580078, 0.09494209289550781, 0.09937191009521484, 0.10380172729492188, 0.1082315444946289, 0.11266136169433594, 0.11709117889404297, 0.12152099609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 7.0, 9.0, 12.0, 25.0, 29.0, 51.0, 52.0, 103.0, 131.0, 192.0, 286.0, 358.0, 560.0, 783.0, 1292.0, 1842.0, 2831.0, 4471.0, 7053.0, 12028.0, 20252.0, 39932.0, 92713.0, 243741.0, 337054.0, 153821.0, 59574.0, 28106.0, 15564.0, 9165.0, 5810.0, 3525.0, 2326.0, 1636.0, 1011.0, 727.0, 426.0, 329.0, 215.0, 150.0, 100.0, 71.0, 52.0, 44.0, 34.0, 17.0, 9.0, 13.0, 12.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030853271484375, -0.02986621856689453, -0.028879165649414062, -0.027892112731933594, -0.026905059814453125, -0.025918006896972656, -0.024930953979492188, -0.02394390106201172, -0.02295684814453125, -0.02196979522705078, -0.020982742309570312, -0.019995689392089844, -0.019008636474609375, -0.018021583557128906, -0.017034530639648438, -0.01604747772216797, -0.0150604248046875, -0.014073371887207031, -0.013086318969726562, -0.012099266052246094, -0.011112213134765625, -0.010125160217285156, -0.009138107299804688, -0.008151054382324219, -0.00716400146484375, -0.006176948547363281, -0.0051898956298828125, -0.004202842712402344, -0.003215789794921875, -0.0022287368774414062, -0.0012416839599609375, -0.00025463104248046875, 0.000732421875, 0.0017194747924804688, 0.0027065277099609375, 0.0036935806274414062, 0.004680633544921875, 0.005667686462402344, 0.0066547393798828125, 0.007641792297363281, 0.00862884521484375, 0.009615898132324219, 0.010602951049804688, 0.011590003967285156, 0.012577056884765625, 0.013564109802246094, 0.014551162719726562, 0.015538215637207031, 0.0165252685546875, 0.01751232147216797, 0.018499374389648438, 0.019486427307128906, 0.020473480224609375, 0.021460533142089844, 0.022447586059570312, 0.02343463897705078, 0.02442169189453125, 0.02540874481201172, 0.026395797729492188, 0.027382850646972656, 0.028369903564453125, 0.029356956481933594, 0.030344009399414062, 0.03133106231689453, 0.032318115234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 8.0, 9.0, 11.0, 16.0, 17.0, 22.0, 27.0, 34.0, 48.0, 45.0, 66.0, 66.0, 100.0, 94.0, 82.0, 74.0, 42.0, 38.0, 34.0, 32.0, 20.0, 17.0, 21.0, 12.0, 5.0, 7.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.2928924560546875e-05, -5.153939127922058e-05, -5.014985799789429e-05, -4.876032471656799e-05, -4.73707914352417e-05, -4.5981258153915405e-05, -4.459172487258911e-05, -4.320219159126282e-05, -4.1812658309936523e-05, -4.042312502861023e-05, -3.9033591747283936e-05, -3.764405846595764e-05, -3.625452518463135e-05, -3.4864991903305054e-05, -3.347545862197876e-05, -3.2085925340652466e-05, -3.069639205932617e-05, -2.9306858777999878e-05, -2.7917325496673584e-05, -2.652779221534729e-05, -2.5138258934020996e-05, -2.3748725652694702e-05, -2.2359192371368408e-05, -2.0969659090042114e-05, -1.958012580871582e-05, -1.8190592527389526e-05, -1.6801059246063232e-05, -1.541152596473694e-05, -1.4021992683410645e-05, -1.263245940208435e-05, -1.1242926120758057e-05, -9.853392839431763e-06, -8.463859558105469e-06, -7.074326276779175e-06, -5.684792995452881e-06, -4.295259714126587e-06, -2.905726432800293e-06, -1.516193151473999e-06, -1.2665987014770508e-07, 1.2628734111785889e-06, 2.652406692504883e-06, 4.041939973831177e-06, 5.431473255157471e-06, 6.821006536483765e-06, 8.210539817810059e-06, 9.600073099136353e-06, 1.0989606380462646e-05, 1.237913966178894e-05, 1.3768672943115234e-05, 1.5158206224441528e-05, 1.6547739505767822e-05, 1.7937272787094116e-05, 1.932680606842041e-05, 2.0716339349746704e-05, 2.2105872631072998e-05, 2.3495405912399292e-05, 2.4884939193725586e-05, 2.627447247505188e-05, 2.7664005756378174e-05, 2.9053539037704468e-05, 3.0443072319030762e-05, 3.1832605600357056e-05, 3.322213888168335e-05, 3.4611672163009644e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 12.0, 8.0, 4.0, 16.0, 16.0, 28.0, 27.0, 49.0, 85.0, 133.0, 223.0, 330.0, 645.0, 1133.0, 2201.0, 4570.0, 9957.0, 23924.0, 71214.0, 265664.0, 445240.0, 149517.0, 43261.0, 16154.0, 6938.0, 3312.0, 1638.0, 895.0, 523.0, 298.0, 193.0, 123.0, 83.0, 56.0, 24.0, 16.0, 15.0, 9.0, 8.0, 8.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04400634765625, -0.04259967803955078, -0.04119300842285156, -0.039786338806152344, -0.038379669189453125, -0.036972999572753906, -0.03556632995605469, -0.03415966033935547, -0.03275299072265625, -0.03134632110595703, -0.029939651489257812, -0.028532981872558594, -0.027126312255859375, -0.025719642639160156, -0.024312973022460938, -0.02290630340576172, -0.0214996337890625, -0.02009296417236328, -0.018686294555664062, -0.017279624938964844, -0.015872955322265625, -0.014466285705566406, -0.013059616088867188, -0.011652946472167969, -0.01024627685546875, -0.008839607238769531, -0.0074329376220703125, -0.006026268005371094, -0.004619598388671875, -0.0032129287719726562, -0.0018062591552734375, -0.00039958953857421875, 0.001007080078125, 0.0024137496948242188, 0.0038204193115234375, 0.005227088928222656, 0.006633758544921875, 0.008040428161621094, 0.009447097778320312, 0.010853767395019531, 0.01226043701171875, 0.013667106628417969, 0.015073776245117188, 0.016480445861816406, 0.017887115478515625, 0.019293785095214844, 0.020700454711914062, 0.02210712432861328, 0.0235137939453125, 0.02492046356201172, 0.026327133178710938, 0.027733802795410156, 0.029140472412109375, 0.030547142028808594, 0.03195381164550781, 0.03336048126220703, 0.03476715087890625, 0.03617382049560547, 0.03758049011230469, 0.038987159729003906, 0.040393829345703125, 0.041800498962402344, 0.04320716857910156, 0.04461383819580078, 0.0460205078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 15.0, 15.0, 21.0, 36.0, 42.0, 39.0, 79.0, 84.0, 85.0, 99.0, 94.0, 90.0, 72.0, 35.0, 37.0, 24.0, 28.0, 14.0, 12.0, 6.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054107666015625, -0.05243062973022461, -0.05075359344482422, -0.04907655715942383, -0.04739952087402344, -0.04572248458862305, -0.044045448303222656, -0.042368412017822266, -0.040691375732421875, -0.039014339447021484, -0.037337303161621094, -0.0356602668762207, -0.03398323059082031, -0.03230619430541992, -0.03062915802001953, -0.02895212173461914, -0.02727508544921875, -0.02559804916381836, -0.02392101287841797, -0.022243976593017578, -0.020566940307617188, -0.018889904022216797, -0.017212867736816406, -0.015535831451416016, -0.013858795166015625, -0.012181758880615234, -0.010504722595214844, -0.008827686309814453, -0.0071506500244140625, -0.005473613739013672, -0.0037965774536132812, -0.0021195411682128906, -0.0004425048828125, 0.0012345314025878906, 0.0029115676879882812, 0.004588603973388672, 0.0062656402587890625, 0.007942676544189453, 0.009619712829589844, 0.011296749114990234, 0.012973785400390625, 0.014650821685791016, 0.016327857971191406, 0.018004894256591797, 0.019681930541992188, 0.021358966827392578, 0.02303600311279297, 0.02471303939819336, 0.02639007568359375, 0.02806711196899414, 0.02974414825439453, 0.03142118453979492, 0.03309822082519531, 0.0347752571105957, 0.036452293395996094, 0.038129329681396484, 0.039806365966796875, 0.041483402252197266, 0.043160438537597656, 0.04483747482299805, 0.04651451110839844, 0.04819154739379883, 0.04986858367919922, 0.05154561996459961, 0.05322265625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 27.0, 40.0, 82.0, 145.0, 170.0, 164.0, 152.0, 92.0, 46.0, 25.0, 13.0, 11.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8332950472831726, -0.8010374903678894, -0.7687799334526062, -0.736522376537323, -0.7042648196220398, -0.6720072627067566, -0.6397497057914734, -0.6074921488761902, -0.575234591960907, -0.5429770350456238, -0.5107194781303406, -0.4784619212150574, -0.44620436429977417, -0.41394680738449097, -0.38168925046920776, -0.34943169355392456, -0.31717413663864136, -0.28491657972335815, -0.25265902280807495, -0.22040146589279175, -0.18814390897750854, -0.15588635206222534, -0.12362879514694214, -0.09137123823165894, -0.05911368131637573, -0.02685612440109253, 0.005401432514190674, 0.03765898942947388, 0.06991654634475708, 0.10217410326004028, 0.1344316601753235, 0.1666892170906067, 0.19894683361053467, 0.23120439052581787, 0.2634619474411011, 0.2957195043563843, 0.3279770612716675, 0.3602346181869507, 0.3924921751022339, 0.4247497320175171, 0.4570072889328003, 0.4892648458480835, 0.5215224027633667, 0.5537799596786499, 0.5860375165939331, 0.6182950735092163, 0.6505526304244995, 0.6828101873397827, 0.7150677442550659, 0.7473253011703491, 0.7795828580856323, 0.8118404150009155, 0.8440979719161987, 0.8763555288314819, 0.9086130857467651, 0.9408706426620483, 0.9731281995773315, 1.0053857564926147, 1.037643313407898, 1.0699008703231812, 1.1021584272384644, 1.1344159841537476, 1.1666735410690308, 1.198931097984314, 1.2311886548995972]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 4.0, 10.0, 17.0, 15.0, 7.0, 14.0, 21.0, 20.0, 30.0, 27.0, 27.0, 27.0, 35.0, 32.0, 38.0, 32.0, 45.0, 39.0, 42.0, 43.0, 42.0, 32.0, 47.0, 40.0, 35.0, 26.0, 19.0, 30.0, 19.0, 40.0, 20.0, 12.0, 19.0, 15.0, 10.0, 11.0, 10.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.33496761322021484, -0.32481276988983154, -0.31465792655944824, -0.30450308322906494, -0.29434823989868164, -0.28419339656829834, -0.27403855323791504, -0.26388370990753174, -0.25372886657714844, -0.24357402324676514, -0.23341917991638184, -0.22326433658599854, -0.21310949325561523, -0.20295464992523193, -0.19279980659484863, -0.18264496326446533, -0.17249010503292084, -0.16233526170253754, -0.15218041837215424, -0.14202557504177094, -0.13187073171138763, -0.12171588838100433, -0.11156103760004044, -0.10140619426965714, -0.09125135093927383, -0.08109650760889053, -0.07094166427850723, -0.06078681722283363, -0.05063197389245033, -0.04047713056206703, -0.030322283506393433, -0.020167440176010132, -0.010012596845626831, 0.00014224741607904434, 0.01029709167778492, 0.02045193687081337, 0.03060678020119667, 0.04076162353157997, 0.05091647058725357, 0.06107131391763687, 0.07122615724802017, 0.08138100057840347, 0.09153584390878677, 0.10169069468975067, 0.11184553802013397, 0.12200038135051727, 0.13215522468090057, 0.14231006801128387, 0.15246491134166718, 0.16261975467205048, 0.17277459800243378, 0.18292944133281708, 0.19308428466320038, 0.20323912799358368, 0.21339398622512817, 0.22354882955551147, 0.23370367288589478, 0.24385851621627808, 0.2540133595466614, 0.2641682028770447, 0.274323046207428, 0.2844778895378113, 0.2946327328681946, 0.3047875761985779, 0.3149424195289612]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 13.0, 16.0, 27.0, 48.0, 96.0, 166.0, 360.0, 717.0, 1584.0, 4048.0, 11620.0, 43989.0, 401609.0, 3360010.0, 314181.0, 38726.0, 10508.0, 3822.0, 1440.0, 600.0, 318.0, 138.0, 90.0, 38.0, 30.0, 15.0, 10.0, 9.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12363338470458984, -0.11970329284667969, -0.11577320098876953, -0.11184310913085938, -0.10791301727294922, -0.10398292541503906, -0.1000528335571289, -0.09612274169921875, -0.0921926498413086, -0.08826255798339844, -0.08433246612548828, -0.08040237426757812, -0.07647228240966797, -0.07254219055175781, -0.06861209869384766, -0.0646820068359375, -0.060751914978027344, -0.05682182312011719, -0.05289173126220703, -0.048961639404296875, -0.04503154754638672, -0.04110145568847656, -0.037171363830566406, -0.03324127197265625, -0.029311180114746094, -0.025381088256835938, -0.02145099639892578, -0.017520904541015625, -0.013590812683105469, -0.009660720825195312, -0.005730628967285156, -0.001800537109375, 0.0021295547485351562, 0.0060596466064453125, 0.009989738464355469, 0.013919830322265625, 0.01784992218017578, 0.021780014038085938, 0.025710105895996094, 0.02964019775390625, 0.033570289611816406, 0.03750038146972656, 0.04143047332763672, 0.045360565185546875, 0.04929065704345703, 0.05322074890136719, 0.057150840759277344, 0.0610809326171875, 0.06501102447509766, 0.06894111633300781, 0.07287120819091797, 0.07680130004882812, 0.08073139190673828, 0.08466148376464844, 0.0885915756225586, 0.09252166748046875, 0.0964517593383789, 0.10038185119628906, 0.10431194305419922, 0.10824203491210938, 0.11217212677001953, 0.11610221862792969, 0.12003231048583984, 0.12396240234375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 8.0, 8.0, 16.0, 35.0, 27.0, 46.0, 56.0, 62.0, 63.0, 83.0, 72.0, 84.0, 68.0, 92.0, 74.0, 53.0, 38.0, 39.0, 24.0, 23.0, 11.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0615234375, -0.05948066711425781, -0.057437896728515625, -0.05539512634277344, -0.05335235595703125, -0.05130958557128906, -0.049266815185546875, -0.04722404479980469, -0.0451812744140625, -0.04313850402832031, -0.041095733642578125, -0.03905296325683594, -0.03701019287109375, -0.03496742248535156, -0.032924652099609375, -0.030881881713867188, -0.028839111328125, -0.026796340942382812, -0.024753570556640625, -0.022710800170898438, -0.02066802978515625, -0.018625259399414062, -0.016582489013671875, -0.014539718627929688, -0.0124969482421875, -0.010454177856445312, -0.008411407470703125, -0.0063686370849609375, -0.00432586669921875, -0.0022830963134765625, -0.000240325927734375, 0.0018024444580078125, 0.00384521484375, 0.0058879852294921875, 0.007930755615234375, 0.009973526000976562, 0.01201629638671875, 0.014059066772460938, 0.016101837158203125, 0.018144607543945312, 0.0201873779296875, 0.022230148315429688, 0.024272918701171875, 0.026315689086914062, 0.02835845947265625, 0.030401229858398438, 0.032444000244140625, 0.03448677062988281, 0.036529541015625, 0.03857231140136719, 0.040615081787109375, 0.04265785217285156, 0.04470062255859375, 0.04674339294433594, 0.048786163330078125, 0.05082893371582031, 0.0528717041015625, 0.05491447448730469, 0.056957244873046875, 0.05900001525878906, 0.06104278564453125, 0.06308555603027344, 0.06512832641601562, 0.06717109680175781, 0.0692138671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 13.0, 16.0, 29.0, 42.0, 50.0, 78.0, 124.0, 189.0, 274.0, 405.0, 635.0, 1030.0, 1692.0, 2758.0, 4907.0, 8724.0, 17208.0, 36746.0, 94399.0, 376144.0, 2704730.0, 714921.0, 134848.0, 48000.0, 21556.0, 10740.0, 5696.0, 3212.0, 1825.0, 1202.0, 716.0, 439.0, 334.0, 200.0, 141.0, 81.0, 52.0, 36.0, 31.0, 13.0, 16.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07293701171875, -0.07070350646972656, -0.06847000122070312, -0.06623649597167969, -0.06400299072265625, -0.06176948547363281, -0.059535980224609375, -0.05730247497558594, -0.0550689697265625, -0.05283546447753906, -0.050601959228515625, -0.04836845397949219, -0.04613494873046875, -0.04390144348144531, -0.041667938232421875, -0.03943443298339844, -0.037200927734375, -0.03496742248535156, -0.032733917236328125, -0.030500411987304688, -0.02826690673828125, -0.026033401489257812, -0.023799896240234375, -0.021566390991210938, -0.0193328857421875, -0.017099380493164062, -0.014865875244140625, -0.012632369995117188, -0.01039886474609375, -0.008165359497070312, -0.005931854248046875, -0.0036983489990234375, -0.00146484375, 0.0007686614990234375, 0.003002166748046875, 0.0052356719970703125, 0.00746917724609375, 0.009702682495117188, 0.011936187744140625, 0.014169692993164062, 0.0164031982421875, 0.018636703491210938, 0.020870208740234375, 0.023103713989257812, 0.02533721923828125, 0.027570724487304688, 0.029804229736328125, 0.03203773498535156, 0.034271240234375, 0.03650474548339844, 0.038738250732421875, 0.04097175598144531, 0.04320526123046875, 0.04543876647949219, 0.047672271728515625, 0.04990577697753906, 0.0521392822265625, 0.05437278747558594, 0.056606292724609375, 0.05883979797363281, 0.06107330322265625, 0.06330680847167969, 0.06554031372070312, 0.06777381896972656, 0.07000732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 16.0, 19.0, 27.0, 41.0, 49.0, 68.0, 96.0, 174.0, 312.0, 624.0, 987.0, 691.0, 326.0, 178.0, 131.0, 85.0, 50.0, 42.0, 25.0, 31.0, 13.0, 12.0, 13.0, 11.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.106201171875, -0.10312652587890625, -0.1000518798828125, -0.09697723388671875, -0.093902587890625, -0.09082794189453125, -0.0877532958984375, -0.08467864990234375, -0.08160400390625, -0.07852935791015625, -0.0754547119140625, -0.07238006591796875, -0.069305419921875, -0.06623077392578125, -0.0631561279296875, -0.06008148193359375, -0.0570068359375, -0.05393218994140625, -0.0508575439453125, -0.04778289794921875, -0.044708251953125, -0.04163360595703125, -0.0385589599609375, -0.03548431396484375, -0.03240966796875, -0.02933502197265625, -0.0262603759765625, -0.02318572998046875, -0.020111083984375, -0.01703643798828125, -0.0139617919921875, -0.01088714599609375, -0.0078125, -0.00473785400390625, -0.0016632080078125, 0.00141143798828125, 0.004486083984375, 0.00756072998046875, 0.0106353759765625, 0.01371002197265625, 0.01678466796875, 0.01985931396484375, 0.0229339599609375, 0.02600860595703125, 0.029083251953125, 0.03215789794921875, 0.0352325439453125, 0.03830718994140625, 0.0413818359375, 0.04445648193359375, 0.0475311279296875, 0.05060577392578125, 0.053680419921875, 0.05675506591796875, 0.0598297119140625, 0.06290435791015625, 0.06597900390625, 0.06905364990234375, 0.0721282958984375, 0.07520294189453125, 0.078277587890625, 0.08135223388671875, 0.0844268798828125, 0.08750152587890625, 0.090576171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 15.0, 9.0, 22.0, 37.0, 53.0, 85.0, 136.0, 116.0, 117.0, 127.0, 93.0, 54.0, 35.0, 36.0, 11.0, 12.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43688398599624634, -0.4169860780239105, -0.3970881700515747, -0.3771902918815613, -0.35729238390922546, -0.33739447593688965, -0.3174965977668762, -0.2975986897945404, -0.2777007818222046, -0.2578028738498688, -0.23790498077869415, -0.21800708770751953, -0.19810917973518372, -0.1782112717628479, -0.15831337869167328, -0.13841548562049866, -0.11851757764816284, -0.09861967712640762, -0.0787217766046524, -0.058823876082897186, -0.03892597556114197, -0.01902807503938675, 0.0008698254823684692, 0.02076771855354309, 0.040665626525878906, 0.060563527047634125, 0.08046142756938934, 0.10035932809114456, 0.12025722861289978, 0.1401551365852356, 0.16005302965641022, 0.17995092272758484, 0.19984877109527588, 0.2197466790676117, 0.23964457213878632, 0.25954246520996094, 0.27944037318229675, 0.29933828115463257, 0.319236159324646, 0.3391340672969818, 0.3590319752693176, 0.37892988324165344, 0.39882779121398926, 0.4187256693840027, 0.4386235773563385, 0.4585214853286743, 0.47841936349868774, 0.49831727147102356, 0.5182151794433594, 0.5381130576133728, 0.558010995388031, 0.5779088735580444, 0.5978068113327026, 0.6177046895027161, 0.6376025676727295, 0.6575005054473877, 0.6773983836174011, 0.6972962617874146, 0.7171941995620728, 0.7370920777320862, 0.7569899559020996, 0.7768878936767578, 0.7967857718467712, 0.8166836500167847, 0.8365815877914429]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 14.0, 9.0, 17.0, 19.0, 20.0, 28.0, 29.0, 34.0, 37.0, 42.0, 43.0, 35.0, 47.0, 58.0, 46.0, 38.0, 32.0, 31.0, 43.0, 40.0, 37.0, 26.0, 28.0, 46.0, 28.0, 22.0, 23.0, 27.0, 23.0, 8.0, 19.0, 10.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28855353593826294, -0.2785467505455017, -0.2685399353504181, -0.25853314995765686, -0.24852633476257324, -0.23851953446865082, -0.2285127341747284, -0.21850594878196716, -0.20849913358688354, -0.19849233329296112, -0.1884855329990387, -0.17847873270511627, -0.16847193241119385, -0.15846513211727142, -0.148458331823349, -0.13845154643058777, -0.12844474613666534, -0.11843794584274292, -0.1084311455488205, -0.09842434525489807, -0.08841754496097565, -0.07841074466705322, -0.0684039518237114, -0.05839715152978897, -0.04839035123586655, -0.03838355094194412, -0.028376752510666847, -0.018369954079389572, -0.008363153785467148, 0.0016436465084552765, 0.011650443077087402, 0.021657243371009827, 0.03166404366493225, 0.041670843958854675, 0.0516776442527771, 0.061684440821409225, 0.07169124484062195, 0.08169804513454437, 0.0917048379778862, 0.10171163827180862, 0.11171843856573105, 0.12172523885965347, 0.1317320317029953, 0.14173883199691772, 0.15174563229084015, 0.16175243258476257, 0.171759232878685, 0.18176603317260742, 0.19177283346652985, 0.20177963376045227, 0.2117864340543747, 0.22179323434829712, 0.23180003464221954, 0.24180683493614197, 0.2518136203289032, 0.2618204355239868, 0.27182722091674805, 0.2818340063095093, 0.2918408215045929, 0.3018476068973541, 0.31185442209243774, 0.321861207485199, 0.3318680226802826, 0.3418748080730438, 0.35188162326812744]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 10.0, 17.0, 18.0, 39.0, 50.0, 91.0, 112.0, 167.0, 266.0, 425.0, 723.0, 1211.0, 2164.0, 3935.0, 7215.0, 13647.0, 27155.0, 56742.0, 121500.0, 238082.0, 273867.0, 155789.0, 73413.0, 34714.0, 16966.0, 8868.0, 4922.0, 2665.0, 1494.0, 853.0, 519.0, 349.0, 187.0, 123.0, 73.0, 64.0, 27.0, 26.0, 17.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.06998825073242188, -0.06758880615234375, -0.06518936157226562, -0.0627899169921875, -0.060390472412109375, -0.05799102783203125, -0.055591583251953125, -0.053192138671875, -0.050792694091796875, -0.04839324951171875, -0.045993804931640625, -0.0435943603515625, -0.041194915771484375, -0.03879547119140625, -0.036396026611328125, -0.03399658203125, -0.031597137451171875, -0.02919769287109375, -0.026798248291015625, -0.0243988037109375, -0.021999359130859375, -0.01959991455078125, -0.017200469970703125, -0.014801025390625, -0.012401580810546875, -0.01000213623046875, -0.007602691650390625, -0.0052032470703125, -0.002803802490234375, -0.00040435791015625, 0.001995086669921875, 0.00439453125, 0.006793975830078125, 0.00919342041015625, 0.011592864990234375, 0.0139923095703125, 0.016391754150390625, 0.01879119873046875, 0.021190643310546875, 0.023590087890625, 0.025989532470703125, 0.02838897705078125, 0.030788421630859375, 0.0331878662109375, 0.035587310791015625, 0.03798675537109375, 0.040386199951171875, 0.04278564453125, 0.045185089111328125, 0.04758453369140625, 0.049983978271484375, 0.0523834228515625, 0.054782867431640625, 0.05718231201171875, 0.059581756591796875, 0.061981201171875, 0.06438064575195312, 0.06678009033203125, 0.06917953491210938, 0.0715789794921875, 0.07397842407226562, 0.07637786865234375, 0.07877731323242188, 0.0811767578125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 4.0, 11.0, 14.0, 20.0, 25.0, 41.0, 44.0, 53.0, 48.0, 54.0, 70.0, 58.0, 65.0, 68.0, 62.0, 63.0, 57.0, 47.0, 47.0, 28.0, 32.0, 19.0, 16.0, 15.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056610107421875, -0.054692745208740234, -0.05277538299560547, -0.0508580207824707, -0.04894065856933594, -0.04702329635620117, -0.045105934143066406, -0.04318857192993164, -0.041271209716796875, -0.03935384750366211, -0.037436485290527344, -0.03551912307739258, -0.03360176086425781, -0.03168439865112305, -0.02976703643798828, -0.027849674224853516, -0.02593231201171875, -0.024014949798583984, -0.02209758758544922, -0.020180225372314453, -0.018262863159179688, -0.016345500946044922, -0.014428138732910156, -0.01251077651977539, -0.010593414306640625, -0.00867605209350586, -0.006758689880371094, -0.004841327667236328, -0.0029239654541015625, -0.0010066032409667969, 0.0009107589721679688, 0.0028281211853027344, 0.0047454833984375, 0.006662845611572266, 0.008580207824707031, 0.010497570037841797, 0.012414932250976562, 0.014332294464111328, 0.016249656677246094, 0.01816701889038086, 0.020084381103515625, 0.02200174331665039, 0.023919105529785156, 0.025836467742919922, 0.027753829956054688, 0.029671192169189453, 0.03158855438232422, 0.033505916595458984, 0.03542327880859375, 0.037340641021728516, 0.03925800323486328, 0.04117536544799805, 0.04309272766113281, 0.04501008987426758, 0.046927452087402344, 0.04884481430053711, 0.050762176513671875, 0.05267953872680664, 0.054596900939941406, 0.05651426315307617, 0.05843162536621094, 0.0603489875793457, 0.06226634979248047, 0.06418371200561523, 0.06610107421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 14.0, 8.0, 20.0, 16.0, 29.0, 53.0, 52.0, 119.0, 168.0, 280.0, 436.0, 775.0, 1372.0, 2488.0, 4609.0, 9359.0, 20640.0, 51974.0, 154214.0, 429455.0, 241025.0, 76934.0, 28800.0, 12571.0, 5841.0, 3112.0, 1712.0, 992.0, 572.0, 310.0, 204.0, 111.0, 81.0, 55.0, 42.0, 25.0, 23.0, 17.0, 5.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10910606384277344, -0.10566329956054688, -0.10222053527832031, -0.09877777099609375, -0.09533500671386719, -0.09189224243164062, -0.08844947814941406, -0.0850067138671875, -0.08156394958496094, -0.07812118530273438, -0.07467842102050781, -0.07123565673828125, -0.06779289245605469, -0.06435012817382812, -0.06090736389160156, -0.057464599609375, -0.05402183532714844, -0.050579071044921875, -0.04713630676269531, -0.04369354248046875, -0.04025077819824219, -0.036808013916015625, -0.03336524963378906, -0.0299224853515625, -0.026479721069335938, -0.023036956787109375, -0.019594192504882812, -0.01615142822265625, -0.012708663940429688, -0.009265899658203125, -0.0058231353759765625, -0.00238037109375, 0.0010623931884765625, 0.004505157470703125, 0.007947921752929688, 0.01139068603515625, 0.014833450317382812, 0.018276214599609375, 0.021718978881835938, 0.0251617431640625, 0.028604507446289062, 0.032047271728515625, 0.03549003601074219, 0.03893280029296875, 0.04237556457519531, 0.045818328857421875, 0.04926109313964844, 0.052703857421875, 0.05614662170410156, 0.059589385986328125, 0.06303215026855469, 0.06647491455078125, 0.06991767883300781, 0.07336044311523438, 0.07680320739746094, 0.0802459716796875, 0.08368873596191406, 0.08713150024414062, 0.09057426452636719, 0.09401702880859375, 0.09745979309082031, 0.10090255737304688, 0.10434532165527344, 0.1077880859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 7.0, 8.0, 12.0, 15.0, 16.0, 19.0, 30.0, 29.0, 53.0, 49.0, 34.0, 46.0, 58.0, 67.0, 69.0, 60.0, 60.0, 48.0, 44.0, 46.0, 39.0, 35.0, 31.0, 18.0, 17.0, 17.0, 12.0, 8.0, 6.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1761474609375, -0.1710338592529297, -0.16592025756835938, -0.16080665588378906, -0.15569305419921875, -0.15057945251464844, -0.14546585083007812, -0.1403522491455078, -0.1352386474609375, -0.1301250457763672, -0.12501144409179688, -0.11989784240722656, -0.11478424072265625, -0.10967063903808594, -0.10455703735351562, -0.09944343566894531, -0.094329833984375, -0.08921623229980469, -0.08410263061523438, -0.07898902893066406, -0.07387542724609375, -0.06876182556152344, -0.06364822387695312, -0.05853462219238281, -0.0534210205078125, -0.04830741882324219, -0.043193817138671875, -0.03808021545410156, -0.03296661376953125, -0.027853012084960938, -0.022739410400390625, -0.017625808715820312, -0.01251220703125, -0.0073986053466796875, -0.002285003662109375, 0.0028285980224609375, 0.00794219970703125, 0.013055801391601562, 0.018169403076171875, 0.023283004760742188, 0.0283966064453125, 0.03351020812988281, 0.038623809814453125, 0.04373741149902344, 0.04885101318359375, 0.05396461486816406, 0.059078216552734375, 0.06419181823730469, 0.069305419921875, 0.07441902160644531, 0.07953262329101562, 0.08464622497558594, 0.08975982666015625, 0.09487342834472656, 0.09998703002929688, 0.10510063171386719, 0.1102142333984375, 0.11532783508300781, 0.12044143676757812, 0.12555503845214844, 0.13066864013671875, 0.13578224182128906, 0.14089584350585938, 0.1460094451904297, 0.151123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 10.0, 15.0, 26.0, 31.0, 54.0, 67.0, 108.0, 138.0, 220.0, 351.0, 561.0, 851.0, 1502.0, 2565.0, 4645.0, 9494.0, 21617.0, 60771.0, 219248.0, 480759.0, 162695.0, 47133.0, 17812.0, 8048.0, 4083.0, 2232.0, 1279.0, 780.0, 480.0, 308.0, 195.0, 138.0, 110.0, 85.0, 33.0, 27.0, 18.0, 17.0, 14.0, 7.0, 2.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.034844398498535156, -0.03361701965332031, -0.03238964080810547, -0.031162261962890625, -0.02993488311767578, -0.028707504272460938, -0.027480125427246094, -0.02625274658203125, -0.025025367736816406, -0.023797988891601562, -0.02257061004638672, -0.021343231201171875, -0.02011585235595703, -0.018888473510742188, -0.017661094665527344, -0.0164337158203125, -0.015206336975097656, -0.013978958129882812, -0.012751579284667969, -0.011524200439453125, -0.010296821594238281, -0.009069442749023438, -0.007842063903808594, -0.00661468505859375, -0.005387306213378906, -0.0041599273681640625, -0.0029325485229492188, -0.001705169677734375, -0.00047779083251953125, 0.0007495880126953125, 0.0019769668579101562, 0.003204345703125, 0.004431724548339844, 0.0056591033935546875, 0.006886482238769531, 0.008113861083984375, 0.009341239929199219, 0.010568618774414062, 0.011795997619628906, 0.01302337646484375, 0.014250755310058594, 0.015478134155273438, 0.01670551300048828, 0.017932891845703125, 0.01916027069091797, 0.020387649536132812, 0.021615028381347656, 0.0228424072265625, 0.024069786071777344, 0.025297164916992188, 0.02652454376220703, 0.027751922607421875, 0.02897930145263672, 0.030206680297851562, 0.031434059143066406, 0.03266143798828125, 0.033888816833496094, 0.03511619567871094, 0.03634357452392578, 0.037570953369140625, 0.03879833221435547, 0.04002571105957031, 0.041253089904785156, 0.04248046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 4.0, 8.0, 6.0, 7.0, 13.0, 8.0, 24.0, 21.0, 33.0, 24.0, 39.0, 35.0, 45.0, 51.0, 56.0, 78.0, 61.0, 76.0, 61.0, 58.0, 53.0, 50.0, 36.0, 22.0, 26.0, 22.0, 22.0, 13.0, 16.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.999471664428711e-05, -3.863032907247543e-05, -3.726594150066376e-05, -3.590155392885208e-05, -3.4537166357040405e-05, -3.317277878522873e-05, -3.180839121341705e-05, -3.0444003641605377e-05, -2.90796160697937e-05, -2.7715228497982025e-05, -2.635084092617035e-05, -2.4986453354358673e-05, -2.3622065782546997e-05, -2.225767821073532e-05, -2.0893290638923645e-05, -1.952890306711197e-05, -1.8164515495300293e-05, -1.6800127923488617e-05, -1.543574035167694e-05, -1.4071352779865265e-05, -1.2706965208053589e-05, -1.1342577636241913e-05, -9.978190064430237e-06, -8.61380249261856e-06, -7.249414920806885e-06, -5.885027348995209e-06, -4.520639777183533e-06, -3.1562522053718567e-06, -1.7918646335601807e-06, -4.2747706174850464e-07, 9.369105100631714e-07, 2.3012980818748474e-06, 3.6656856536865234e-06, 5.0300732254981995e-06, 6.3944607973098755e-06, 7.758848369121552e-06, 9.123235940933228e-06, 1.0487623512744904e-05, 1.185201108455658e-05, 1.3216398656368256e-05, 1.4580786228179932e-05, 1.5945173799991608e-05, 1.7309561371803284e-05, 1.867394894361496e-05, 2.0038336515426636e-05, 2.1402724087238312e-05, 2.2767111659049988e-05, 2.4131499230861664e-05, 2.549588680267334e-05, 2.6860274374485016e-05, 2.8224661946296692e-05, 2.9589049518108368e-05, 3.0953437089920044e-05, 3.231782466173172e-05, 3.3682212233543396e-05, 3.504659980535507e-05, 3.641098737716675e-05, 3.7775374948978424e-05, 3.91397625207901e-05, 4.0504150092601776e-05, 4.186853766441345e-05, 4.323292523622513e-05, 4.4597312808036804e-05, 4.596170037984848e-05, 4.7326087951660156e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 11.0, 14.0, 14.0, 19.0, 24.0, 54.0, 55.0, 84.0, 140.0, 262.0, 406.0, 803.0, 1381.0, 2511.0, 5144.0, 11549.0, 27556.0, 78636.0, 250657.0, 430372.0, 153850.0, 49937.0, 18845.0, 8065.0, 3829.0, 1905.0, 984.0, 564.0, 329.0, 211.0, 120.0, 83.0, 65.0, 26.0, 14.0, 14.0, 10.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.038726806640625, -0.037659645080566406, -0.03659248352050781, -0.03552532196044922, -0.034458160400390625, -0.03339099884033203, -0.03232383728027344, -0.031256675720214844, -0.03018951416015625, -0.029122352600097656, -0.028055191040039062, -0.02698802947998047, -0.025920867919921875, -0.02485370635986328, -0.023786544799804688, -0.022719383239746094, -0.0216522216796875, -0.020585060119628906, -0.019517898559570312, -0.01845073699951172, -0.017383575439453125, -0.01631641387939453, -0.015249252319335938, -0.014182090759277344, -0.01311492919921875, -0.012047767639160156, -0.010980606079101562, -0.009913444519042969, -0.008846282958984375, -0.007779121398925781, -0.0067119598388671875, -0.005644798278808594, -0.00457763671875, -0.0035104751586914062, -0.0024433135986328125, -0.0013761520385742188, -0.000308990478515625, 0.0007581710815429688, 0.0018253326416015625, 0.0028924942016601562, 0.00395965576171875, 0.005026817321777344, 0.0060939788818359375, 0.007161140441894531, 0.008228302001953125, 0.009295463562011719, 0.010362625122070312, 0.011429786682128906, 0.0124969482421875, 0.013564109802246094, 0.014631271362304688, 0.01569843292236328, 0.016765594482421875, 0.01783275604248047, 0.018899917602539062, 0.019967079162597656, 0.02103424072265625, 0.022101402282714844, 0.023168563842773438, 0.02423572540283203, 0.025302886962890625, 0.02637004852294922, 0.027437210083007812, 0.028504371643066406, 0.029571533203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 2.0, 14.0, 23.0, 23.0, 31.0, 46.0, 69.0, 107.0, 132.0, 100.0, 119.0, 91.0, 72.0, 43.0, 35.0, 22.0, 15.0, 12.0, 5.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0582275390625, -0.056382179260253906, -0.05453681945800781, -0.05269145965576172, -0.050846099853515625, -0.04900074005126953, -0.04715538024902344, -0.045310020446777344, -0.04346466064453125, -0.041619300842285156, -0.03977394104003906, -0.03792858123779297, -0.036083221435546875, -0.03423786163330078, -0.03239250183105469, -0.030547142028808594, -0.0287017822265625, -0.026856422424316406, -0.025011062622070312, -0.02316570281982422, -0.021320343017578125, -0.01947498321533203, -0.017629623413085938, -0.015784263610839844, -0.01393890380859375, -0.012093544006347656, -0.010248184204101562, -0.008402824401855469, -0.006557464599609375, -0.004712104797363281, -0.0028667449951171875, -0.0010213851928710938, 0.000823974609375, 0.0026693344116210938, 0.0045146942138671875, 0.006360054016113281, 0.008205413818359375, 0.010050773620605469, 0.011896133422851562, 0.013741493225097656, 0.01558685302734375, 0.017432212829589844, 0.019277572631835938, 0.02112293243408203, 0.022968292236328125, 0.02481365203857422, 0.026659011840820312, 0.028504371643066406, 0.0303497314453125, 0.032195091247558594, 0.03404045104980469, 0.03588581085205078, 0.037731170654296875, 0.03957653045654297, 0.04142189025878906, 0.043267250061035156, 0.04511260986328125, 0.046957969665527344, 0.04880332946777344, 0.05064868927001953, 0.052494049072265625, 0.05433940887451172, 0.05618476867675781, 0.058030128479003906, 0.05987548828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 7.0, 7.0, 20.0, 21.0, 50.0, 93.0, 147.0, 183.0, 181.0, 120.0, 76.0, 48.0, 19.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2651619911193848, -1.2298510074615479, -1.194540023803711, -1.1592289209365845, -1.1239179372787476, -1.0886069536209106, -1.0532959699630737, -1.0179849863052368, -0.9826739430427551, -0.9473629593849182, -0.9120519161224365, -0.8767409324645996, -0.8414299488067627, -0.806118905544281, -0.7708079218864441, -0.7354968786239624, -0.7001858949661255, -0.6648749113082886, -0.6295638680458069, -0.59425288438797, -0.5589418411254883, -0.5236308574676514, -0.48831987380981445, -0.45300886034965515, -0.41769784688949585, -0.38238683342933655, -0.34707581996917725, -0.31176483631134033, -0.27645382285118103, -0.24114280939102173, -0.20583181083202362, -0.1705208122730255, -0.13520967960357666, -0.09989867359399796, -0.06458766758441925, -0.029276661574840546, 0.006034344434738159, 0.04134535789489746, 0.07665635645389557, 0.11196735501289368, 0.14727836847305298, 0.18258938193321228, 0.2179003804922104, 0.2532113790512085, 0.2885223925113678, 0.3238334059715271, 0.359144389629364, 0.3944554030895233, 0.4297664165496826, 0.4650774300098419, 0.5003884434700012, 0.5356994271278381, 0.5710104703903198, 0.6063214540481567, 0.6416324377059937, 0.6769434213638306, 0.7122544646263123, 0.7475654482841492, 0.7828764915466309, 0.8181874752044678, 0.8534984588623047, 0.8888095021247864, 0.9241204857826233, 0.959431529045105, 0.9947425127029419]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 18.0, 16.0, 13.0, 21.0, 23.0, 17.0, 28.0, 34.0, 39.0, 28.0, 30.0, 42.0, 54.0, 49.0, 50.0, 51.0, 39.0, 44.0, 43.0, 46.0, 34.0, 33.0, 37.0, 26.0, 30.0, 31.0, 19.0, 12.0, 10.0, 5.0, 13.0, 6.0, 6.0, 3.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4245501756668091, -0.4117284119129181, -0.3989066481590271, -0.3860848844051361, -0.3732631206512451, -0.36044132709503174, -0.34761959314346313, -0.33479779958724976, -0.32197603583335876, -0.3091542720794678, -0.2963325083255768, -0.2835107445716858, -0.2706889808177948, -0.2578672170639038, -0.24504543840885162, -0.23222365975379944, -0.21940191090106964, -0.20658014714717865, -0.19375838339328766, -0.18093660473823547, -0.16811484098434448, -0.1552930772304535, -0.1424713134765625, -0.1296495497226715, -0.11682777851819992, -0.10400601476430893, -0.09118424355983734, -0.07836247980594635, -0.06554071605205536, -0.05271894484758377, -0.03989718109369278, -0.02707540988922119, -0.0142536461353302, -0.0014318795874714851, 0.01138988696038723, 0.02421165257692337, 0.03703342005610466, 0.04985518753528595, 0.06267695128917694, 0.07549872249364853, 0.08832048624753952, 0.10114225000143051, 0.1139640212059021, 0.1267857849597931, 0.13960754871368408, 0.15242931246757507, 0.16525107622146606, 0.17807285487651825, 0.19089461863040924, 0.20371638238430023, 0.21653814613819122, 0.2293599247932434, 0.2421816885471344, 0.2550034523010254, 0.2678252160549164, 0.2806469798088074, 0.29346874356269836, 0.30629050731658936, 0.31911227107048035, 0.33193403482437134, 0.34475579857826233, 0.3575775623321533, 0.3703993558883667, 0.3832211196422577, 0.3960428833961487]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 9.0, 8.0, 12.0, 18.0, 20.0, 35.0, 46.0, 82.0, 113.0, 201.0, 429.0, 769.0, 1888.0, 4982.0, 14796.0, 53477.0, 278045.0, 2130372.0, 1470252.0, 179908.0, 39383.0, 11815.0, 4182.0, 1618.0, 788.0, 377.0, 210.0, 158.0, 64.0, 38.0, 62.0, 29.0, 20.0, 19.0, 12.0, 6.0, 9.0, 6.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1522216796875, -0.1472930908203125, -0.142364501953125, -0.1374359130859375, -0.13250732421875, -0.1275787353515625, -0.122650146484375, -0.1177215576171875, -0.11279296875, -0.1078643798828125, -0.102935791015625, -0.0980072021484375, -0.09307861328125, -0.0881500244140625, -0.083221435546875, -0.0782928466796875, -0.0733642578125, -0.0684356689453125, -0.063507080078125, -0.0585784912109375, -0.05364990234375, -0.0487213134765625, -0.043792724609375, -0.0388641357421875, -0.033935546875, -0.0290069580078125, -0.024078369140625, -0.0191497802734375, -0.01422119140625, -0.0092926025390625, -0.004364013671875, 0.0005645751953125, 0.0054931640625, 0.0104217529296875, 0.015350341796875, 0.0202789306640625, 0.02520751953125, 0.0301361083984375, 0.035064697265625, 0.0399932861328125, 0.044921875, 0.0498504638671875, 0.054779052734375, 0.0597076416015625, 0.06463623046875, 0.0695648193359375, 0.074493408203125, 0.0794219970703125, 0.0843505859375, 0.0892791748046875, 0.094207763671875, 0.0991363525390625, 0.10406494140625, 0.1089935302734375, 0.113922119140625, 0.1188507080078125, 0.123779296875, 0.1287078857421875, 0.133636474609375, 0.1385650634765625, 0.14349365234375, 0.1484222412109375, 0.153350830078125, 0.1582794189453125, 0.1632080078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 12.0, 8.0, 15.0, 25.0, 26.0, 35.0, 46.0, 55.0, 49.0, 63.0, 73.0, 56.0, 76.0, 72.0, 76.0, 78.0, 64.0, 46.0, 31.0, 31.0, 23.0, 14.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06396484375, -0.061908721923828125, -0.05985260009765625, -0.057796478271484375, -0.0557403564453125, -0.053684234619140625, -0.05162811279296875, -0.049571990966796875, -0.047515869140625, -0.045459747314453125, -0.04340362548828125, -0.041347503662109375, -0.0392913818359375, -0.037235260009765625, -0.03517913818359375, -0.033123016357421875, -0.03106689453125, -0.029010772705078125, -0.02695465087890625, -0.024898529052734375, -0.0228424072265625, -0.020786285400390625, -0.01873016357421875, -0.016674041748046875, -0.014617919921875, -0.012561798095703125, -0.01050567626953125, -0.008449554443359375, -0.0063934326171875, -0.004337310791015625, -0.00228118896484375, -0.000225067138671875, 0.0018310546875, 0.003887176513671875, 0.00594329833984375, 0.007999420166015625, 0.0100555419921875, 0.012111663818359375, 0.01416778564453125, 0.016223907470703125, 0.018280029296875, 0.020336151123046875, 0.02239227294921875, 0.024448394775390625, 0.0265045166015625, 0.028560638427734375, 0.03061676025390625, 0.032672882080078125, 0.03472900390625, 0.036785125732421875, 0.03884124755859375, 0.040897369384765625, 0.0429534912109375, 0.045009613037109375, 0.04706573486328125, 0.049121856689453125, 0.051177978515625, 0.053234100341796875, 0.05529022216796875, 0.057346343994140625, 0.0594024658203125, 0.061458587646484375, 0.06351470947265625, 0.06557083129882812, 0.067626953125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 17.0, 33.0, 55.0, 101.0, 222.0, 439.0, 1011.0, 3162.0, 14009.0, 173742.0, 3778692.0, 202458.0, 14990.0, 3275.0, 1210.0, 422.0, 203.0, 101.0, 48.0, 29.0, 18.0, 12.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3075752258300781, -0.29679107666015625, -0.2860069274902344, -0.2752227783203125, -0.2644386291503906, -0.25365447998046875, -0.24287033081054688, -0.232086181640625, -0.22130203247070312, -0.21051788330078125, -0.19973373413085938, -0.1889495849609375, -0.17816543579101562, -0.16738128662109375, -0.15659713745117188, -0.14581298828125, -0.13502883911132812, -0.12424468994140625, -0.11346054077148438, -0.1026763916015625, -0.09189224243164062, -0.08110809326171875, -0.07032394409179688, -0.059539794921875, -0.048755645751953125, -0.03797149658203125, -0.027187347412109375, -0.0164031982421875, -0.005619049072265625, 0.00516510009765625, 0.015949249267578125, 0.0267333984375, 0.037517547607421875, 0.04830169677734375, 0.059085845947265625, 0.0698699951171875, 0.08065414428710938, 0.09143829345703125, 0.10222244262695312, 0.113006591796875, 0.12379074096679688, 0.13457489013671875, 0.14535903930664062, 0.1561431884765625, 0.16692733764648438, 0.17771148681640625, 0.18849563598632812, 0.19927978515625, 0.21006393432617188, 0.22084808349609375, 0.23163223266601562, 0.2424163818359375, 0.2532005310058594, 0.26398468017578125, 0.2747688293457031, 0.285552978515625, 0.2963371276855469, 0.30712127685546875, 0.3179054260253906, 0.3286895751953125, 0.3394737243652344, 0.35025787353515625, 0.3610420227050781, 0.371826171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 4.0, 8.0, 18.0, 24.0, 35.0, 38.0, 62.0, 137.0, 181.0, 311.0, 433.0, 599.0, 663.0, 546.0, 342.0, 231.0, 149.0, 91.0, 69.0, 37.0, 26.0, 20.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2386474609375, -0.23171043395996094, -0.22477340698242188, -0.2178363800048828, -0.21089935302734375, -0.2039623260498047, -0.19702529907226562, -0.19008827209472656, -0.1831512451171875, -0.17621421813964844, -0.16927719116210938, -0.1623401641845703, -0.15540313720703125, -0.1484661102294922, -0.14152908325195312, -0.13459205627441406, -0.127655029296875, -0.12071800231933594, -0.11378097534179688, -0.10684394836425781, -0.09990692138671875, -0.09296989440917969, -0.08603286743164062, -0.07909584045410156, -0.0721588134765625, -0.06522178649902344, -0.058284759521484375, -0.05134773254394531, -0.04441070556640625, -0.03747367858886719, -0.030536651611328125, -0.023599624633789062, -0.01666259765625, -0.009725570678710938, -0.002788543701171875, 0.0041484832763671875, 0.01108551025390625, 0.018022537231445312, 0.024959564208984375, 0.03189659118652344, 0.0388336181640625, 0.04577064514160156, 0.052707672119140625, 0.05964469909667969, 0.06658172607421875, 0.07351875305175781, 0.08045578002929688, 0.08739280700683594, 0.094329833984375, 0.10126686096191406, 0.10820388793945312, 0.11514091491699219, 0.12207794189453125, 0.1290149688720703, 0.13595199584960938, 0.14288902282714844, 0.1498260498046875, 0.15676307678222656, 0.16370010375976562, 0.1706371307373047, 0.17757415771484375, 0.1845111846923828, 0.19144821166992188, 0.19838523864746094, 0.205322265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 9.0, 28.0, 32.0, 133.0, 273.0, 301.0, 120.0, 49.0, 21.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44143009185791, -4.249141693115234, -4.056853294372559, -3.8645644187927246, -3.672276020050049, -3.479987621307373, -3.287698984146118, -3.0954103469848633, -2.9031219482421875, -2.7108335494995117, -2.518544912338257, -2.326256275177002, -2.133967876434326, -1.9416793584823608, -1.7493908405303955, -1.5571023225784302, -1.3648138046264648, -1.1725252866744995, -0.9802367687225342, -0.7879482507705688, -0.5956597328186035, -0.4033712148666382, -0.21108269691467285, -0.01879417896270752, 0.1734943389892578, 0.36578285694122314, 0.5580713748931885, 0.7503598928451538, 0.9426484107971191, 1.1349369287490845, 1.3272254467010498, 1.5195139646530151, 1.7118024826049805, 1.9040910005569458, 2.096379518508911, 2.288668155670166, 2.480956554412842, 2.6732449531555176, 2.8655335903167725, 3.0578222274780273, 3.250110626220703, 3.442399024963379, 3.634687662124634, 3.8269762992858887, 4.0192646980285645, 4.21155309677124, 4.403841972351074, 4.59613037109375, 4.788418769836426, 4.980707168579102, 5.172995567321777, 5.365284442901611, 5.557572841644287, 5.749861240386963, 5.942150115966797, 6.134438514709473, 6.326726913452148, 6.519015312194824, 6.7113037109375, 6.903592586517334, 7.09588098526001, 7.2881693840026855, 7.4804582595825195, 7.672746658325195, 7.865035057067871]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 14.0, 14.0, 22.0, 33.0, 31.0, 42.0, 52.0, 68.0, 70.0, 71.0, 74.0, 83.0, 70.0, 66.0, 55.0, 49.0, 44.0, 29.0, 27.0, 17.0, 17.0, 11.0, 6.0, 5.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6712656021118164, -1.6157715320587158, -1.5602774620056152, -1.5047833919525146, -1.449289321899414, -1.3937952518463135, -1.338301181793213, -1.2828071117401123, -1.2273130416870117, -1.1718189716339111, -1.1163249015808105, -1.06083083152771, -1.0053367614746094, -0.9498426914215088, -0.8943486213684082, -0.8388545513153076, -0.783360481262207, -0.7278664112091064, -0.6723723411560059, -0.6168782711029053, -0.5613842010498047, -0.5058901309967041, -0.4503960609436035, -0.39490199089050293, -0.33940792083740234, -0.28391385078430176, -0.22841978073120117, -0.17292571067810059, -0.117431640625, -0.061937570571899414, -0.006443500518798828, 0.04905056953430176, 0.10454463958740234, 0.16003870964050293, 0.21553277969360352, 0.2710268497467041, 0.3265209197998047, 0.3820149898529053, 0.43750905990600586, 0.49300312995910645, 0.548497200012207, 0.6039912700653076, 0.6594853401184082, 0.7149794101715088, 0.7704734802246094, 0.82596755027771, 0.8814616203308105, 0.9369556903839111, 0.9924497604370117, 1.0479438304901123, 1.103437900543213, 1.1589319705963135, 1.214426040649414, 1.2699201107025146, 1.3254141807556152, 1.3809082508087158, 1.4364023208618164, 1.491896390914917, 1.5473904609680176, 1.6028845310211182, 1.6583786010742188, 1.7138726711273193, 1.76936674118042, 1.8248608112335205, 1.880354881286621]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 11.0, 12.0, 17.0, 27.0, 30.0, 41.0, 67.0, 97.0, 167.0, 226.0, 394.0, 696.0, 1232.0, 2262.0, 5014.0, 11881.0, 32827.0, 116354.0, 413395.0, 332257.0, 87123.0, 25909.0, 9540.0, 4225.0, 2017.0, 1049.0, 584.0, 364.0, 237.0, 160.0, 96.0, 68.0, 41.0, 33.0, 20.0, 11.0, 12.0, 9.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.13869857788085938, -0.13420867919921875, -0.12971878051757812, -0.1252288818359375, -0.12073898315429688, -0.11624908447265625, -0.11175918579101562, -0.107269287109375, -0.10277938842773438, -0.09828948974609375, -0.09379959106445312, -0.0893096923828125, -0.08481979370117188, -0.08032989501953125, -0.07583999633789062, -0.07135009765625, -0.06686019897460938, -0.06237030029296875, -0.057880401611328125, -0.0533905029296875, -0.048900604248046875, -0.04441070556640625, -0.039920806884765625, -0.035430908203125, -0.030941009521484375, -0.02645111083984375, -0.021961212158203125, -0.0174713134765625, -0.012981414794921875, -0.00849151611328125, -0.004001617431640625, 0.00048828125, 0.004978179931640625, 0.00946807861328125, 0.013957977294921875, 0.0184478759765625, 0.022937774658203125, 0.02742767333984375, 0.031917572021484375, 0.036407470703125, 0.040897369384765625, 0.04538726806640625, 0.049877166748046875, 0.0543670654296875, 0.058856964111328125, 0.06334686279296875, 0.06783676147460938, 0.07232666015625, 0.07681655883789062, 0.08130645751953125, 0.08579635620117188, 0.0902862548828125, 0.09477615356445312, 0.09926605224609375, 0.10375595092773438, 0.108245849609375, 0.11273574829101562, 0.11722564697265625, 0.12171554565429688, 0.1262054443359375, 0.13069534301757812, 0.13518524169921875, 0.13967514038085938, 0.1441650390625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 14.0, 20.0, 33.0, 30.0, 41.0, 61.0, 65.0, 76.0, 85.0, 91.0, 79.0, 85.0, 76.0, 51.0, 42.0, 29.0, 22.0, 22.0, 15.0, 12.0, 9.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13518524169921875, -0.1304779052734375, -0.12577056884765625, -0.121063232421875, -0.11635589599609375, -0.1116485595703125, -0.10694122314453125, -0.10223388671875, -0.09752655029296875, -0.0928192138671875, -0.08811187744140625, -0.083404541015625, -0.07869720458984375, -0.0739898681640625, -0.06928253173828125, -0.0645751953125, -0.05986785888671875, -0.0551605224609375, -0.05045318603515625, -0.045745849609375, -0.04103851318359375, -0.0363311767578125, -0.03162384033203125, -0.02691650390625, -0.02220916748046875, -0.0175018310546875, -0.01279449462890625, -0.008087158203125, -0.00337982177734375, 0.0013275146484375, 0.00603485107421875, 0.0107421875, 0.01544952392578125, 0.0201568603515625, 0.02486419677734375, 0.029571533203125, 0.03427886962890625, 0.0389862060546875, 0.04369354248046875, 0.04840087890625, 0.05310821533203125, 0.0578155517578125, 0.06252288818359375, 0.067230224609375, 0.07193756103515625, 0.0766448974609375, 0.08135223388671875, 0.0860595703125, 0.09076690673828125, 0.0954742431640625, 0.10018157958984375, 0.104888916015625, 0.10959625244140625, 0.1143035888671875, 0.11901092529296875, 0.12371826171875, 0.12842559814453125, 0.1331329345703125, 0.13784027099609375, 0.142547607421875, 0.14725494384765625, 0.1519622802734375, 0.15666961669921875, 0.161376953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 16.0, 13.0, 30.0, 42.0, 88.0, 162.0, 558.0, 1841.0, 9328.0, 121539.0, 870613.0, 37582.0, 4861.0, 1163.0, 370.0, 138.0, 82.0, 39.0, 26.0, 9.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.46343994140625, -0.4490966796875, -0.43475341796875, -0.42041015625, -0.40606689453125, -0.3917236328125, -0.37738037109375, -0.363037109375, -0.34869384765625, -0.3343505859375, -0.32000732421875, -0.3056640625, -0.29132080078125, -0.2769775390625, -0.26263427734375, -0.248291015625, -0.23394775390625, -0.2196044921875, -0.20526123046875, -0.19091796875, -0.17657470703125, -0.1622314453125, -0.14788818359375, -0.133544921875, -0.11920166015625, -0.1048583984375, -0.09051513671875, -0.076171875, -0.06182861328125, -0.0474853515625, -0.03314208984375, -0.018798828125, -0.00445556640625, 0.0098876953125, 0.02423095703125, 0.03857421875, 0.05291748046875, 0.0672607421875, 0.08160400390625, 0.095947265625, 0.11029052734375, 0.1246337890625, 0.13897705078125, 0.1533203125, 0.16766357421875, 0.1820068359375, 0.19635009765625, 0.210693359375, 0.22503662109375, 0.2393798828125, 0.25372314453125, 0.26806640625, 0.28240966796875, 0.2967529296875, 0.31109619140625, 0.325439453125, 0.33978271484375, 0.3541259765625, 0.36846923828125, 0.3828125, 0.39715576171875, 0.4114990234375, 0.42584228515625, 0.440185546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 10.0, 8.0, 9.0, 8.0, 16.0, 17.0, 28.0, 34.0, 67.0, 55.0, 74.0, 85.0, 108.0, 104.0, 82.0, 79.0, 61.0, 52.0, 33.0, 29.0, 16.0, 14.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6455078125, -0.6230010986328125, -0.600494384765625, -0.5779876708984375, -0.55548095703125, -0.5329742431640625, -0.510467529296875, -0.4879608154296875, -0.4654541015625, -0.4429473876953125, -0.420440673828125, -0.3979339599609375, -0.37542724609375, -0.3529205322265625, -0.330413818359375, -0.3079071044921875, -0.285400390625, -0.2628936767578125, -0.240386962890625, -0.2178802490234375, -0.19537353515625, -0.1728668212890625, -0.150360107421875, -0.1278533935546875, -0.1053466796875, -0.0828399658203125, -0.060333251953125, -0.0378265380859375, -0.01531982421875, 0.0071868896484375, 0.029693603515625, 0.0522003173828125, 0.07470703125, 0.0972137451171875, 0.119720458984375, 0.1422271728515625, 0.16473388671875, 0.1872406005859375, 0.209747314453125, 0.2322540283203125, 0.2547607421875, 0.2772674560546875, 0.299774169921875, 0.3222808837890625, 0.34478759765625, 0.3672943115234375, 0.389801025390625, 0.4123077392578125, 0.434814453125, 0.4573211669921875, 0.479827880859375, 0.5023345947265625, 0.52484130859375, 0.5473480224609375, 0.569854736328125, 0.5923614501953125, 0.6148681640625, 0.6373748779296875, 0.659881591796875, 0.6823883056640625, 0.70489501953125, 0.7274017333984375, 0.749908447265625, 0.7724151611328125, 0.794921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 20.0, 28.0, 46.0, 159.0, 1042.0, 96823.0, 948323.0, 1697.0, 243.0, 57.0, 40.0, 22.0, 15.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265625, -0.702423095703125, -0.67828369140625, -0.654144287109375, -0.6300048828125, -0.605865478515625, -0.58172607421875, -0.557586669921875, -0.533447265625, -0.509307861328125, -0.48516845703125, -0.461029052734375, -0.4368896484375, -0.412750244140625, -0.38861083984375, -0.364471435546875, -0.34033203125, -0.316192626953125, -0.29205322265625, -0.267913818359375, -0.2437744140625, -0.219635009765625, -0.19549560546875, -0.171356201171875, -0.147216796875, -0.123077392578125, -0.09893798828125, -0.074798583984375, -0.0506591796875, -0.026519775390625, -0.00238037109375, 0.021759033203125, 0.0458984375, 0.070037841796875, 0.09417724609375, 0.118316650390625, 0.1424560546875, 0.166595458984375, 0.19073486328125, 0.214874267578125, 0.239013671875, 0.263153076171875, 0.28729248046875, 0.311431884765625, 0.3355712890625, 0.359710693359375, 0.38385009765625, 0.407989501953125, 0.43212890625, 0.456268310546875, 0.48040771484375, 0.504547119140625, 0.5286865234375, 0.552825927734375, 0.57696533203125, 0.601104736328125, 0.625244140625, 0.649383544921875, 0.67352294921875, 0.697662353515625, 0.7218017578125, 0.745941162109375, 0.77008056640625, 0.794219970703125, 0.818359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 5.0, 2.0, 4.0, 9.0, 7.0, 11.0, 10.0, 15.0, 11.0, 14.0, 29.0, 32.0, 38.0, 54.0, 67.0, 105.0, 93.0, 102.0, 81.0, 62.0, 43.0, 23.0, 30.0, 20.0, 21.0, 13.0, 11.0, 11.0, 7.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7239322662353516e-05, -2.632010728120804e-05, -2.540089190006256e-05, -2.4481676518917084e-05, -2.3562461137771606e-05, -2.264324575662613e-05, -2.1724030375480652e-05, -2.0804814994335175e-05, -1.9885599613189697e-05, -1.896638423204422e-05, -1.8047168850898743e-05, -1.7127953469753265e-05, -1.6208738088607788e-05, -1.528952270746231e-05, -1.4370307326316833e-05, -1.3451091945171356e-05, -1.2531876564025879e-05, -1.1612661182880402e-05, -1.0693445801734924e-05, -9.774230420589447e-06, -8.85501503944397e-06, -7.935799658298492e-06, -7.016584277153015e-06, -6.097368896007538e-06, -5.1781535148620605e-06, -4.258938133716583e-06, -3.339722752571106e-06, -2.4205073714256287e-06, -1.5012919902801514e-06, -5.820766091346741e-07, 3.371387720108032e-07, 1.2563541531562805e-06, 2.175569534301758e-06, 3.094784915447235e-06, 4.014000296592712e-06, 4.93321567773819e-06, 5.852431058883667e-06, 6.771646440029144e-06, 7.690861821174622e-06, 8.610077202320099e-06, 9.529292583465576e-06, 1.0448507964611053e-05, 1.136772334575653e-05, 1.2286938726902008e-05, 1.3206154108047485e-05, 1.4125369489192963e-05, 1.504458487033844e-05, 1.5963800251483917e-05, 1.6883015632629395e-05, 1.7802231013774872e-05, 1.872144639492035e-05, 1.9640661776065826e-05, 2.0559877157211304e-05, 2.147909253835678e-05, 2.2398307919502258e-05, 2.3317523300647736e-05, 2.4236738681793213e-05, 2.515595406293869e-05, 2.6075169444084167e-05, 2.6994384825229645e-05, 2.7913600206375122e-05, 2.88328155875206e-05, 2.9752030968666077e-05, 3.0671246349811554e-05, 3.159046173095703e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 5.0, 10.0, 15.0, 22.0, 27.0, 35.0, 42.0, 57.0, 90.0, 144.0, 210.0, 401.0, 633.0, 1292.0, 3065.0, 11338.0, 85716.0, 833483.0, 93575.0, 12023.0, 3333.0, 1328.0, 685.0, 364.0, 223.0, 133.0, 82.0, 55.0, 40.0, 38.0, 19.0, 13.0, 11.0, 8.0, 11.0, 2.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12158203125, -0.11699676513671875, -0.1124114990234375, -0.10782623291015625, -0.103240966796875, -0.09865570068359375, -0.0940704345703125, -0.08948516845703125, -0.08489990234375, -0.08031463623046875, -0.0757293701171875, -0.07114410400390625, -0.066558837890625, -0.06197357177734375, -0.0573883056640625, -0.05280303955078125, -0.0482177734375, -0.04363250732421875, -0.0390472412109375, -0.03446197509765625, -0.029876708984375, -0.02529144287109375, -0.0207061767578125, -0.01612091064453125, -0.01153564453125, -0.00695037841796875, -0.0023651123046875, 0.00222015380859375, 0.006805419921875, 0.01139068603515625, 0.0159759521484375, 0.02056121826171875, 0.025146484375, 0.02973175048828125, 0.0343170166015625, 0.03890228271484375, 0.043487548828125, 0.04807281494140625, 0.0526580810546875, 0.05724334716796875, 0.06182861328125, 0.06641387939453125, 0.0709991455078125, 0.07558441162109375, 0.080169677734375, 0.08475494384765625, 0.0893402099609375, 0.09392547607421875, 0.0985107421875, 0.10309600830078125, 0.1076812744140625, 0.11226654052734375, 0.116851806640625, 0.12143707275390625, 0.1260223388671875, 0.13060760498046875, 0.13519287109375, 0.13977813720703125, 0.1443634033203125, 0.14894866943359375, 0.153533935546875, 0.15811920166015625, 0.1627044677734375, 0.16728973388671875, 0.171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 20.0, 38.0, 67.0, 90.0, 115.0, 164.0, 138.0, 101.0, 88.0, 56.0, 35.0, 18.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2166748046875, -0.2091503143310547, -0.20162582397460938, -0.19410133361816406, -0.18657684326171875, -0.17905235290527344, -0.17152786254882812, -0.1640033721923828, -0.1564788818359375, -0.1489543914794922, -0.14142990112304688, -0.13390541076660156, -0.12638092041015625, -0.11885643005371094, -0.11133193969726562, -0.10380744934082031, -0.096282958984375, -0.08875846862792969, -0.08123397827148438, -0.07370948791503906, -0.06618499755859375, -0.05866050720214844, -0.051136016845703125, -0.04361152648925781, -0.0360870361328125, -0.028562545776367188, -0.021038055419921875, -0.013513565063476562, -0.00598907470703125, 0.0015354156494140625, 0.009059906005859375, 0.016584396362304688, 0.02410888671875, 0.03163337707519531, 0.039157867431640625, 0.04668235778808594, 0.05420684814453125, 0.06173133850097656, 0.06925582885742188, 0.07678031921386719, 0.0843048095703125, 0.09182929992675781, 0.09935379028320312, 0.10687828063964844, 0.11440277099609375, 0.12192726135253906, 0.12945175170898438, 0.1369762420654297, 0.144500732421875, 0.1520252227783203, 0.15954971313476562, 0.16707420349121094, 0.17459869384765625, 0.18212318420410156, 0.18964767456054688, 0.1971721649169922, 0.2046966552734375, 0.2122211456298828, 0.21974563598632812, 0.22727012634277344, 0.23479461669921875, 0.24231910705566406, 0.24984359741210938, 0.2573680877685547, 0.264892578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 34.0, 72.0, 136.0, 246.0, 213.0, 116.0, 65.0, 27.0, 18.0, 8.0, 13.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.995100498199463, -4.8752851486206055, -4.75546932220459, -4.635653972625732, -4.515838146209717, -4.396022796630859, -4.276207447052002, -4.156391620635986, -4.036576271057129, -3.9167606830596924, -3.796945095062256, -3.6771297454833984, -3.557314157485962, -3.4374985694885254, -3.317682981491089, -3.1978673934936523, -3.078052043914795, -2.9582364559173584, -2.838420867919922, -2.7186055183410645, -2.598789930343628, -2.4789743423461914, -2.359158754348755, -2.2393431663513184, -2.119527578353882, -1.9997119903564453, -1.8798965215682983, -1.7600809335708618, -1.6402654647827148, -1.5204498767852783, -1.4006342887878418, -1.2808188199996948, -1.1610033512115479, -1.0411877632141113, -0.9213722944259644, -0.8015567064285278, -0.6817412376403809, -0.5619256496429443, -0.4421101212501526, -0.32229459285736084, -0.2024790644645691, -0.08266352862119675, 0.0371520072221756, 0.15696755051612854, 0.2767830789089203, 0.3965986371040344, 0.5164141654968262, 0.6362296938896179, 0.7560452222824097, 0.8758607506752014, 0.9956762790679932, 1.1154918670654297, 1.2353073358535767, 1.3551229238510132, 1.4749383926391602, 1.5947539806365967, 1.7145695686340332, 1.8343851566314697, 1.9542006254196167, 2.0740160942077637, 2.1938316822052, 2.3136472702026367, 2.4334628582000732, 2.5532784461975098, 2.673093795776367]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 9.0, 17.0, 26.0, 36.0, 52.0, 99.0, 121.0, 177.0, 149.0, 110.0, 74.0, 57.0, 23.0, 16.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.316988945007324, -6.176357746124268, -6.035726547241211, -5.895095348358154, -5.754464149475098, -5.613832473754883, -5.473201274871826, -5.3325700759887695, -5.191938877105713, -5.051307678222656, -4.9106764793396, -4.770045280456543, -4.629413604736328, -4.4887824058532715, -4.348151206970215, -4.207520008087158, -4.066888809204102, -3.926257610321045, -3.7856264114379883, -3.6449949741363525, -3.504363775253296, -3.3637325763702393, -3.2231011390686035, -3.082469940185547, -2.9418387413024902, -2.8012075424194336, -2.660576343536377, -2.519944906234741, -2.3793137073516846, -2.238682508468628, -2.098051071166992, -1.9574198722839355, -1.816789150238037, -1.6761579513549805, -1.5355266332626343, -1.394895315170288, -1.2542641162872314, -1.1136329174041748, -0.9730015993118286, -0.8323703408241272, -0.6917390823364258, -0.5511078238487244, -0.41047656536102295, -0.26984530687332153, -0.12921404838562012, 0.011417210102081299, 0.15204846858978271, 0.29267972707748413, 0.43331098556518555, 0.573942244052887, 0.7145735025405884, 0.8552047610282898, 0.9958360195159912, 1.1364672183990479, 1.277098536491394, 1.4177298545837402, 1.5583610534667969, 1.6989922523498535, 1.8396235704421997, 1.980254888534546, 2.1208860874176025, 2.261517286300659, 2.402148723602295, 2.5427799224853516, 2.683411121368408]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 10.0, 25.0, 28.0, 58.0, 180.0, 477.0, 86.0, 52.0, 38.0, 21.0, 10.0, 7.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.703125, -0.68853759765625, -0.6739501953125, -0.65936279296875, -0.644775390625, -0.63018798828125, -0.6156005859375, -0.60101318359375, -0.58642578125, -0.57183837890625, -0.5572509765625, -0.54266357421875, -0.528076171875, -0.51348876953125, -0.4989013671875, -0.48431396484375, -0.4697265625, -0.45513916015625, -0.4405517578125, -0.42596435546875, -0.411376953125, -0.39678955078125, -0.3822021484375, -0.36761474609375, -0.35302734375, -0.33843994140625, -0.3238525390625, -0.30926513671875, -0.294677734375, -0.28009033203125, -0.2655029296875, -0.25091552734375, -0.236328125, -0.22174072265625, -0.2071533203125, -0.19256591796875, -0.177978515625, -0.16339111328125, -0.1488037109375, -0.13421630859375, -0.11962890625, -0.10504150390625, -0.0904541015625, -0.07586669921875, -0.061279296875, -0.04669189453125, -0.0321044921875, -0.01751708984375, -0.0029296875, 0.01165771484375, 0.0262451171875, 0.04083251953125, 0.055419921875, 0.07000732421875, 0.0845947265625, 0.09918212890625, 0.11376953125, 0.12835693359375, 0.1429443359375, 0.15753173828125, 0.172119140625, 0.18670654296875, 0.2012939453125, 0.21588134765625, 0.23046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 4.0, 11.0, 6.0, 5.0, 14.0, 22.0, 11.0, 14.0, 28.0, 33.0, 50.0, 83.0, 132.0, 226.0, 408.0, 936.0, 2934.0, 17977.0, 8328513.0, 31257.0, 3892.0, 1133.0, 413.0, 178.0, 98.0, 46.0, 28.0, 21.0, 14.0, 15.0, 13.0, 11.0, 9.0, 11.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.0912374258041382, -1.0622166395187378, -1.0331958532333374, -1.004175066947937, -0.9751542210578918, -0.9461334347724915, -0.9171125888824463, -0.8880918025970459, -0.8590710163116455, -0.8300502300262451, -0.8010294437408447, -0.7720085978507996, -0.7429878115653992, -0.7139670252799988, -0.6849461793899536, -0.6559253931045532, -0.6269046068191528, -0.5978838205337524, -0.568863034248352, -0.5398421883583069, -0.5108214020729065, -0.4818006157875061, -0.4527797996997833, -0.42375898361206055, -0.39473819732666016, -0.36571741104125977, -0.336696594953537, -0.3076757788658142, -0.2786549925804138, -0.24963419139385223, -0.22061339020729065, -0.19159258902072906, -0.16257178783416748, -0.1335509866476059, -0.10453018546104431, -0.07550938427448273, -0.04648858308792114, -0.017467781901359558, 0.011553019285202026, 0.04057382047176361, 0.0695946216583252, 0.09861542284488678, 0.12763622403144836, 0.15665702521800995, 0.18567782640457153, 0.21469862759113312, 0.2437194287776947, 0.2727402448654175, 0.30176103115081787, 0.33078181743621826, 0.35980263352394104, 0.3888234496116638, 0.4178442358970642, 0.4468650221824646, 0.4758858382701874, 0.5049066543579102, 0.5339274406433105, 0.5629482269287109, 0.5919690132141113, 0.6209898591041565, 0.6500106453895569, 0.6790314316749573, 0.7080522775650024, 0.7370730638504028, 0.7660938501358032]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.9121706485748291, -0.8577847480773926, -0.803398847579956, -0.7490128874778748, -0.6946269869804382, -0.6402410864830017, -0.5858551263809204, -0.5314692258834839, -0.47708332538604736, -0.42269742488861084, -0.36831149458885193, -0.313925564289093, -0.2595396637916565, -0.20515376329421997, -0.15076783299446106, -0.09638190269470215, -0.041996002197265625, 0.012389913201332092, 0.06677582859992981, 0.12116174399852753, 0.17554765939712524, 0.22993355989456177, 0.2843194901943207, 0.3387054204940796, 0.3930913209915161, 0.44747722148895264, 0.5018631219863892, 0.5562490820884705, 0.610634982585907, 0.6650208830833435, 0.7194068431854248, 0.7737927436828613, 0.8281786441802979, 0.8825645446777344, 0.9369504451751709, 0.9913364052772522, 1.045722246170044, 1.1001081466674805, 1.1544941663742065, 1.208880066871643, 1.2632659673690796, 1.3176518678665161, 1.3720377683639526, 1.4264236688613892, 1.4808096885681152, 1.5351955890655518, 1.5895814895629883, 1.6439673900604248, 1.6983532905578613, 1.7527391910552979, 1.8071250915527344, 1.861510992050171, 1.9158968925476074, 1.970282793045044, 2.0246686935424805, 2.079054832458496, 2.1334404945373535, 2.18782639503479, 2.2422122955322266, 2.296598196029663, 2.3509840965270996, 2.405369997024536, 2.4597558975219727, 2.5141420364379883, 2.568527936935425]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 24.0, 29.0, 33.0, 58.0, 76.0, 87.0, 98.0, 119.0, 97.0, 91.0, 72.0, 53.0, 38.0, 29.0, 21.0, 12.0, 10.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.1303853988647461, -0.1272258758544922, -0.12406635284423828, -0.12090682983398438, -0.11774730682373047, -0.11458778381347656, -0.11142826080322266, -0.10826873779296875, -0.10510921478271484, -0.10194969177246094, -0.09879016876220703, -0.09563064575195312, -0.09247112274169922, -0.08931159973144531, -0.0861520767211914, -0.0829925537109375, -0.0798330307006836, -0.07667350769042969, -0.07351398468017578, -0.07035446166992188, -0.06719493865966797, -0.06403541564941406, -0.060875892639160156, -0.05771636962890625, -0.054556846618652344, -0.05139732360839844, -0.04823780059814453, -0.045078277587890625, -0.04191875457763672, -0.03875923156738281, -0.035599708557128906, -0.032440185546875, -0.029280662536621094, -0.026121139526367188, -0.02296161651611328, -0.019802093505859375, -0.01664257049560547, -0.013483047485351562, -0.010323524475097656, -0.00716400146484375, -0.004004478454589844, -0.0008449554443359375, 0.0023145675659179688, 0.005474090576171875, 0.008633613586425781, 0.011793136596679688, 0.014952659606933594, 0.0181121826171875, 0.021271705627441406, 0.024431228637695312, 0.02759075164794922, 0.030750274658203125, 0.03390979766845703, 0.03706932067871094, 0.040228843688964844, 0.04338836669921875, 0.046547889709472656, 0.04970741271972656, 0.05286693572998047, 0.056026458740234375, 0.05918598175048828, 0.06234550476074219, 0.0655050277709961, 0.06866455078125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 11.0, 12.0, 12.0, 17.0, 24.0, 30.0, 43.0, 71.0, 91.0, 144.0, 191.0, 306.0, 481.0, 843.0, 1673.0, 3264.0, 7042.0, 17922.0, 53677.0, 199075.0, 167342.0, 44458.0, 15183.0, 5990.0, 2810.0, 1457.0, 780.0, 440.0, 302.0, 185.0, 105.0, 92.0, 49.0, 38.0, 35.0, 22.0, 11.0, 5.0, 11.0, 4.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0186920166015625, -0.984649658203125, -0.9506072998046875, -0.91656494140625, -0.8825225830078125, -0.848480224609375, -0.8144378662109375, -0.7803955078125, -0.7463531494140625, -0.712310791015625, -0.6782684326171875, -0.64422607421875, -0.6101837158203125, -0.576141357421875, -0.5420989990234375, -0.508056640625, -0.4740142822265625, -0.439971923828125, -0.4059295654296875, -0.37188720703125, -0.3378448486328125, -0.303802490234375, -0.2697601318359375, -0.2357177734375, -0.2016754150390625, -0.167633056640625, -0.1335906982421875, -0.09954833984375, -0.0655059814453125, -0.031463623046875, 0.0025787353515625, 0.03662109375, 0.0706634521484375, 0.104705810546875, 0.1387481689453125, 0.17279052734375, 0.2068328857421875, 0.240875244140625, 0.2749176025390625, 0.3089599609375, 0.3430023193359375, 0.377044677734375, 0.4110870361328125, 0.44512939453125, 0.4791717529296875, 0.513214111328125, 0.5472564697265625, 0.581298828125, 0.6153411865234375, 0.649383544921875, 0.6834259033203125, 0.71746826171875, 0.7515106201171875, 0.785552978515625, 0.8195953369140625, 0.8536376953125, 0.8876800537109375, 0.921722412109375, 0.9557647705078125, 0.98980712890625, 1.0238494873046875, 1.057891845703125, 1.0919342041015625, 1.1259765625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 21.0, 21.0, 35.0, 42.0, 60.0, 57.0, 84.0, 105.0, 88.0, 95.0, 80.0, 66.0, 60.0, 35.0, 30.0, 18.0, 17.0, 16.0, 15.0, 5.0, 5.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1961669921875, -0.18860435485839844, -0.18104171752929688, -0.1734790802001953, -0.16591644287109375, -0.1583538055419922, -0.15079116821289062, -0.14322853088378906, -0.1356658935546875, -0.12810325622558594, -0.12054061889648438, -0.11297798156738281, -0.10541534423828125, -0.09785270690917969, -0.09029006958007812, -0.08272743225097656, -0.075164794921875, -0.06760215759277344, -0.060039520263671875, -0.05247688293457031, -0.04491424560546875, -0.03735160827636719, -0.029788970947265625, -0.022226333618164062, -0.0146636962890625, -0.0071010589599609375, 0.000461578369140625, 0.008024215698242188, 0.01558685302734375, 0.023149490356445312, 0.030712127685546875, 0.03827476501464844, 0.04583740234375, 0.05340003967285156, 0.060962677001953125, 0.06852531433105469, 0.07608795166015625, 0.08365058898925781, 0.09121322631835938, 0.09877586364746094, 0.1063385009765625, 0.11390113830566406, 0.12146377563476562, 0.1290264129638672, 0.13658905029296875, 0.1441516876220703, 0.15171432495117188, 0.15927696228027344, 0.166839599609375, 0.17440223693847656, 0.18196487426757812, 0.1895275115966797, 0.19709014892578125, 0.2046527862548828, 0.21221542358398438, 0.21977806091308594, 0.2273406982421875, 0.23490333557128906, 0.24246597290039062, 0.2500286102294922, 0.25759124755859375, 0.2651538848876953, 0.2727165222167969, 0.28027915954589844, 0.287841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 8.0, 11.0, 9.0, 23.0, 21.0, 31.0, 40.0, 45.0, 48.0, 44.0, 39.0, 37.0, 34.0, 23.0, 12.0, 19.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6611654758453369, -0.6370133757591248, -0.6128613352775574, -0.5887092351913452, -0.5645571947097778, -0.5404050946235657, -0.5162529945373535, -0.49210095405578613, -0.46794888377189636, -0.4437968134880066, -0.4196447432041168, -0.39549267292022705, -0.3713405728340149, -0.3471885323524475, -0.32303643226623535, -0.2988843619823456, -0.2747322916984558, -0.25058022141456604, -0.22642815113067627, -0.2022760659456253, -0.17812399566173553, -0.15397192537784576, -0.1298198401927948, -0.10566776990890503, -0.08151569962501526, -0.05736362561583519, -0.03321155160665512, -0.009059473872184753, 0.015092596411705017, 0.03924466669559479, 0.06339675188064575, 0.08754882216453552, 0.11170083284378052, 0.1358529031276703, 0.16000497341156006, 0.18415705859661102, 0.2083091288805008, 0.23246119916439056, 0.25661328434944153, 0.2807653546333313, 0.30491742491722107, 0.32906949520111084, 0.3532215654850006, 0.3773736357688904, 0.40152573585510254, 0.4256777763366699, 0.4498298764228821, 0.47398194670677185, 0.4981340169906616, 0.5222861170768738, 0.5464381575584412, 0.5705902576446533, 0.5947422981262207, 0.6188943982124329, 0.643046498298645, 0.6671985387802124, 0.6913505792617798, 0.7155026793479919, 0.7396547198295593, 0.7638068199157715, 0.7879588603973389, 0.812110960483551, 0.8362630605697632, 0.8604151010513306, 0.8845672011375427]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 6.0, 12.0, 16.0, 10.0, 23.0, 27.0, 38.0, 35.0, 43.0, 39.0, 39.0, 31.0, 33.0, 23.0, 23.0, 16.0, 10.0, 13.0, 4.0, 5.0, 9.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6281315088272095, -1.5818910598754883, -1.535650610923767, -1.489410161972046, -1.4431697130203247, -1.3969292640686035, -1.3506886959075928, -1.3044483661651611, -1.2582077980041504, -1.2119673490524292, -1.165726900100708, -1.1194864511489868, -1.0732460021972656, -1.0270055532455444, -0.9807650446891785, -0.9345245957374573, -0.8882842063903809, -0.8420437574386597, -0.7958033084869385, -0.7495628595352173, -0.7033224105834961, -0.6570819616317749, -0.6108414530754089, -0.5646010041236877, -0.5183605551719666, -0.47212010622024536, -0.42587965726852417, -0.3796391785144806, -0.3333987295627594, -0.2871582806110382, -0.24091780185699463, -0.19467735290527344, -0.1484370231628418, -0.10219656676054001, -0.05595611035823822, -0.009715646505355835, 0.036524802446365356, 0.08276525139808655, 0.12900573015213013, 0.17524617910385132, 0.2214866280555725, 0.2677270770072937, 0.3139675259590149, 0.36020800471305847, 0.40644845366477966, 0.45268890261650085, 0.49892938137054443, 0.5451698303222656, 0.5914102792739868, 0.637650728225708, 0.6838911771774292, 0.7301316261291504, 0.7763720750808716, 0.8226125240325928, 0.8688530325889587, 0.9150934815406799, 0.9613339304924011, 1.007574439048767, 1.0538148880004883, 1.1000553369522095, 1.1462957859039307, 1.1925362348556519, 1.238776683807373, 1.2850171327590942, 1.3312575817108154]}, "eval/loss": 4.170206069946289, "eval/bleu": 2.2622740788922234e-13, "eval/runtime": 2580.4115, "eval/samples_per_second": 5.72, "eval/steps_per_second": 0.715} \ No newline at end of file