diff --git "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" --- "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" +++ "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 2.1087, "train/learning_rate": 2.5321100917431195e-06, "train/epoch": 2.78, "train/global_step": 4500, "_runtime": 64806, "_timestamp": 1651837074, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 9.0, 34.0, 94.0, 154.0, 239.0, 209.0, 147.0, 81.0, 30.0, 12.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8217853903770447, -0.729047417640686, -0.6363095045089722, -0.5435715317726135, -0.45083358883857727, -0.358095645904541, -0.2653576731681824, -0.1726197600364685, -0.07988178730010986, 0.012856163084506989, 0.10559411346912384, 0.1983320713043213, 0.29107001423835754, 0.3838079571723938, 0.47654592990875244, 0.5692838430404663, 0.662021815776825, 0.7547597885131836, 0.8474977016448975, 0.9402356743812561, 1.0329736471176147, 1.1257115602493286, 1.218449592590332, 1.311187505722046, 1.4039254188537598, 1.4966633319854736, 1.589401364326477, 1.682139277458191, 1.7748771905899048, 1.8676152229309082, 1.960353136062622, 2.053091049194336, 2.14582896232605, 2.2385668754577637, 2.3313047885894775, 2.4240427017211914, 2.5167808532714844, 2.6095187664031982, 2.702256679534912, 2.794994592666626, 2.88773250579834, 2.9804704189300537, 3.0732083320617676, 3.1659464836120605, 3.2586843967437744, 3.3514223098754883, 3.444160223007202, 3.536898136138916, 3.629636287689209, 3.722374200820923, 3.8151121139526367, 3.9078502655029297, 4.0005879402160645, 4.093326091766357, 4.186063766479492, 4.278801918029785, 4.37153959274292, 4.464277744293213, 4.557015419006348, 4.649753570556641, 4.742491245269775, 4.835229396820068, 4.927967071533203, 5.020705223083496, 5.113443374633789]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 9.0, 9.0, 2.0, 19.0, 9.0, 12.0, 19.0, 22.0, 27.0, 25.0, 26.0, 25.0, 38.0, 38.0, 44.0, 41.0, 46.0, 35.0, 30.0, 47.0, 42.0, 44.0, 53.0, 39.0, 39.0, 28.0, 24.0, 33.0, 25.0, 23.0, 23.0, 23.0, 14.0, 15.0, 9.0, 9.0, 8.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0925257205963135, -1.0581175088882446, -1.0237091779708862, -0.9893009066581726, -0.954892635345459, -0.9204844236373901, -0.8860761523246765, -0.8516678810119629, -0.8172596096992493, -0.7828513383865356, -0.748443067073822, -0.7140347957611084, -0.6796265840530396, -0.6452182531356812, -0.6108100414276123, -0.5764017701148987, -0.5419934988021851, -0.5075852274894714, -0.4731769561767578, -0.4387687146663666, -0.40436044335365295, -0.36995217204093933, -0.3355439305305481, -0.3011356592178345, -0.26672738790512085, -0.23231911659240723, -0.1979108601808548, -0.16350260376930237, -0.12909433245658875, -0.09468606114387512, -0.06027780473232269, -0.025869548320770264, 0.00853884220123291, 0.042947106063365936, 0.07735536992549896, 0.11176363378763199, 0.14617189764976501, 0.18058016896247864, 0.21498842537403107, 0.2493966817855835, 0.2838049530982971, 0.31821322441101074, 0.35262149572372437, 0.3870297372341156, 0.4214380085468292, 0.45584627985954285, 0.4902545213699341, 0.5246627926826477, 0.5590710639953613, 0.593479335308075, 0.6278876066207886, 0.6622958779335022, 0.6967041492462158, 0.7311123609542847, 0.7655206322669983, 0.7999289035797119, 0.8343371748924255, 0.8687454462051392, 0.9031537175178528, 0.9375619888305664, 0.9719702005386353, 1.0063785314559937, 1.0407867431640625, 1.075195074081421, 1.1096032857894897]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 10.0, 15.0, 18.0, 29.0, 35.0, 53.0, 67.0, 145.0, 215.0, 303.0, 548.0, 939.0, 1710.0, 3439.0, 7546.0, 18600.0, 48104.0, 124902.0, 318078.0, 695103.0, 1154959.0, 965323.0, 504647.0, 217527.0, 81714.0, 29320.0, 11114.0, 4692.0, 2238.0, 1179.0, 637.0, 393.0, 227.0, 148.0, 89.0, 63.0, 42.0, 28.0, 23.0, 18.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.37890625, -1.334075927734375, -1.28924560546875, -1.244415283203125, -1.1995849609375, -1.154754638671875, -1.10992431640625, -1.065093994140625, -1.020263671875, -0.975433349609375, -0.93060302734375, -0.885772705078125, -0.8409423828125, -0.796112060546875, -0.75128173828125, -0.706451416015625, -0.66162109375, -0.616790771484375, -0.57196044921875, -0.527130126953125, -0.4822998046875, -0.437469482421875, -0.39263916015625, -0.347808837890625, -0.302978515625, -0.258148193359375, -0.21331787109375, -0.168487548828125, -0.1236572265625, -0.078826904296875, -0.03399658203125, 0.010833740234375, 0.0556640625, 0.100494384765625, 0.14532470703125, 0.190155029296875, 0.2349853515625, 0.279815673828125, 0.32464599609375, 0.369476318359375, 0.414306640625, 0.459136962890625, 0.50396728515625, 0.548797607421875, 0.5936279296875, 0.638458251953125, 0.68328857421875, 0.728118896484375, 0.77294921875, 0.817779541015625, 0.86260986328125, 0.907440185546875, 0.9522705078125, 0.997100830078125, 1.04193115234375, 1.086761474609375, 1.131591796875, 1.176422119140625, 1.22125244140625, 1.266082763671875, 1.3109130859375, 1.355743408203125, 1.40057373046875, 1.445404052734375, 1.490234375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 11.0, 18.0, 16.0, 24.0, 13.0, 29.0, 28.0, 17.0, 24.0, 30.0, 35.0, 47.0, 48.0, 49.0, 45.0, 38.0, 42.0, 52.0, 33.0, 50.0, 38.0, 38.0, 39.0, 36.0, 24.0, 25.0, 26.0, 19.0, 25.0, 19.0, 12.0, 2.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.681640625, -1.6260528564453125, -1.570465087890625, -1.5148773193359375, -1.45928955078125, -1.4037017822265625, -1.348114013671875, -1.2925262451171875, -1.2369384765625, -1.1813507080078125, -1.125762939453125, -1.0701751708984375, -1.01458740234375, -0.9589996337890625, -0.903411865234375, -0.8478240966796875, -0.792236328125, -0.7366485595703125, -0.681060791015625, -0.6254730224609375, -0.56988525390625, -0.5142974853515625, -0.458709716796875, -0.4031219482421875, -0.3475341796875, -0.2919464111328125, -0.236358642578125, -0.1807708740234375, -0.12518310546875, -0.0695953369140625, -0.014007568359375, 0.0415802001953125, 0.09716796875, 0.1527557373046875, 0.208343505859375, 0.2639312744140625, 0.31951904296875, 0.3751068115234375, 0.430694580078125, 0.4862823486328125, 0.5418701171875, 0.5974578857421875, 0.653045654296875, 0.7086334228515625, 0.76422119140625, 0.8198089599609375, 0.875396728515625, 0.9309844970703125, 0.986572265625, 1.0421600341796875, 1.097747802734375, 1.1533355712890625, 1.20892333984375, 1.2645111083984375, 1.320098876953125, 1.3756866455078125, 1.4312744140625, 1.4868621826171875, 1.542449951171875, 1.5980377197265625, 1.65362548828125, 1.7092132568359375, 1.764801025390625, 1.8203887939453125, 1.8759765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 8.0, 7.0, 7.0, 9.0, 23.0, 25.0, 43.0, 42.0, 77.0, 97.0, 172.0, 236.0, 440.0, 1072.0, 61745.0, 4126660.0, 2103.0, 551.0, 345.0, 195.0, 120.0, 71.0, 59.0, 39.0, 22.0, 21.0, 23.0, 13.0, 15.0, 3.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.784423828125, -18.16259765625, -17.540771484375, -16.9189453125, -16.297119140625, -15.67529296875, -15.053466796875, -14.431640625, -13.809814453125, -13.18798828125, -12.566162109375, -11.9443359375, -11.322509765625, -10.70068359375, -10.078857421875, -9.45703125, -8.835205078125, -8.21337890625, -7.591552734375, -6.9697265625, -6.347900390625, -5.72607421875, -5.104248046875, -4.482421875, -3.860595703125, -3.23876953125, -2.616943359375, -1.9951171875, -1.373291015625, -0.75146484375, -0.129638671875, 0.4921875, 1.114013671875, 1.73583984375, 2.357666015625, 2.9794921875, 3.601318359375, 4.22314453125, 4.844970703125, 5.466796875, 6.088623046875, 6.71044921875, 7.332275390625, 7.9541015625, 8.575927734375, 9.19775390625, 9.819580078125, 10.44140625, 11.063232421875, 11.68505859375, 12.306884765625, 12.9287109375, 13.550537109375, 14.17236328125, 14.794189453125, 15.416015625, 16.037841796875, 16.65966796875, 17.281494140625, 17.9033203125, 18.525146484375, 19.14697265625, 19.768798828125, 20.390625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 9.0, 4.0, 10.0, 14.0, 22.0, 30.0, 34.0, 33.0, 52.0, 76.0, 127.0, 129.0, 228.0, 295.0, 403.0, 508.0, 550.0, 412.0, 295.0, 235.0, 160.0, 104.0, 82.0, 55.0, 44.0, 30.0, 32.0, 21.0, 11.0, 8.0, 13.0, 11.0, 3.0, 6.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6330032348632812, -0.6112213134765625, -0.5894393920898438, -0.567657470703125, -0.5458755493164062, -0.5240936279296875, -0.5023117065429688, -0.48052978515625, -0.45874786376953125, -0.4369659423828125, -0.41518402099609375, -0.393402099609375, -0.37162017822265625, -0.3498382568359375, -0.32805633544921875, -0.3062744140625, -0.28449249267578125, -0.2627105712890625, -0.24092864990234375, -0.219146728515625, -0.19736480712890625, -0.1755828857421875, -0.15380096435546875, -0.13201904296875, -0.11023712158203125, -0.0884552001953125, -0.06667327880859375, -0.044891357421875, -0.02310943603515625, -0.0013275146484375, 0.02045440673828125, 0.042236328125, 0.06401824951171875, 0.0858001708984375, 0.10758209228515625, 0.129364013671875, 0.15114593505859375, 0.1729278564453125, 0.19470977783203125, 0.21649169921875, 0.23827362060546875, 0.2600555419921875, 0.28183746337890625, 0.303619384765625, 0.32540130615234375, 0.3471832275390625, 0.36896514892578125, 0.3907470703125, 0.41252899169921875, 0.4343109130859375, 0.45609283447265625, 0.477874755859375, 0.49965667724609375, 0.5214385986328125, 0.5432205200195312, 0.56500244140625, 0.5867843627929688, 0.6085662841796875, 0.6303482055664062, 0.652130126953125, 0.6739120483398438, 0.6956939697265625, 0.7174758911132812, 0.7392578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 19.0, 17.0, 21.0, 26.0, 41.0, 46.0, 50.0, 58.0, 94.0, 95.0, 89.0, 94.0, 66.0, 54.0, 45.0, 39.0, 35.0, 24.0, 17.0, 17.0, 13.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6731536388397217, -2.592991590499878, -2.512829542160034, -2.4326672554016113, -2.3525052070617676, -2.272343158721924, -2.19218111038208, -2.1120190620422363, -2.0318570137023926, -1.9516949653625488, -1.8715327978134155, -1.7913707494735718, -1.711208701133728, -1.6310465335845947, -1.550884485244751, -1.4707224369049072, -1.390560269355774, -1.3103982210159302, -1.2302360534667969, -1.1500740051269531, -1.0699119567871094, -0.9897498488426208, -0.9095877408981323, -0.8294256925582886, -0.7492635846138, -0.6691014766693115, -0.5889394283294678, -0.5087773203849792, -0.4286152422428131, -0.348453164100647, -0.26829105615615845, -0.1881290078163147, -0.10796689987182617, -0.027804814279079437, 0.0523572713136673, 0.13251936435699463, 0.21268144249916077, 0.2928435206413269, 0.37300562858581543, 0.4531676769256592, 0.5333297848701477, 0.6134918928146362, 0.69365394115448, 0.7738160490989685, 0.853978157043457, 0.9341402053833008, 1.0143022537231445, 1.0944643020629883, 1.1746264696121216, 1.2547885179519653, 1.3349506855010986, 1.4151127338409424, 1.4952747821807861, 1.5754368305206299, 1.6555989980697632, 1.735761046409607, 1.8159232139587402, 1.896085262298584, 1.9762474298477173, 2.0564093589782715, 2.1365716457366943, 2.216733694076538, 2.296895742416382, 2.3770577907562256, 2.4572198390960693]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 0.0, 4.0, 8.0, 8.0, 6.0, 10.0, 14.0, 17.0, 20.0, 16.0, 25.0, 27.0, 27.0, 29.0, 31.0, 29.0, 35.0, 43.0, 47.0, 43.0, 42.0, 31.0, 53.0, 41.0, 30.0, 37.0, 32.0, 48.0, 30.0, 32.0, 35.0, 23.0, 28.0, 13.0, 23.0, 7.0, 13.0, 9.0, 4.0, 7.0, 3.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4387236833572388, -1.3873543739318848, -1.3359849452972412, -1.2846155166625977, -1.2332462072372437, -1.1818768978118896, -1.130507469177246, -1.0791380405426025, -1.0277687311172485, -0.9763993620872498, -0.925029993057251, -0.8736606240272522, -0.8222912549972534, -0.7709218859672546, -0.7195525169372559, -0.6681831479072571, -0.6168137788772583, -0.5654444098472595, -0.5140750408172607, -0.46270567178726196, -0.4113363027572632, -0.3599669337272644, -0.3085975646972656, -0.25722819566726685, -0.20585882663726807, -0.1544894576072693, -0.10312008857727051, -0.05175071954727173, -0.0003813505172729492, 0.05098801851272583, 0.10235738754272461, 0.1537267565727234, 0.20509624481201172, 0.2564656138420105, 0.3078349828720093, 0.35920435190200806, 0.41057372093200684, 0.4619430899620056, 0.5133124589920044, 0.5646818280220032, 0.616051197052002, 0.6674205660820007, 0.7187899351119995, 0.7701593041419983, 0.8215286731719971, 0.8728980422019958, 0.9242674112319946, 0.9756367802619934, 1.0270061492919922, 1.0783755779266357, 1.1297448873519897, 1.1811141967773438, 1.2324836254119873, 1.2838530540466309, 1.3352223634719849, 1.3865916728973389, 1.4379611015319824, 1.489330530166626, 1.54069983959198, 1.592069149017334, 1.6434385776519775, 1.694808006286621, 1.746177315711975, 1.797546625137329, 1.8489160537719727]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 17.0, 16.0, 25.0, 33.0, 44.0, 72.0, 127.0, 206.0, 300.0, 509.0, 731.0, 1249.0, 1955.0, 3265.0, 5578.0, 10015.0, 18648.0, 35958.0, 70655.0, 142496.0, 259405.0, 239750.0, 125016.0, 62475.0, 31764.0, 16750.0, 8809.0, 5047.0, 2851.0, 1772.0, 1092.0, 710.0, 411.0, 289.0, 205.0, 118.0, 62.0, 48.0, 25.0, 15.0, 10.0, 15.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.471923828125, -0.4550132751464844, -0.43810272216796875, -0.4211921691894531, -0.4042816162109375, -0.3873710632324219, -0.37046051025390625, -0.3535499572753906, -0.336639404296875, -0.3197288513183594, -0.30281829833984375, -0.2859077453613281, -0.2689971923828125, -0.2520866394042969, -0.23517608642578125, -0.21826553344726562, -0.20135498046875, -0.18444442749023438, -0.16753387451171875, -0.15062332153320312, -0.1337127685546875, -0.11680221557617188, -0.09989166259765625, -0.08298110961914062, -0.066070556640625, -0.049160003662109375, -0.03224945068359375, -0.015338897705078125, 0.0015716552734375, 0.018482208251953125, 0.03539276123046875, 0.052303314208984375, 0.0692138671875, 0.08612442016601562, 0.10303497314453125, 0.11994552612304688, 0.1368560791015625, 0.15376663208007812, 0.17067718505859375, 0.18758773803710938, 0.204498291015625, 0.22140884399414062, 0.23831939697265625, 0.2552299499511719, 0.2721405029296875, 0.2890510559082031, 0.30596160888671875, 0.3228721618652344, 0.33978271484375, 0.3566932678222656, 0.37360382080078125, 0.3905143737792969, 0.4074249267578125, 0.4243354797363281, 0.44124603271484375, 0.4581565856933594, 0.475067138671875, 0.4919776916503906, 0.5088882446289062, 0.5257987976074219, 0.5427093505859375, 0.5596199035644531, 0.5765304565429688, 0.5934410095214844, 0.6103515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 14.0, 2.0, 13.0, 9.0, 9.0, 16.0, 22.0, 32.0, 21.0, 35.0, 27.0, 29.0, 25.0, 29.0, 38.0, 36.0, 43.0, 48.0, 39.0, 38.0, 42.0, 49.0, 37.0, 41.0, 36.0, 25.0, 42.0, 23.0, 25.0, 17.0, 25.0, 15.0, 15.0, 9.0, 9.0, 7.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0], "bins": [-1.2109375, -1.1737518310546875, -1.136566162109375, -1.0993804931640625, -1.06219482421875, -1.0250091552734375, -0.987823486328125, -0.9506378173828125, -0.9134521484375, -0.8762664794921875, -0.839080810546875, -0.8018951416015625, -0.76470947265625, -0.7275238037109375, -0.690338134765625, -0.6531524658203125, -0.615966796875, -0.5787811279296875, -0.541595458984375, -0.5044097900390625, -0.46722412109375, -0.4300384521484375, -0.392852783203125, -0.3556671142578125, -0.3184814453125, -0.2812957763671875, -0.244110107421875, -0.2069244384765625, -0.16973876953125, -0.1325531005859375, -0.095367431640625, -0.0581817626953125, -0.02099609375, 0.0161895751953125, 0.053375244140625, 0.0905609130859375, 0.12774658203125, 0.1649322509765625, 0.202117919921875, 0.2393035888671875, 0.2764892578125, 0.3136749267578125, 0.350860595703125, 0.3880462646484375, 0.42523193359375, 0.4624176025390625, 0.499603271484375, 0.5367889404296875, 0.573974609375, 0.6111602783203125, 0.648345947265625, 0.6855316162109375, 0.72271728515625, 0.7599029541015625, 0.797088623046875, 0.8342742919921875, 0.8714599609375, 0.9086456298828125, 0.945831298828125, 0.9830169677734375, 1.02020263671875, 1.0573883056640625, 1.094573974609375, 1.1317596435546875, 1.1689453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 4.0, 13.0, 16.0, 31.0, 37.0, 50.0, 69.0, 97.0, 213.0, 285.0, 505.0, 905.0, 1959.0, 4144.0, 9575.0, 25353.0, 74726.0, 252957.0, 436301.0, 160774.0, 49404.0, 17503.0, 7080.0, 3159.0, 1459.0, 791.0, 430.0, 267.0, 159.0, 84.0, 55.0, 34.0, 30.0, 16.0, 15.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9814453125, -0.950103759765625, -0.91876220703125, -0.887420654296875, -0.8560791015625, -0.824737548828125, -0.79339599609375, -0.762054443359375, -0.730712890625, -0.699371337890625, -0.66802978515625, -0.636688232421875, -0.6053466796875, -0.574005126953125, -0.54266357421875, -0.511322021484375, -0.47998046875, -0.448638916015625, -0.41729736328125, -0.385955810546875, -0.3546142578125, -0.323272705078125, -0.29193115234375, -0.260589599609375, -0.229248046875, -0.197906494140625, -0.16656494140625, -0.135223388671875, -0.1038818359375, -0.072540283203125, -0.04119873046875, -0.009857177734375, 0.021484375, 0.052825927734375, 0.08416748046875, 0.115509033203125, 0.1468505859375, 0.178192138671875, 0.20953369140625, 0.240875244140625, 0.272216796875, 0.303558349609375, 0.33489990234375, 0.366241455078125, 0.3975830078125, 0.428924560546875, 0.46026611328125, 0.491607666015625, 0.52294921875, 0.554290771484375, 0.58563232421875, 0.616973876953125, 0.6483154296875, 0.679656982421875, 0.71099853515625, 0.742340087890625, 0.773681640625, 0.805023193359375, 0.83636474609375, 0.867706298828125, 0.8990478515625, 0.930389404296875, 0.96173095703125, 0.993072509765625, 1.0244140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 12.0, 13.0, 20.0, 25.0, 24.0, 28.0, 34.0, 43.0, 54.0, 38.0, 43.0, 50.0, 52.0, 47.0, 51.0, 44.0, 47.0, 46.0, 47.0, 43.0, 40.0, 25.0, 33.0, 26.0, 12.0, 15.0, 18.0, 16.0, 13.0, 3.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.673828125, -3.578887939453125, -3.48394775390625, -3.389007568359375, -3.2940673828125, -3.199127197265625, -3.10418701171875, -3.009246826171875, -2.914306640625, -2.819366455078125, -2.72442626953125, -2.629486083984375, -2.5345458984375, -2.439605712890625, -2.34466552734375, -2.249725341796875, -2.15478515625, -2.059844970703125, -1.96490478515625, -1.869964599609375, -1.7750244140625, -1.680084228515625, -1.58514404296875, -1.490203857421875, -1.395263671875, -1.300323486328125, -1.20538330078125, -1.110443115234375, -1.0155029296875, -0.920562744140625, -0.82562255859375, -0.730682373046875, -0.6357421875, -0.540802001953125, -0.44586181640625, -0.350921630859375, -0.2559814453125, -0.161041259765625, -0.06610107421875, 0.028839111328125, 0.123779296875, 0.218719482421875, 0.31365966796875, 0.408599853515625, 0.5035400390625, 0.598480224609375, 0.69342041015625, 0.788360595703125, 0.88330078125, 0.978240966796875, 1.07318115234375, 1.168121337890625, 1.2630615234375, 1.358001708984375, 1.45294189453125, 1.547882080078125, 1.642822265625, 1.737762451171875, 1.83270263671875, 1.927642822265625, 2.0225830078125, 2.117523193359375, 2.21246337890625, 2.307403564453125, 2.40234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 9.0, 16.0, 33.0, 33.0, 34.0, 51.0, 102.0, 149.0, 207.0, 311.0, 504.0, 808.0, 1340.0, 2283.0, 4178.0, 8639.0, 19248.0, 52689.0, 206021.0, 516008.0, 158288.0, 44057.0, 16669.0, 7646.0, 3885.0, 2122.0, 1158.0, 768.0, 425.0, 307.0, 168.0, 129.0, 76.0, 64.0, 48.0, 23.0, 17.0, 12.0, 8.0, 10.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.382080078125, -0.37029266357421875, -0.3585052490234375, -0.34671783447265625, -0.334930419921875, -0.32314300537109375, -0.3113555908203125, -0.29956817626953125, -0.28778076171875, -0.27599334716796875, -0.2642059326171875, -0.25241851806640625, -0.240631103515625, -0.22884368896484375, -0.2170562744140625, -0.20526885986328125, -0.1934814453125, -0.18169403076171875, -0.1699066162109375, -0.15811920166015625, -0.146331787109375, -0.13454437255859375, -0.1227569580078125, -0.11096954345703125, -0.09918212890625, -0.08739471435546875, -0.0756072998046875, -0.06381988525390625, -0.052032470703125, -0.04024505615234375, -0.0284576416015625, -0.01667022705078125, -0.0048828125, 0.00690460205078125, 0.0186920166015625, 0.03047943115234375, 0.042266845703125, 0.05405426025390625, 0.0658416748046875, 0.07762908935546875, 0.08941650390625, 0.10120391845703125, 0.1129913330078125, 0.12477874755859375, 0.136566162109375, 0.14835357666015625, 0.1601409912109375, 0.17192840576171875, 0.1837158203125, 0.19550323486328125, 0.2072906494140625, 0.21907806396484375, 0.230865478515625, 0.24265289306640625, 0.2544403076171875, 0.26622772216796875, 0.27801513671875, 0.28980255126953125, 0.3015899658203125, 0.31337738037109375, 0.325164794921875, 0.33695220947265625, 0.3487396240234375, 0.36052703857421875, 0.372314453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 14.0, 7.0, 20.0, 25.0, 52.0, 67.0, 141.0, 200.0, 185.0, 108.0, 62.0, 30.0, 24.0, 8.0, 10.0, 4.0, 4.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028824806213378906, -0.0002788752317428589, -0.0002695024013519287, -0.00026012957096099854, -0.00025075674057006836, -0.00024138391017913818, -0.000232011079788208, -0.00022263824939727783, -0.00021326541900634766, -0.00020389258861541748, -0.0001945197582244873, -0.00018514692783355713, -0.00017577409744262695, -0.00016640126705169678, -0.0001570284366607666, -0.00014765560626983643, -0.00013828277587890625, -0.00012890994548797607, -0.0001195371150970459, -0.00011016428470611572, -0.00010079145431518555, -9.141862392425537e-05, -8.20457935333252e-05, -7.267296314239502e-05, -6.330013275146484e-05, -5.392730236053467e-05, -4.455447196960449e-05, -3.5181641578674316e-05, -2.580881118774414e-05, -1.6435980796813965e-05, -7.063150405883789e-06, 2.3096799850463867e-06, 1.1682510375976562e-05, 2.1055340766906738e-05, 3.0428171157836914e-05, 3.980100154876709e-05, 4.9173831939697266e-05, 5.854666233062744e-05, 6.791949272155762e-05, 7.729232311248779e-05, 8.666515350341797e-05, 9.603798389434814e-05, 0.00010541081428527832, 0.0001147836446762085, 0.00012415647506713867, 0.00013352930545806885, 0.00014290213584899902, 0.0001522749662399292, 0.00016164779663085938, 0.00017102062702178955, 0.00018039345741271973, 0.0001897662878036499, 0.00019913911819458008, 0.00020851194858551025, 0.00021788477897644043, 0.0002272576093673706, 0.00023663043975830078, 0.00024600327014923096, 0.00025537610054016113, 0.0002647489309310913, 0.0002741217613220215, 0.00028349459171295166, 0.00029286742210388184, 0.000302240252494812, 0.0003116130828857422]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 9.0, 5.0, 11.0, 15.0, 15.0, 23.0, 27.0, 27.0, 42.0, 55.0, 86.0, 142.0, 385.0, 1614.0, 10400.0, 163638.0, 826780.0, 39564.0, 4281.0, 839.0, 244.0, 103.0, 56.0, 53.0, 34.0, 26.0, 22.0, 12.0, 9.0, 11.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2373046875, -1.2032012939453125, -1.169097900390625, -1.1349945068359375, -1.10089111328125, -1.0667877197265625, -1.032684326171875, -0.9985809326171875, -0.9644775390625, -0.9303741455078125, -0.896270751953125, -0.8621673583984375, -0.82806396484375, -0.7939605712890625, -0.759857177734375, -0.7257537841796875, -0.691650390625, -0.6575469970703125, -0.623443603515625, -0.5893402099609375, -0.55523681640625, -0.5211334228515625, -0.487030029296875, -0.4529266357421875, -0.4188232421875, -0.3847198486328125, -0.350616455078125, -0.3165130615234375, -0.28240966796875, -0.2483062744140625, -0.214202880859375, -0.1800994873046875, -0.14599609375, -0.1118927001953125, -0.077789306640625, -0.0436859130859375, -0.00958251953125, 0.0245208740234375, 0.058624267578125, 0.0927276611328125, 0.1268310546875, 0.1609344482421875, 0.195037841796875, 0.2291412353515625, 0.26324462890625, 0.2973480224609375, 0.331451416015625, 0.3655548095703125, 0.399658203125, 0.4337615966796875, 0.467864990234375, 0.5019683837890625, 0.53607177734375, 0.5701751708984375, 0.604278564453125, 0.6383819580078125, 0.6724853515625, 0.7065887451171875, 0.740692138671875, 0.7747955322265625, 0.80889892578125, 0.8430023193359375, 0.877105712890625, 0.9112091064453125, 0.9453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 11.0, 12.0, 10.0, 11.0, 13.0, 21.0, 30.0, 27.0, 42.0, 41.0, 92.0, 76.0, 93.0, 112.0, 77.0, 67.0, 60.0, 41.0, 30.0, 25.0, 13.0, 14.0, 18.0, 10.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1322021484375, -0.12841510772705078, -0.12462806701660156, -0.12084102630615234, -0.11705398559570312, -0.1132669448852539, -0.10947990417480469, -0.10569286346435547, -0.10190582275390625, -0.09811878204345703, -0.09433174133300781, -0.0905447006225586, -0.08675765991210938, -0.08297061920166016, -0.07918357849121094, -0.07539653778076172, -0.0716094970703125, -0.06782245635986328, -0.06403541564941406, -0.060248374938964844, -0.056461334228515625, -0.052674293518066406, -0.04888725280761719, -0.04510021209716797, -0.04131317138671875, -0.03752613067626953, -0.03373908996582031, -0.029952049255371094, -0.026165008544921875, -0.022377967834472656, -0.018590927124023438, -0.014803886413574219, -0.011016845703125, -0.007229804992675781, -0.0034427642822265625, 0.00034427642822265625, 0.004131317138671875, 0.007918357849121094, 0.011705398559570312, 0.015492439270019531, 0.01927947998046875, 0.02306652069091797, 0.026853561401367188, 0.030640602111816406, 0.034427642822265625, 0.038214683532714844, 0.04200172424316406, 0.04578876495361328, 0.0495758056640625, 0.05336284637451172, 0.05714988708496094, 0.060936927795410156, 0.06472396850585938, 0.0685110092163086, 0.07229804992675781, 0.07608509063720703, 0.07987213134765625, 0.08365917205810547, 0.08744621276855469, 0.0912332534790039, 0.09502029418945312, 0.09880733489990234, 0.10259437561035156, 0.10638141632080078, 0.11016845703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 10.0, 13.0, 31.0, 39.0, 59.0, 68.0, 108.0, 144.0, 121.0, 128.0, 93.0, 73.0, 45.0, 18.0, 19.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.001615524291992, -3.910857915878296, -3.8201003074645996, -3.729342460632324, -3.638584852218628, -3.5478272438049316, -3.4570696353912354, -3.366312026977539, -3.2755544185638428, -3.1847968101501465, -3.09403920173645, -3.003281593322754, -2.9125237464904785, -2.8217661380767822, -2.731008529663086, -2.6402509212493896, -2.5494933128356934, -2.458735704421997, -2.367978096008301, -2.2772202491760254, -2.186462640762329, -2.095705032348633, -2.0049474239349365, -1.9141898155212402, -1.8234319686889648, -1.7326743602752686, -1.6419166326522827, -1.5511590242385864, -1.4604014158248901, -1.3696436882019043, -1.278886079788208, -1.1881284713745117, -1.0973708629608154, -1.0066132545471191, -0.9158555865287781, -0.825097918510437, -0.7343403100967407, -0.6435826420783997, -0.5528249740600586, -0.4620673656463623, -0.37130969762802124, -0.28055205941200256, -0.1897944062948227, -0.09903675317764282, -0.008279114961624146, 0.08247852325439453, 0.1732361912727356, 0.2639937996864319, 0.35475146770477295, 0.4455091059207916, 0.5362667441368103, 0.6270244121551514, 0.7177820205688477, 0.8085396885871887, 0.8992973566055298, 0.9900549650192261, 1.080812692642212, 1.1715703010559082, 1.262328028678894, 1.3530856370925903, 1.4438432455062866, 1.5346009731292725, 1.6253585815429688, 1.716116189956665, 1.8068737983703613]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 7.0, 7.0, 8.0, 15.0, 12.0, 21.0, 17.0, 24.0, 24.0, 25.0, 28.0, 36.0, 35.0, 30.0, 32.0, 54.0, 41.0, 47.0, 33.0, 42.0, 52.0, 36.0, 36.0, 36.0, 40.0, 55.0, 32.0, 29.0, 27.0, 20.0, 15.0, 16.0, 9.0, 11.0, 6.0, 7.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1570268869400024, -1.1179341077804565, -1.078841209411621, -1.0397484302520752, -1.0006556510925293, -0.9615628123283386, -0.922469973564148, -0.883377194404602, -0.8442843556404114, -0.8051915168762207, -0.7660987377166748, -0.7270058989524841, -0.6879130601882935, -0.6488202810287476, -0.6097274422645569, -0.5706346035003662, -0.5315418243408203, -0.492449015378952, -0.45335620641708374, -0.41426336765289307, -0.3751705586910248, -0.3360777497291565, -0.2969849109649658, -0.25789210200309753, -0.21879929304122925, -0.17970648407936096, -0.14061366021633148, -0.1015208438038826, -0.062428027391433716, -0.02333521842956543, 0.01575760543346405, 0.05485042929649353, 0.09394311904907227, 0.13303592801094055, 0.17212875187397003, 0.2112215757369995, 0.2503143846988678, 0.2894071936607361, 0.32850003242492676, 0.36759284138679504, 0.40668565034866333, 0.4457784593105316, 0.4848712682723999, 0.5239641070365906, 0.5630569458007812, 0.6021497249603271, 0.6412425637245178, 0.6803354024887085, 0.7194281816482544, 0.7585210204124451, 0.797613799571991, 0.8367066383361816, 0.8757994174957275, 0.9148922562599182, 0.9539850950241089, 0.9930778741836548, 1.0321707725524902, 1.0712635517120361, 1.1103564500808716, 1.1494492292404175, 1.1885420083999634, 1.2276349067687988, 1.2667276859283447, 1.3058204650878906, 1.3449132442474365]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 12.0, 24.0, 35.0, 34.0, 68.0, 67.0, 115.0, 168.0, 236.0, 400.0, 534.0, 826.0, 1382.0, 2176.0, 3665.0, 6446.0, 11789.0, 21956.0, 41567.0, 79803.0, 144908.0, 217768.0, 212119.0, 139219.0, 76003.0, 39293.0, 21277.0, 11207.0, 6048.0, 3550.0, 2053.0, 1279.0, 803.0, 536.0, 378.0, 240.0, 184.0, 108.0, 67.0, 72.0, 33.0, 21.0, 22.0, 14.0, 12.0, 8.0, 8.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5070838928222656, -0.49121856689453125, -0.4753532409667969, -0.4594879150390625, -0.4436225891113281, -0.42775726318359375, -0.4118919372558594, -0.396026611328125, -0.3801612854003906, -0.36429595947265625, -0.3484306335449219, -0.3325653076171875, -0.3166999816894531, -0.30083465576171875, -0.2849693298339844, -0.26910400390625, -0.2532386779785156, -0.23737335205078125, -0.22150802612304688, -0.2056427001953125, -0.18977737426757812, -0.17391204833984375, -0.15804672241210938, -0.142181396484375, -0.12631607055664062, -0.11045074462890625, -0.09458541870117188, -0.0787200927734375, -0.06285476684570312, -0.04698944091796875, -0.031124114990234375, -0.0152587890625, 0.000606536865234375, 0.01647186279296875, 0.032337188720703125, 0.0482025146484375, 0.06406784057617188, 0.07993316650390625, 0.09579849243164062, 0.111663818359375, 0.12752914428710938, 0.14339447021484375, 0.15925979614257812, 0.1751251220703125, 0.19099044799804688, 0.20685577392578125, 0.22272109985351562, 0.23858642578125, 0.2544517517089844, 0.27031707763671875, 0.2861824035644531, 0.3020477294921875, 0.3179130554199219, 0.33377838134765625, 0.3496437072753906, 0.365509033203125, 0.3813743591308594, 0.39723968505859375, 0.4131050109863281, 0.4289703369140625, 0.4448356628417969, 0.46070098876953125, 0.4765663146972656, 0.492431640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 11.0, 14.0, 16.0, 19.0, 19.0, 26.0, 34.0, 26.0, 29.0, 42.0, 44.0, 52.0, 40.0, 66.0, 45.0, 66.0, 39.0, 49.0, 33.0, 34.0, 39.0, 33.0, 30.0, 30.0, 26.0, 20.0, 14.0, 16.0, 18.0, 16.0, 9.0, 3.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5850830078125, -9.271728515625, -8.9583740234375, -8.64501953125, -8.3316650390625, -8.018310546875, -7.7049560546875, -7.3916015625, -7.0782470703125, -6.764892578125, -6.4515380859375, -6.13818359375, -5.8248291015625, -5.511474609375, -5.1981201171875, -4.884765625, -4.5714111328125, -4.258056640625, -3.9447021484375, -3.63134765625, -3.3179931640625, -3.004638671875, -2.6912841796875, -2.3779296875, -2.0645751953125, -1.751220703125, -1.4378662109375, -1.12451171875, -0.8111572265625, -0.497802734375, -0.1844482421875, 0.12890625, 0.4422607421875, 0.755615234375, 1.0689697265625, 1.38232421875, 1.6956787109375, 2.009033203125, 2.3223876953125, 2.6357421875, 2.9490966796875, 3.262451171875, 3.5758056640625, 3.88916015625, 4.2025146484375, 4.515869140625, 4.8292236328125, 5.142578125, 5.4559326171875, 5.769287109375, 6.0826416015625, 6.39599609375, 6.7093505859375, 7.022705078125, 7.3360595703125, 7.6494140625, 7.9627685546875, 8.276123046875, 8.5894775390625, 8.90283203125, 9.2161865234375, 9.529541015625, 9.8428955078125, 10.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 29.0, 28.0, 29.0, 51.0, 56.0, 71.0, 90.0, 137.0, 206.0, 252.0, 458.0, 935.0, 5275.0, 306446.0, 719950.0, 11745.0, 1222.0, 533.0, 279.0, 185.0, 136.0, 84.0, 81.0, 44.0, 41.0, 33.0, 26.0, 24.0, 8.0, 12.0, 7.0, 6.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.83984375, -3.7203369140625, -3.600830078125, -3.4813232421875, -3.36181640625, -3.2423095703125, -3.122802734375, -3.0032958984375, -2.8837890625, -2.7642822265625, -2.644775390625, -2.5252685546875, -2.40576171875, -2.2862548828125, -2.166748046875, -2.0472412109375, -1.927734375, -1.8082275390625, -1.688720703125, -1.5692138671875, -1.44970703125, -1.3302001953125, -1.210693359375, -1.0911865234375, -0.9716796875, -0.8521728515625, -0.732666015625, -0.6131591796875, -0.49365234375, -0.3741455078125, -0.254638671875, -0.1351318359375, -0.015625, 0.1038818359375, 0.223388671875, 0.3428955078125, 0.46240234375, 0.5819091796875, 0.701416015625, 0.8209228515625, 0.9404296875, 1.0599365234375, 1.179443359375, 1.2989501953125, 1.41845703125, 1.5379638671875, 1.657470703125, 1.7769775390625, 1.896484375, 2.0159912109375, 2.135498046875, 2.2550048828125, 2.37451171875, 2.4940185546875, 2.613525390625, 2.7330322265625, 2.8525390625, 2.9720458984375, 3.091552734375, 3.2110595703125, 3.33056640625, 3.4500732421875, 3.569580078125, 3.6890869140625, 3.80859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 19.0, 8.0, 22.0, 13.0, 22.0, 29.0, 25.0, 35.0, 46.0, 35.0, 38.0, 35.0, 48.0, 42.0, 54.0, 53.0, 47.0, 44.0, 46.0, 50.0, 24.0, 46.0, 28.0, 21.0, 30.0, 21.0, 10.0, 14.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83203125, -7.55230712890625, -7.2725830078125, -6.99285888671875, -6.713134765625, -6.43341064453125, -6.1536865234375, -5.87396240234375, -5.59423828125, -5.31451416015625, -5.0347900390625, -4.75506591796875, -4.475341796875, -4.19561767578125, -3.9158935546875, -3.63616943359375, -3.3564453125, -3.07672119140625, -2.7969970703125, -2.51727294921875, -2.237548828125, -1.95782470703125, -1.6781005859375, -1.39837646484375, -1.11865234375, -0.83892822265625, -0.5592041015625, -0.27947998046875, 0.000244140625, 0.27996826171875, 0.5596923828125, 0.83941650390625, 1.119140625, 1.39886474609375, 1.6785888671875, 1.95831298828125, 2.238037109375, 2.51776123046875, 2.7974853515625, 3.07720947265625, 3.35693359375, 3.63665771484375, 3.9163818359375, 4.19610595703125, 4.475830078125, 4.75555419921875, 5.0352783203125, 5.31500244140625, 5.5947265625, 5.87445068359375, 6.1541748046875, 6.43389892578125, 6.713623046875, 6.99334716796875, 7.2730712890625, 7.55279541015625, 7.83251953125, 8.11224365234375, 8.3919677734375, 8.67169189453125, 8.951416015625, 9.23114013671875, 9.5108642578125, 9.79058837890625, 10.0703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 1.0, 8.0, 9.0, 15.0, 35.0, 42.0, 39.0, 77.0, 116.0, 244.0, 524.0, 1510.0, 6504.0, 92715.0, 907955.0, 32851.0, 3906.0, 1100.0, 410.0, 184.0, 119.0, 64.0, 48.0, 29.0, 21.0, 10.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6166839599609375, -0.595672607421875, -0.5746612548828125, -0.55364990234375, -0.5326385498046875, -0.511627197265625, -0.4906158447265625, -0.4696044921875, -0.4485931396484375, -0.427581787109375, -0.4065704345703125, -0.38555908203125, -0.3645477294921875, -0.343536376953125, -0.3225250244140625, -0.301513671875, -0.2805023193359375, -0.259490966796875, -0.2384796142578125, -0.21746826171875, -0.1964569091796875, -0.175445556640625, -0.1544342041015625, -0.1334228515625, -0.1124114990234375, -0.091400146484375, -0.0703887939453125, -0.04937744140625, -0.0283660888671875, -0.007354736328125, 0.0136566162109375, 0.03466796875, 0.0556793212890625, 0.076690673828125, 0.0977020263671875, 0.11871337890625, 0.1397247314453125, 0.160736083984375, 0.1817474365234375, 0.2027587890625, 0.2237701416015625, 0.244781494140625, 0.2657928466796875, 0.28680419921875, 0.3078155517578125, 0.328826904296875, 0.3498382568359375, 0.370849609375, 0.3918609619140625, 0.412872314453125, 0.4338836669921875, 0.45489501953125, 0.4759063720703125, 0.496917724609375, 0.5179290771484375, 0.5389404296875, 0.5599517822265625, 0.580963134765625, 0.6019744873046875, 0.62298583984375, 0.6439971923828125, 0.665008544921875, 0.6860198974609375, 0.70703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 9.0, 12.0, 15.0, 28.0, 17.0, 49.0, 67.0, 104.0, 158.0, 169.0, 133.0, 70.0, 45.0, 38.0, 27.0, 16.0, 8.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.595518112182617e-05, -4.413537681102753e-05, -4.231557250022888e-05, -4.049576818943024e-05, -3.867596387863159e-05, -3.685615956783295e-05, -3.50363552570343e-05, -3.321655094623566e-05, -3.139674663543701e-05, -2.9576942324638367e-05, -2.775713801383972e-05, -2.5937333703041077e-05, -2.411752939224243e-05, -2.2297725081443787e-05, -2.047792077064514e-05, -1.8658116459846497e-05, -1.683831214904785e-05, -1.5018507838249207e-05, -1.3198703527450562e-05, -1.1378899216651917e-05, -9.559094905853271e-06, -7.739290595054626e-06, -5.9194862842559814e-06, -4.0996819734573364e-06, -2.2798776626586914e-06, -4.600733518600464e-07, 1.3597309589385986e-06, 3.1795352697372437e-06, 4.999339580535889e-06, 6.819143891334534e-06, 8.638948202133179e-06, 1.0458752512931824e-05, 1.2278556823730469e-05, 1.4098361134529114e-05, 1.591816544532776e-05, 1.7737969756126404e-05, 1.955777406692505e-05, 2.1377578377723694e-05, 2.319738268852234e-05, 2.5017186999320984e-05, 2.683699131011963e-05, 2.8656795620918274e-05, 3.047659993171692e-05, 3.2296404242515564e-05, 3.411620855331421e-05, 3.5936012864112854e-05, 3.77558171749115e-05, 3.9575621485710144e-05, 4.139542579650879e-05, 4.3215230107307434e-05, 4.503503441810608e-05, 4.6854838728904724e-05, 4.867464303970337e-05, 5.0494447350502014e-05, 5.231425166130066e-05, 5.4134055972099304e-05, 5.595386028289795e-05, 5.7773664593696594e-05, 5.959346890449524e-05, 6.141327321529388e-05, 6.323307752609253e-05, 6.505288183689117e-05, 6.687268614768982e-05, 6.869249045848846e-05, 7.051229476928711e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 13.0, 17.0, 14.0, 29.0, 38.0, 45.0, 82.0, 201.0, 447.0, 1742.0, 10270.0, 181548.0, 818256.0, 30852.0, 3626.0, 803.0, 285.0, 101.0, 59.0, 30.0, 20.0, 20.0, 17.0, 11.0, 4.0, 9.0, 3.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.480712890625, -0.4623832702636719, -0.44405364990234375, -0.4257240295410156, -0.4073944091796875, -0.3890647888183594, -0.37073516845703125, -0.3524055480957031, -0.334075927734375, -0.3157463073730469, -0.29741668701171875, -0.2790870666503906, -0.2607574462890625, -0.24242782592773438, -0.22409820556640625, -0.20576858520507812, -0.18743896484375, -0.16910934448242188, -0.15077972412109375, -0.13245010375976562, -0.1141204833984375, -0.09579086303710938, -0.07746124267578125, -0.059131622314453125, -0.040802001953125, -0.022472381591796875, -0.00414276123046875, 0.014186859130859375, 0.0325164794921875, 0.050846099853515625, 0.06917572021484375, 0.08750534057617188, 0.1058349609375, 0.12416458129882812, 0.14249420166015625, 0.16082382202148438, 0.1791534423828125, 0.19748306274414062, 0.21581268310546875, 0.23414230346679688, 0.252471923828125, 0.2708015441894531, 0.28913116455078125, 0.3074607849121094, 0.3257904052734375, 0.3441200256347656, 0.36244964599609375, 0.3807792663574219, 0.39910888671875, 0.4174385070800781, 0.43576812744140625, 0.4540977478027344, 0.4724273681640625, 0.4907569885253906, 0.5090866088867188, 0.5274162292480469, 0.545745849609375, 0.5640754699707031, 0.5824050903320312, 0.6007347106933594, 0.6190643310546875, 0.6373939514160156, 0.6557235717773438, 0.6740531921386719, 0.6923828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 9.0, 13.0, 19.0, 19.0, 23.0, 20.0, 37.0, 45.0, 69.0, 100.0, 137.0, 141.0, 91.0, 59.0, 43.0, 34.0, 27.0, 18.0, 23.0, 16.0, 10.0, 9.0, 9.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10498046875, -0.10107803344726562, -0.09717559814453125, -0.09327316284179688, -0.0893707275390625, -0.08546829223632812, -0.08156585693359375, -0.07766342163085938, -0.073760986328125, -0.06985855102539062, -0.06595611572265625, -0.062053680419921875, -0.0581512451171875, -0.054248809814453125, -0.05034637451171875, -0.046443939208984375, -0.04254150390625, -0.038639068603515625, -0.03473663330078125, -0.030834197998046875, -0.0269317626953125, -0.023029327392578125, -0.01912689208984375, -0.015224456787109375, -0.011322021484375, -0.007419586181640625, -0.00351715087890625, 0.000385284423828125, 0.0042877197265625, 0.008190155029296875, 0.01209259033203125, 0.015995025634765625, 0.0198974609375, 0.023799896240234375, 0.02770233154296875, 0.031604766845703125, 0.0355072021484375, 0.039409637451171875, 0.04331207275390625, 0.047214508056640625, 0.051116943359375, 0.055019378662109375, 0.05892181396484375, 0.06282424926757812, 0.0667266845703125, 0.07062911987304688, 0.07453155517578125, 0.07843399047851562, 0.08233642578125, 0.08623886108398438, 0.09014129638671875, 0.09404373168945312, 0.0979461669921875, 0.10184860229492188, 0.10575103759765625, 0.10965347290039062, 0.113555908203125, 0.11745834350585938, 0.12136077880859375, 0.12526321411132812, 0.1291656494140625, 0.13306808471679688, 0.13697052001953125, 0.14087295532226562, 0.144775390625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 255.0, 739.0, 22.0], "bins": [-82.84195709228516, -81.51062774658203, -80.1792984008789, -78.84796905517578, -77.51663970947266, -76.18531036376953, -74.8539810180664, -73.52265167236328, -72.19132232666016, -70.85999298095703, -69.5286636352539, -68.19733428955078, -66.86600494384766, -65.53467559814453, -64.2033462524414, -62.87201690673828, -61.54069137573242, -60.2093620300293, -58.87803268432617, -57.54670333862305, -56.21537399291992, -54.8840446472168, -53.55271530151367, -52.22138977050781, -50.89006042480469, -49.55873107910156, -48.22740173339844, -46.89607238769531, -45.56474304199219, -44.23341369628906, -42.90208435058594, -41.57075500488281, -40.23942947387695, -38.90810012817383, -37.5767707824707, -36.24544143676758, -34.91411209106445, -33.58278274536133, -32.2514533996582, -30.92012596130371, -29.588796615600586, -28.25746726989746, -26.926137924194336, -25.59480857849121, -24.26348114013672, -22.932151794433594, -21.60082244873047, -20.269493103027344, -18.93816375732422, -17.606834411621094, -16.27550506591797, -14.94417667388916, -13.612847328186035, -12.28151798248291, -10.950189590454102, -9.618860244750977, -8.287530899047852, -6.956201553344727, -5.62487268447876, -4.293543815612793, -2.962214469909668, -1.630885124206543, -0.29955625534057617, 1.0317726135253906, 2.3631019592285156]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 6.0, 7.0, 8.0, 8.0, 9.0, 15.0, 15.0, 31.0, 29.0, 18.0, 33.0, 27.0, 23.0, 35.0, 36.0, 33.0, 32.0, 41.0, 36.0, 36.0, 42.0, 39.0, 41.0, 37.0, 38.0, 37.0, 33.0, 34.0, 30.0, 27.0, 36.0, 20.0, 23.0, 11.0, 17.0, 14.0, 9.0, 2.0, 4.0, 3.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.697251319885254, -12.286035537719727, -11.8748197555542, -11.463603973388672, -11.052389144897461, -10.641173362731934, -10.229957580566406, -9.818741798400879, -9.407526016235352, -8.996310234069824, -8.585094451904297, -8.173879623413086, -7.7626633644104, -7.351448059082031, -6.940232276916504, -6.529016494750977, -6.117801189422607, -5.70658540725708, -5.295370101928711, -4.884154319763184, -4.472938537597656, -4.061722755432129, -3.6505074501037598, -3.2392916679382324, -2.828076124191284, -2.416860580444336, -2.0056447982788086, -1.5944292545318604, -1.1832135915756226, -0.7719979286193848, -0.3607823848724365, 0.05043339729309082, 0.46164894104003906, 0.8728646039962769, 1.2840802669525146, 1.695295810699463, 2.1065115928649902, 2.5177271366119385, 2.9289426803588867, 3.340158462524414, 3.7513740062713623, 4.1625895500183105, 4.573805332183838, 4.985020637512207, 5.396236419677734, 5.807452201843262, 6.218667984008789, 6.629883766174316, 7.0410990715026855, 7.452314853668213, 7.863530158996582, 8.27474594116211, 8.685961723327637, 9.097177505493164, 9.508392333984375, 9.919609069824219, 10.33082389831543, 10.742039680480957, 11.153255462646484, 11.564470291137695, 11.975686073303223, 12.38690185546875, 12.798117637634277, 13.209333419799805, 13.620549201965332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 3.0, 7.0, 5.0, 24.0, 18.0, 28.0, 31.0, 38.0, 48.0, 70.0, 116.0, 249.0, 940.0, 6163.0, 88824.0, 1813766.0, 2159990.0, 114777.0, 7349.0, 1154.0, 282.0, 112.0, 70.0, 42.0, 34.0, 23.0, 22.0, 19.0, 15.0, 20.0, 4.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.28515625, -4.166259765625, -4.04736328125, -3.928466796875, -3.8095703125, -3.690673828125, -3.57177734375, -3.452880859375, -3.333984375, -3.215087890625, -3.09619140625, -2.977294921875, -2.8583984375, -2.739501953125, -2.62060546875, -2.501708984375, -2.3828125, -2.263916015625, -2.14501953125, -2.026123046875, -1.9072265625, -1.788330078125, -1.66943359375, -1.550537109375, -1.431640625, -1.312744140625, -1.19384765625, -1.074951171875, -0.9560546875, -0.837158203125, -0.71826171875, -0.599365234375, -0.48046875, -0.361572265625, -0.24267578125, -0.123779296875, -0.0048828125, 0.114013671875, 0.23291015625, 0.351806640625, 0.470703125, 0.589599609375, 0.70849609375, 0.827392578125, 0.9462890625, 1.065185546875, 1.18408203125, 1.302978515625, 1.421875, 1.540771484375, 1.65966796875, 1.778564453125, 1.8974609375, 2.016357421875, 2.13525390625, 2.254150390625, 2.373046875, 2.491943359375, 2.61083984375, 2.729736328125, 2.8486328125, 2.967529296875, 3.08642578125, 3.205322265625, 3.32421875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 14.0, 12.0, 14.0, 14.0, 15.0, 33.0, 35.0, 36.0, 42.0, 38.0, 42.0, 55.0, 47.0, 44.0, 57.0, 48.0, 43.0, 50.0, 45.0, 34.0, 47.0, 31.0, 25.0, 33.0, 24.0, 25.0, 19.0, 13.0, 7.0, 10.0, 9.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.767578125, -1.713775634765625, -1.65997314453125, -1.606170654296875, -1.5523681640625, -1.498565673828125, -1.44476318359375, -1.390960693359375, -1.337158203125, -1.283355712890625, -1.22955322265625, -1.175750732421875, -1.1219482421875, -1.068145751953125, -1.01434326171875, -0.960540771484375, -0.90673828125, -0.852935791015625, -0.79913330078125, -0.745330810546875, -0.6915283203125, -0.637725830078125, -0.58392333984375, -0.530120849609375, -0.476318359375, -0.422515869140625, -0.36871337890625, -0.314910888671875, -0.2611083984375, -0.207305908203125, -0.15350341796875, -0.099700927734375, -0.0458984375, 0.007904052734375, 0.06170654296875, 0.115509033203125, 0.1693115234375, 0.223114013671875, 0.27691650390625, 0.330718994140625, 0.384521484375, 0.438323974609375, 0.49212646484375, 0.545928955078125, 0.5997314453125, 0.653533935546875, 0.70733642578125, 0.761138916015625, 0.81494140625, 0.868743896484375, 0.92254638671875, 0.976348876953125, 1.0301513671875, 1.083953857421875, 1.13775634765625, 1.191558837890625, 1.245361328125, 1.299163818359375, 1.35296630859375, 1.406768798828125, 1.4605712890625, 1.514373779296875, 1.56817626953125, 1.621978759765625, 1.67578125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 8.0, 16.0, 16.0, 35.0, 134.0, 6988.0, 4186645.0, 260.0, 74.0, 22.0, 15.0, 10.0, 10.0, 10.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.1875, -75.16259765625, -73.1376953125, -71.11279296875, -69.087890625, -67.06298828125, -65.0380859375, -63.01318359375, -60.98828125, -58.96337890625, -56.9384765625, -54.91357421875, -52.888671875, -50.86376953125, -48.8388671875, -46.81396484375, -44.7890625, -42.76416015625, -40.7392578125, -38.71435546875, -36.689453125, -34.66455078125, -32.6396484375, -30.61474609375, -28.58984375, -26.56494140625, -24.5400390625, -22.51513671875, -20.490234375, -18.46533203125, -16.4404296875, -14.41552734375, -12.390625, -10.36572265625, -8.3408203125, -6.31591796875, -4.291015625, -2.26611328125, -0.2412109375, 1.78369140625, 3.80859375, 5.83349609375, 7.8583984375, 9.88330078125, 11.908203125, 13.93310546875, 15.9580078125, 17.98291015625, 20.0078125, 22.03271484375, 24.0576171875, 26.08251953125, 28.107421875, 30.13232421875, 32.1572265625, 34.18212890625, 36.20703125, 38.23193359375, 40.2568359375, 42.28173828125, 44.306640625, 46.33154296875, 48.3564453125, 50.38134765625, 52.40625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 12.0, 17.0, 21.0, 19.0, 37.0, 63.0, 91.0, 153.0, 236.0, 296.0, 470.0, 620.0, 599.0, 480.0, 296.0, 221.0, 144.0, 104.0, 49.0, 41.0, 31.0, 20.0, 16.0, 9.0, 6.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.527191162109375, -0.50311279296875, -0.479034423828125, -0.4549560546875, -0.430877685546875, -0.40679931640625, -0.382720947265625, -0.358642578125, -0.334564208984375, -0.31048583984375, -0.286407470703125, -0.2623291015625, -0.238250732421875, -0.21417236328125, -0.190093994140625, -0.166015625, -0.141937255859375, -0.11785888671875, -0.093780517578125, -0.0697021484375, -0.045623779296875, -0.02154541015625, 0.002532958984375, 0.026611328125, 0.050689697265625, 0.07476806640625, 0.098846435546875, 0.1229248046875, 0.147003173828125, 0.17108154296875, 0.195159912109375, 0.21923828125, 0.243316650390625, 0.26739501953125, 0.291473388671875, 0.3155517578125, 0.339630126953125, 0.36370849609375, 0.387786865234375, 0.411865234375, 0.435943603515625, 0.46002197265625, 0.484100341796875, 0.5081787109375, 0.532257080078125, 0.55633544921875, 0.580413818359375, 0.6044921875, 0.628570556640625, 0.65264892578125, 0.676727294921875, 0.7008056640625, 0.724884033203125, 0.74896240234375, 0.773040771484375, 0.797119140625, 0.821197509765625, 0.84527587890625, 0.869354248046875, 0.8934326171875, 0.917510986328125, 0.94158935546875, 0.965667724609375, 0.98974609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 20.0, 34.0, 81.0, 92.0, 180.0, 176.0, 155.0, 96.0, 68.0, 42.0, 23.0, 13.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.36844539642334, -6.221563339233398, -6.074681282043457, -5.927798748016357, -5.780916690826416, -5.634034633636475, -5.487152099609375, -5.340270042419434, -5.193387985229492, -5.046505928039551, -4.899623870849609, -4.75274133682251, -4.605859279632568, -4.458977222442627, -4.312094688415527, -4.165212631225586, -4.0183305740356445, -3.871448516845703, -3.7245662212371826, -3.577683925628662, -3.4308018684387207, -3.2839198112487793, -3.137037515640259, -2.9901552200317383, -2.843273162841797, -2.6963911056518555, -2.549508810043335, -2.4026265144348145, -2.255744457244873, -2.1088624000549316, -1.9619801044464111, -1.8150979280471802, -1.6682162284851074, -1.5213340520858765, -1.3744518756866455, -1.2275696992874146, -1.0806875228881836, -0.9338053464889526, -0.7869231700897217, -0.6400409936904907, -0.49315881729125977, -0.3462766408920288, -0.19939446449279785, -0.052512288093566895, 0.09436988830566406, 0.24125206470489502, 0.388134241104126, 0.5350164175033569, 0.6818985939025879, 0.8287807703018188, 0.9756629467010498, 1.1225451231002808, 1.2694272994995117, 1.4163094758987427, 1.5631916522979736, 1.7100738286972046, 1.8569560050964355, 2.003838062286377, 2.1507203578948975, 2.297602653503418, 2.4444847106933594, 2.591366767883301, 2.7382490634918213, 2.885131359100342, 3.032013416290283]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 11.0, 8.0, 12.0, 19.0, 9.0, 13.0, 23.0, 20.0, 22.0, 24.0, 26.0, 37.0, 37.0, 29.0, 31.0, 43.0, 48.0, 54.0, 35.0, 43.0, 45.0, 45.0, 39.0, 30.0, 34.0, 35.0, 34.0, 22.0, 16.0, 20.0, 23.0, 22.0, 15.0, 12.0, 12.0, 7.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6271095275878906, -1.5789276361465454, -1.5307457447052002, -1.482563853263855, -1.4343819618225098, -1.386200189590454, -1.3380181789398193, -1.2898364067077637, -1.2416545152664185, -1.1934726238250732, -1.145290732383728, -1.0971088409423828, -1.0489269495010376, -1.0007450580596924, -0.9525632262229919, -0.9043813943862915, -0.8561994433403015, -0.8080175518989563, -0.7598356604576111, -0.7116538286209106, -0.6634719371795654, -0.6152900457382202, -0.567108154296875, -0.5189262628555298, -0.47074440121650696, -0.42256250977516174, -0.3743806481361389, -0.3261987566947937, -0.2780168652534485, -0.22983500361442566, -0.18165311217308044, -0.13347125053405762, -0.0852893590927124, -0.03710747882723808, 0.011074401438236237, 0.059256285429000854, 0.10743816196918488, 0.1556200385093689, 0.2038019299507141, 0.25198379158973694, 0.30016568303108215, 0.34834757447242737, 0.3965294361114502, 0.4447113275527954, 0.4928932189941406, 0.5410751104354858, 0.589257001876831, 0.6374388337135315, 0.6856207251548767, 0.7338026165962219, 0.7819845080375671, 0.8301663398742676, 0.8783482313156128, 0.926530122756958, 0.9747120141983032, 1.0228939056396484, 1.0710757970809937, 1.1192576885223389, 1.167439579963684, 1.2156214714050293, 1.2638033628463745, 1.3119852542877197, 1.3601670265197754, 1.4083489179611206, 1.4565308094024658]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 19.0, 39.0, 61.0, 111.0, 162.0, 232.0, 388.0, 552.0, 852.0, 1405.0, 2312.0, 3796.0, 7427.0, 14584.0, 32584.0, 77644.0, 177770.0, 304392.0, 231519.0, 106457.0, 44893.0, 19716.0, 9253.0, 4917.0, 2794.0, 1721.0, 1082.0, 660.0, 394.0, 257.0, 192.0, 111.0, 79.0, 51.0, 32.0, 24.0, 14.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.63671875, -0.6183624267578125, -0.600006103515625, -0.5816497802734375, -0.56329345703125, -0.5449371337890625, -0.526580810546875, -0.5082244873046875, -0.4898681640625, -0.4715118408203125, -0.453155517578125, -0.4347991943359375, -0.41644287109375, -0.3980865478515625, -0.379730224609375, -0.3613739013671875, -0.343017578125, -0.3246612548828125, -0.306304931640625, -0.2879486083984375, -0.26959228515625, -0.2512359619140625, -0.232879638671875, -0.2145233154296875, -0.1961669921875, -0.1778106689453125, -0.159454345703125, -0.1410980224609375, -0.12274169921875, -0.1043853759765625, -0.086029052734375, -0.0676727294921875, -0.04931640625, -0.0309600830078125, -0.012603759765625, 0.0057525634765625, 0.02410888671875, 0.0424652099609375, 0.060821533203125, 0.0791778564453125, 0.0975341796875, 0.1158905029296875, 0.134246826171875, 0.1526031494140625, 0.17095947265625, 0.1893157958984375, 0.207672119140625, 0.2260284423828125, 0.244384765625, 0.2627410888671875, 0.281097412109375, 0.2994537353515625, 0.31781005859375, 0.3361663818359375, 0.354522705078125, 0.3728790283203125, 0.3912353515625, 0.4095916748046875, 0.427947998046875, 0.4463043212890625, 0.46466064453125, 0.4830169677734375, 0.501373291015625, 0.5197296142578125, 0.5380859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 4.0, 4.0, 11.0, 5.0, 7.0, 9.0, 14.0, 23.0, 27.0, 27.0, 29.0, 33.0, 38.0, 33.0, 48.0, 43.0, 37.0, 50.0, 53.0, 62.0, 47.0, 51.0, 41.0, 40.0, 33.0, 21.0, 24.0, 32.0, 23.0, 24.0, 21.0, 23.0, 12.0, 11.0, 14.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9617233276367188, -0.9258880615234375, -0.8900527954101562, -0.854217529296875, -0.8183822631835938, -0.7825469970703125, -0.7467117309570312, -0.71087646484375, -0.6750411987304688, -0.6392059326171875, -0.6033706665039062, -0.567535400390625, -0.5317001342773438, -0.4958648681640625, -0.46002960205078125, -0.4241943359375, -0.38835906982421875, -0.3525238037109375, -0.31668853759765625, -0.280853271484375, -0.24501800537109375, -0.2091827392578125, -0.17334747314453125, -0.13751220703125, -0.10167694091796875, -0.0658416748046875, -0.03000640869140625, 0.005828857421875, 0.04166412353515625, 0.0774993896484375, 0.11333465576171875, 0.149169921875, 0.18500518798828125, 0.2208404541015625, 0.25667572021484375, 0.292510986328125, 0.32834625244140625, 0.3641815185546875, 0.40001678466796875, 0.43585205078125, 0.47168731689453125, 0.5075225830078125, 0.5433578491210938, 0.579193115234375, 0.6150283813476562, 0.6508636474609375, 0.6866989135742188, 0.7225341796875, 0.7583694458007812, 0.7942047119140625, 0.8300399780273438, 0.865875244140625, 0.9017105102539062, 0.9375457763671875, 0.9733810424804688, 1.00921630859375, 1.0450515747070312, 1.0808868408203125, 1.1167221069335938, 1.152557373046875, 1.1883926391601562, 1.2242279052734375, 1.2600631713867188, 1.2958984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 6.0, 17.0, 20.0, 31.0, 38.0, 63.0, 89.0, 133.0, 219.0, 347.0, 649.0, 1148.0, 2473.0, 5946.0, 14993.0, 41968.0, 123265.0, 314465.0, 332316.0, 135350.0, 46240.0, 16458.0, 6457.0, 2829.0, 1317.0, 690.0, 350.0, 210.0, 148.0, 96.0, 52.0, 39.0, 28.0, 24.0, 15.0, 11.0, 15.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7841796875, -0.7589187622070312, -0.7336578369140625, -0.7083969116210938, -0.683135986328125, -0.6578750610351562, -0.6326141357421875, -0.6073532104492188, -0.58209228515625, -0.5568313598632812, -0.5315704345703125, -0.5063095092773438, -0.481048583984375, -0.45578765869140625, -0.4305267333984375, -0.40526580810546875, -0.3800048828125, -0.35474395751953125, -0.3294830322265625, -0.30422210693359375, -0.278961181640625, -0.25370025634765625, -0.2284393310546875, -0.20317840576171875, -0.17791748046875, -0.15265655517578125, -0.1273956298828125, -0.10213470458984375, -0.076873779296875, -0.05161285400390625, -0.0263519287109375, -0.00109100341796875, 0.024169921875, 0.04943084716796875, 0.0746917724609375, 0.09995269775390625, 0.125213623046875, 0.15047454833984375, 0.1757354736328125, 0.20099639892578125, 0.22625732421875, 0.25151824951171875, 0.2767791748046875, 0.30204010009765625, 0.327301025390625, 0.35256195068359375, 0.3778228759765625, 0.40308380126953125, 0.4283447265625, 0.45360565185546875, 0.4788665771484375, 0.5041275024414062, 0.529388427734375, 0.5546493530273438, 0.5799102783203125, 0.6051712036132812, 0.63043212890625, 0.6556930541992188, 0.6809539794921875, 0.7062149047851562, 0.731475830078125, 0.7567367553710938, 0.7819976806640625, 0.8072586059570312, 0.83251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 4.0, 6.0, 10.0, 8.0, 13.0, 15.0, 21.0, 27.0, 35.0, 35.0, 34.0, 40.0, 62.0, 60.0, 64.0, 52.0, 74.0, 58.0, 59.0, 69.0, 38.0, 40.0, 29.0, 35.0, 24.0, 20.0, 16.0, 11.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.353179931640625, -2.26885986328125, -2.184539794921875, -2.1002197265625, -2.015899658203125, -1.93157958984375, -1.847259521484375, -1.762939453125, -1.678619384765625, -1.59429931640625, -1.509979248046875, -1.4256591796875, -1.341339111328125, -1.25701904296875, -1.172698974609375, -1.08837890625, -1.004058837890625, -0.91973876953125, -0.835418701171875, -0.7510986328125, -0.666778564453125, -0.58245849609375, -0.498138427734375, -0.413818359375, -0.329498291015625, -0.24517822265625, -0.160858154296875, -0.0765380859375, 0.007781982421875, 0.09210205078125, 0.176422119140625, 0.2607421875, 0.345062255859375, 0.42938232421875, 0.513702392578125, 0.5980224609375, 0.682342529296875, 0.76666259765625, 0.850982666015625, 0.935302734375, 1.019622802734375, 1.10394287109375, 1.188262939453125, 1.2725830078125, 1.356903076171875, 1.44122314453125, 1.525543212890625, 1.60986328125, 1.694183349609375, 1.77850341796875, 1.862823486328125, 1.9471435546875, 2.031463623046875, 2.11578369140625, 2.200103759765625, 2.284423828125, 2.368743896484375, 2.45306396484375, 2.537384033203125, 2.6217041015625, 2.706024169921875, 2.79034423828125, 2.874664306640625, 2.958984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 5.0, 18.0, 14.0, 25.0, 35.0, 100.0, 120.0, 206.0, 407.0, 955.0, 2055.0, 5649.0, 20990.0, 130160.0, 633284.0, 211929.0, 30213.0, 7669.0, 2577.0, 1041.0, 474.0, 266.0, 139.0, 82.0, 38.0, 38.0, 17.0, 15.0, 5.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.436767578125, -0.42377471923828125, -0.4107818603515625, -0.39778900146484375, -0.384796142578125, -0.37180328369140625, -0.3588104248046875, -0.34581756591796875, -0.33282470703125, -0.31983184814453125, -0.3068389892578125, -0.29384613037109375, -0.280853271484375, -0.26786041259765625, -0.2548675537109375, -0.24187469482421875, -0.2288818359375, -0.21588897705078125, -0.2028961181640625, -0.18990325927734375, -0.176910400390625, -0.16391754150390625, -0.1509246826171875, -0.13793182373046875, -0.12493896484375, -0.11194610595703125, -0.0989532470703125, -0.08596038818359375, -0.072967529296875, -0.05997467041015625, -0.0469818115234375, -0.03398895263671875, -0.02099609375, -0.00800323486328125, 0.0049896240234375, 0.01798248291015625, 0.030975341796875, 0.04396820068359375, 0.0569610595703125, 0.06995391845703125, 0.08294677734375, 0.09593963623046875, 0.1089324951171875, 0.12192535400390625, 0.134918212890625, 0.14791107177734375, 0.1609039306640625, 0.17389678955078125, 0.1868896484375, 0.19988250732421875, 0.2128753662109375, 0.22586822509765625, 0.238861083984375, 0.25185394287109375, 0.2648468017578125, 0.27783966064453125, 0.29083251953125, 0.30382537841796875, 0.3168182373046875, 0.32981109619140625, 0.342803955078125, 0.35579681396484375, 0.3687896728515625, 0.38178253173828125, 0.394775390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 7.0, 3.0, 7.0, 7.0, 17.0, 16.0, 22.0, 49.0, 31.0, 60.0, 66.0, 69.0, 88.0, 114.0, 94.0, 79.0, 62.0, 43.0, 36.0, 25.0, 22.0, 22.0, 12.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00016450881958007812, -0.00016052182763814926, -0.0001565348356962204, -0.00015254784375429153, -0.00014856085181236267, -0.0001445738598704338, -0.00014058686792850494, -0.00013659987598657608, -0.00013261288404464722, -0.00012862589210271835, -0.0001246389001607895, -0.00012065190821886063, -0.00011666491627693176, -0.0001126779243350029, -0.00010869093239307404, -0.00010470394045114517, -0.00010071694850921631, -9.672995656728745e-05, -9.274296462535858e-05, -8.875597268342972e-05, -8.476898074150085e-05, -8.078198879957199e-05, -7.679499685764313e-05, -7.280800491571426e-05, -6.88210129737854e-05, -6.483402103185654e-05, -6.084702908992767e-05, -5.686003714799881e-05, -5.2873045206069946e-05, -4.888605326414108e-05, -4.489906132221222e-05, -4.0912069380283356e-05, -3.692507743835449e-05, -3.293808549642563e-05, -2.8951093554496765e-05, -2.49641016125679e-05, -2.0977109670639038e-05, -1.6990117728710175e-05, -1.3003125786781311e-05, -9.016133844852448e-06, -5.029141902923584e-06, -1.0421499609947205e-06, 2.944841980934143e-06, 6.931833922863007e-06, 1.091882586479187e-05, 1.4905817806720734e-05, 1.8892809748649597e-05, 2.287980169057846e-05, 2.6866793632507324e-05, 3.085378557443619e-05, 3.484077751636505e-05, 3.8827769458293915e-05, 4.281476140022278e-05, 4.680175334215164e-05, 5.0788745284080505e-05, 5.477573722600937e-05, 5.876272916793823e-05, 6.27497211098671e-05, 6.673671305179596e-05, 7.072370499372482e-05, 7.471069693565369e-05, 7.869768887758255e-05, 8.268468081951141e-05, 8.667167276144028e-05, 9.065866470336914e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 10.0, 9.0, 8.0, 10.0, 21.0, 25.0, 32.0, 49.0, 64.0, 103.0, 275.0, 570.0, 2220.0, 25364.0, 949885.0, 65091.0, 3404.0, 777.0, 252.0, 132.0, 88.0, 38.0, 29.0, 30.0, 13.0, 14.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.954376220703125, -0.91851806640625, -0.882659912109375, -0.8468017578125, -0.810943603515625, -0.77508544921875, -0.739227294921875, -0.703369140625, -0.667510986328125, -0.63165283203125, -0.595794677734375, -0.5599365234375, -0.524078369140625, -0.48822021484375, -0.452362060546875, -0.41650390625, -0.380645751953125, -0.34478759765625, -0.308929443359375, -0.2730712890625, -0.237213134765625, -0.20135498046875, -0.165496826171875, -0.129638671875, -0.093780517578125, -0.05792236328125, -0.022064208984375, 0.0137939453125, 0.049652099609375, 0.08551025390625, 0.121368408203125, 0.1572265625, 0.193084716796875, 0.22894287109375, 0.264801025390625, 0.3006591796875, 0.336517333984375, 0.37237548828125, 0.408233642578125, 0.444091796875, 0.479949951171875, 0.51580810546875, 0.551666259765625, 0.5875244140625, 0.623382568359375, 0.65924072265625, 0.695098876953125, 0.73095703125, 0.766815185546875, 0.80267333984375, 0.838531494140625, 0.8743896484375, 0.910247802734375, 0.94610595703125, 0.981964111328125, 1.017822265625, 1.053680419921875, 1.08953857421875, 1.125396728515625, 1.1612548828125, 1.197113037109375, 1.23297119140625, 1.268829345703125, 1.3046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 2.0, 0.0, 5.0, 3.0, 6.0, 14.0, 14.0, 23.0, 30.0, 37.0, 67.0, 98.0, 104.0, 141.0, 118.0, 99.0, 84.0, 52.0, 30.0, 23.0, 22.0, 9.0, 6.0, 5.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.1317577362060547, -0.12716293334960938, -0.12256813049316406, -0.11797332763671875, -0.11337852478027344, -0.10878372192382812, -0.10418891906738281, -0.0995941162109375, -0.09499931335449219, -0.09040451049804688, -0.08580970764160156, -0.08121490478515625, -0.07662010192871094, -0.07202529907226562, -0.06743049621582031, -0.062835693359375, -0.05824089050292969, -0.053646087646484375, -0.04905128479003906, -0.04445648193359375, -0.03986167907714844, -0.035266876220703125, -0.030672073364257812, -0.0260772705078125, -0.021482467651367188, -0.016887664794921875, -0.012292861938476562, -0.00769805908203125, -0.0031032562255859375, 0.001491546630859375, 0.0060863494873046875, 0.01068115234375, 0.015275955200195312, 0.019870758056640625, 0.024465560913085938, 0.02906036376953125, 0.03365516662597656, 0.038249969482421875, 0.04284477233886719, 0.0474395751953125, 0.05203437805175781, 0.056629180908203125, 0.06122398376464844, 0.06581878662109375, 0.07041358947753906, 0.07500839233398438, 0.07960319519042969, 0.084197998046875, 0.08879280090332031, 0.09338760375976562, 0.09798240661621094, 0.10257720947265625, 0.10717201232910156, 0.11176681518554688, 0.11636161804199219, 0.1209564208984375, 0.1255512237548828, 0.13014602661132812, 0.13474082946777344, 0.13933563232421875, 0.14393043518066406, 0.14852523803710938, 0.1531200408935547, 0.15771484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 9.0, 17.0, 28.0, 42.0, 61.0, 72.0, 119.0, 134.0, 119.0, 116.0, 102.0, 55.0, 33.0, 32.0, 24.0, 11.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9822492599487305, -1.9182709455490112, -1.854292631149292, -1.7903143167495728, -1.7263360023498535, -1.6623578071594238, -1.5983794927597046, -1.5344011783599854, -1.4704228639602661, -1.4064445495605469, -1.3424662351608276, -1.2784879207611084, -1.2145097255706787, -1.15053129196167, -1.0865530967712402, -1.022574782371521, -0.9585964679718018, -0.8946181535720825, -0.8306398391723633, -0.7666615843772888, -0.7026832699775696, -0.6387049555778503, -0.5747267007827759, -0.5107483863830566, -0.4467700719833374, -0.38279175758361816, -0.3188134729862213, -0.25483518838882446, -0.19085687398910522, -0.126878559589386, -0.06290027499198914, 0.0010780096054077148, 0.06505608558654785, 0.1290343850851059, 0.19301268458366394, 0.2569909691810608, 0.32096928358078003, 0.38494759798049927, 0.4489258825778961, 0.512904167175293, 0.5768824815750122, 0.6408607959747314, 0.7048391103744507, 0.7688173651695251, 0.8327956795692444, 0.8967739939689636, 0.9607522487640381, 1.0247305631637573, 1.0887088775634766, 1.1526871919631958, 1.216665506362915, 1.2806438207626343, 1.3446221351623535, 1.4086003303527832, 1.4725786447525024, 1.5365569591522217, 1.600535273551941, 1.6645135879516602, 1.7284919023513794, 1.7924702167510986, 1.8564484119415283, 1.920426845550537, 1.9844050407409668, 2.0483832359313965, 2.1123616695404053]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 9.0, 18.0, 20.0, 16.0, 16.0, 20.0, 32.0, 35.0, 21.0, 35.0, 46.0, 47.0, 50.0, 50.0, 59.0, 57.0, 39.0, 56.0, 55.0, 32.0, 35.0, 35.0, 34.0, 23.0, 28.0, 27.0, 23.0, 13.0, 17.0, 12.0, 9.0, 8.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1759898662567139, -1.1387073993682861, -1.1014249324798584, -1.0641424655914307, -1.026859998703003, -0.98957759141922, -0.952295184135437, -0.9150127172470093, -0.8777302503585815, -0.8404477834701538, -0.8031653165817261, -0.7658829092979431, -0.7286004424095154, -0.6913179755210876, -0.6540355682373047, -0.616753101348877, -0.5794706344604492, -0.5421881675720215, -0.5049057006835938, -0.4676232933998108, -0.43034082651138306, -0.3930583596229553, -0.35577592253685, -0.31849348545074463, -0.2812110185623169, -0.24392856657505035, -0.2066461145877838, -0.16936366260051727, -0.13208121061325073, -0.09479875862598419, -0.05751630663871765, -0.020233869552612305, 0.01704871654510498, 0.05433116853237152, 0.09161362051963806, 0.1288960725069046, 0.16617852449417114, 0.20346097648143768, 0.24074342846870422, 0.27802586555480957, 0.3153083324432373, 0.35259079933166504, 0.3898732364177704, 0.42715567350387573, 0.46443814039230347, 0.5017206072807312, 0.5390030145645142, 0.5762854814529419, 0.6135679483413696, 0.6508504152297974, 0.6881328821182251, 0.7254152894020081, 0.7626977562904358, 0.7999802231788635, 0.8372626304626465, 0.8745450973510742, 0.911827564239502, 0.9491100311279297, 0.9863924980163574, 1.0236749649047852, 1.060957431793213, 1.098239779472351, 1.1355222463607788, 1.1728047132492065, 1.2100871801376343]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 7.0, 13.0, 16.0, 18.0, 28.0, 52.0, 77.0, 124.0, 202.0, 384.0, 726.0, 1361.0, 2875.0, 6326.0, 14451.0, 32629.0, 79518.0, 277237.0, 427895.0, 122237.0, 45929.0, 19843.0, 8807.0, 3956.0, 1862.0, 870.0, 451.0, 244.0, 139.0, 83.0, 73.0, 32.0, 25.0, 21.0, 15.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.79833984375, -0.77099609375, -0.74365234375, -0.71630859375, -0.68896484375, -0.66162109375, -0.63427734375, -0.60693359375, -0.57958984375, -0.55224609375, -0.52490234375, -0.49755859375, -0.47021484375, -0.44287109375, -0.41552734375, -0.38818359375, -0.36083984375, -0.33349609375, -0.30615234375, -0.27880859375, -0.25146484375, -0.22412109375, -0.19677734375, -0.16943359375, -0.14208984375, -0.11474609375, -0.08740234375, -0.06005859375, -0.03271484375, -0.00537109375, 0.02197265625, 0.04931640625, 0.07666015625, 0.10400390625, 0.13134765625, 0.15869140625, 0.18603515625, 0.21337890625, 0.24072265625, 0.26806640625, 0.29541015625, 0.32275390625, 0.35009765625, 0.37744140625, 0.40478515625, 0.43212890625, 0.45947265625, 0.48681640625, 0.51416015625, 0.54150390625, 0.56884765625, 0.59619140625, 0.62353515625, 0.65087890625, 0.67822265625, 0.70556640625, 0.73291015625, 0.76025390625, 0.78759765625, 0.81494140625, 0.84228515625, 0.86962890625, 0.89697265625, 0.92431640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 9.0, 7.0, 13.0, 15.0, 17.0, 24.0, 22.0, 22.0, 24.0, 25.0, 19.0, 28.0, 36.0, 39.0, 44.0, 42.0, 47.0, 39.0, 32.0, 34.0, 39.0, 36.0, 46.0, 42.0, 27.0, 32.0, 25.0, 31.0, 25.0, 17.0, 21.0, 25.0, 16.0, 9.0, 12.0, 10.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.306640625, -3.200286865234375, -3.09393310546875, -2.987579345703125, -2.8812255859375, -2.774871826171875, -2.66851806640625, -2.562164306640625, -2.455810546875, -2.349456787109375, -2.24310302734375, -2.136749267578125, -2.0303955078125, -1.924041748046875, -1.81768798828125, -1.711334228515625, -1.60498046875, -1.498626708984375, -1.39227294921875, -1.285919189453125, -1.1795654296875, -1.073211669921875, -0.96685791015625, -0.860504150390625, -0.754150390625, -0.647796630859375, -0.54144287109375, -0.435089111328125, -0.3287353515625, -0.222381591796875, -0.11602783203125, -0.009674072265625, 0.0966796875, 0.203033447265625, 0.30938720703125, 0.415740966796875, 0.5220947265625, 0.628448486328125, 0.73480224609375, 0.841156005859375, 0.947509765625, 1.053863525390625, 1.16021728515625, 1.266571044921875, 1.3729248046875, 1.479278564453125, 1.58563232421875, 1.691986083984375, 1.79833984375, 1.904693603515625, 2.01104736328125, 2.117401123046875, 2.2237548828125, 2.330108642578125, 2.43646240234375, 2.542816162109375, 2.649169921875, 2.755523681640625, 2.86187744140625, 2.968231201171875, 3.0745849609375, 3.180938720703125, 3.28729248046875, 3.393646240234375, 3.5]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 9.0, 10.0, 7.0, 16.0, 16.0, 26.0, 36.0, 48.0, 52.0, 61.0, 86.0, 193.0, 773.0, 1040413.0, 6058.0, 279.0, 129.0, 89.0, 77.0, 51.0, 34.0, 24.0, 16.0, 15.0, 10.0, 8.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.2830810546875, -17.784912109375, -17.2867431640625, -16.78857421875, -16.2904052734375, -15.792236328125, -15.2940673828125, -14.7958984375, -14.2977294921875, -13.799560546875, -13.3013916015625, -12.80322265625, -12.3050537109375, -11.806884765625, -11.3087158203125, -10.810546875, -10.3123779296875, -9.814208984375, -9.3160400390625, -8.81787109375, -8.3197021484375, -7.821533203125, -7.3233642578125, -6.8251953125, -6.3270263671875, -5.828857421875, -5.3306884765625, -4.83251953125, -4.3343505859375, -3.836181640625, -3.3380126953125, -2.83984375, -2.3416748046875, -1.843505859375, -1.3453369140625, -0.84716796875, -0.3489990234375, 0.149169921875, 0.6473388671875, 1.1455078125, 1.6436767578125, 2.141845703125, 2.6400146484375, 3.13818359375, 3.6363525390625, 4.134521484375, 4.6326904296875, 5.130859375, 5.6290283203125, 6.127197265625, 6.6253662109375, 7.12353515625, 7.6217041015625, 8.119873046875, 8.6180419921875, 9.1162109375, 9.6143798828125, 10.112548828125, 10.6107177734375, 11.10888671875, 11.6070556640625, 12.105224609375, 12.6033935546875, 13.1015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 10.0, 8.0, 7.0, 18.0, 15.0, 23.0, 34.0, 33.0, 44.0, 50.0, 53.0, 63.0, 61.0, 93.0, 68.0, 69.0, 69.0, 56.0, 58.0, 48.0, 30.0, 22.0, 16.0, 17.0, 10.0, 7.0, 10.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51953125, -7.32012939453125, -7.1207275390625, -6.92132568359375, -6.721923828125, -6.52252197265625, -6.3231201171875, -6.12371826171875, -5.92431640625, -5.72491455078125, -5.5255126953125, -5.32611083984375, -5.126708984375, -4.92730712890625, -4.7279052734375, -4.52850341796875, -4.3291015625, -4.12969970703125, -3.9302978515625, -3.73089599609375, -3.531494140625, -3.33209228515625, -3.1326904296875, -2.93328857421875, -2.73388671875, -2.53448486328125, -2.3350830078125, -2.13568115234375, -1.936279296875, -1.73687744140625, -1.5374755859375, -1.33807373046875, -1.138671875, -0.93927001953125, -0.7398681640625, -0.54046630859375, -0.341064453125, -0.14166259765625, 0.0577392578125, 0.25714111328125, 0.45654296875, 0.65594482421875, 0.8553466796875, 1.05474853515625, 1.254150390625, 1.45355224609375, 1.6529541015625, 1.85235595703125, 2.0517578125, 2.25115966796875, 2.4505615234375, 2.64996337890625, 2.849365234375, 3.04876708984375, 3.2481689453125, 3.44757080078125, 3.64697265625, 3.84637451171875, 4.0457763671875, 4.24517822265625, 4.444580078125, 4.64398193359375, 4.8433837890625, 5.04278564453125, 5.2421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 23.0, 38.0, 40.0, 89.0, 129.0, 313.0, 1367.0, 11140.0, 504673.0, 516947.0, 11554.0, 1458.0, 349.0, 115.0, 60.0, 47.0, 37.0, 28.0, 18.0, 12.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0424041748046875, -1.007659912109375, -0.9729156494140625, -0.93817138671875, -0.9034271240234375, -0.868682861328125, -0.8339385986328125, -0.7991943359375, -0.7644500732421875, -0.729705810546875, -0.6949615478515625, -0.66021728515625, -0.6254730224609375, -0.590728759765625, -0.5559844970703125, -0.521240234375, -0.4864959716796875, -0.451751708984375, -0.4170074462890625, -0.38226318359375, -0.3475189208984375, -0.312774658203125, -0.2780303955078125, -0.2432861328125, -0.2085418701171875, -0.173797607421875, -0.1390533447265625, -0.10430908203125, -0.0695648193359375, -0.034820556640625, -7.62939453125e-05, 0.03466796875, 0.0694122314453125, 0.104156494140625, 0.1389007568359375, 0.17364501953125, 0.2083892822265625, 0.243133544921875, 0.2778778076171875, 0.3126220703125, 0.3473663330078125, 0.382110595703125, 0.4168548583984375, 0.45159912109375, 0.4863433837890625, 0.521087646484375, 0.5558319091796875, 0.590576171875, 0.6253204345703125, 0.660064697265625, 0.6948089599609375, 0.72955322265625, 0.7642974853515625, 0.799041748046875, 0.8337860107421875, 0.8685302734375, 0.9032745361328125, 0.938018798828125, 0.9727630615234375, 1.00750732421875, 1.0422515869140625, 1.076995849609375, 1.1117401123046875, 1.146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 16.0, 14.0, 29.0, 37.0, 73.0, 81.0, 141.0, 186.0, 143.0, 78.0, 41.0, 38.0, 32.0, 19.0, 17.0, 6.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921457290649414e-05, -7.621478289365768e-05, -7.321499288082123e-05, -7.021520286798477e-05, -6.721541285514832e-05, -6.421562284231186e-05, -6.12158328294754e-05, -5.8216042816638947e-05, -5.521625280380249e-05, -5.2216462790966034e-05, -4.921667277812958e-05, -4.621688276529312e-05, -4.3217092752456665e-05, -4.021730273962021e-05, -3.721751272678375e-05, -3.4217722713947296e-05, -3.121793270111084e-05, -2.8218142688274384e-05, -2.5218352675437927e-05, -2.221856266260147e-05, -1.9218772649765015e-05, -1.621898263692856e-05, -1.3219192624092102e-05, -1.0219402611255646e-05, -7.2196125984191895e-06, -4.219822585582733e-06, -1.2200325727462769e-06, 1.7797574400901794e-06, 4.779547452926636e-06, 7.779337465763092e-06, 1.0779127478599548e-05, 1.3778917491436005e-05, 1.677870750427246e-05, 1.9778497517108917e-05, 2.2778287529945374e-05, 2.577807754278183e-05, 2.8777867555618286e-05, 3.177765756845474e-05, 3.47774475812912e-05, 3.7777237594127655e-05, 4.077702760696411e-05, 4.377681761980057e-05, 4.6776607632637024e-05, 4.977639764547348e-05, 5.2776187658309937e-05, 5.577597767114639e-05, 5.877576768398285e-05, 6.17755576968193e-05, 6.477534770965576e-05, 6.777513772249222e-05, 7.077492773532867e-05, 7.377471774816513e-05, 7.677450776100159e-05, 7.977429777383804e-05, 8.27740877866745e-05, 8.577387779951096e-05, 8.877366781234741e-05, 9.177345782518387e-05, 9.477324783802032e-05, 9.777303785085678e-05, 0.00010077282786369324, 0.0001037726178765297, 0.00010677240788936615, 0.0001097721979022026, 0.00011277198791503906]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 12.0, 10.0, 13.0, 18.0, 24.0, 31.0, 46.0, 93.0, 167.0, 445.0, 1883.0, 15786.0, 702911.0, 314505.0, 10332.0, 1509.0, 375.0, 150.0, 74.0, 44.0, 28.0, 18.0, 12.0, 5.0, 9.0, 5.0, 8.0, 3.0, 9.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.22265625, -1.1886138916015625, -1.154571533203125, -1.1205291748046875, -1.08648681640625, -1.0524444580078125, -1.018402099609375, -0.9843597412109375, -0.9503173828125, -0.9162750244140625, -0.882232666015625, -0.8481903076171875, -0.81414794921875, -0.7801055908203125, -0.746063232421875, -0.7120208740234375, -0.677978515625, -0.6439361572265625, -0.609893798828125, -0.5758514404296875, -0.54180908203125, -0.5077667236328125, -0.473724365234375, -0.4396820068359375, -0.4056396484375, -0.3715972900390625, -0.337554931640625, -0.3035125732421875, -0.26947021484375, -0.2354278564453125, -0.201385498046875, -0.1673431396484375, -0.13330078125, -0.0992584228515625, -0.065216064453125, -0.0311737060546875, 0.00286865234375, 0.0369110107421875, 0.070953369140625, 0.1049957275390625, 0.1390380859375, 0.1730804443359375, 0.207122802734375, 0.2411651611328125, 0.27520751953125, 0.3092498779296875, 0.343292236328125, 0.3773345947265625, 0.411376953125, 0.4454193115234375, 0.479461669921875, 0.5135040283203125, 0.54754638671875, 0.5815887451171875, 0.615631103515625, 0.6496734619140625, 0.6837158203125, 0.7177581787109375, 0.751800537109375, 0.7858428955078125, 0.81988525390625, 0.8539276123046875, 0.887969970703125, 0.9220123291015625, 0.9560546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 8.0, 4.0, 5.0, 1.0, 9.0, 7.0, 11.0, 14.0, 19.0, 35.0, 37.0, 57.0, 67.0, 75.0, 110.0, 116.0, 96.0, 65.0, 45.0, 56.0, 34.0, 19.0, 27.0, 17.0, 8.0, 4.0, 5.0, 5.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.161865234375, -0.1571216583251953, -0.15237808227539062, -0.14763450622558594, -0.14289093017578125, -0.13814735412597656, -0.13340377807617188, -0.1286602020263672, -0.1239166259765625, -0.11917304992675781, -0.11442947387695312, -0.10968589782714844, -0.10494232177734375, -0.10019874572753906, -0.09545516967773438, -0.09071159362792969, -0.085968017578125, -0.08122444152832031, -0.07648086547851562, -0.07173728942871094, -0.06699371337890625, -0.06225013732910156, -0.057506561279296875, -0.05276298522949219, -0.0480194091796875, -0.04327583312988281, -0.038532257080078125, -0.03378868103027344, -0.02904510498046875, -0.024301528930664062, -0.019557952880859375, -0.014814376831054688, -0.01007080078125, -0.0053272247314453125, -0.000583648681640625, 0.0041599273681640625, 0.00890350341796875, 0.013647079467773438, 0.018390655517578125, 0.023134231567382812, 0.0278778076171875, 0.03262138366699219, 0.037364959716796875, 0.04210853576660156, 0.04685211181640625, 0.05159568786621094, 0.056339263916015625, 0.06108283996582031, 0.065826416015625, 0.07056999206542969, 0.07531356811523438, 0.08005714416503906, 0.08480072021484375, 0.08954429626464844, 0.09428787231445312, 0.09903144836425781, 0.1037750244140625, 0.10851860046386719, 0.11326217651367188, 0.11800575256347656, 0.12274932861328125, 0.12749290466308594, 0.13223648071289062, 0.1369800567626953, 0.1417236328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 30.0, 113.0, 322.0, 341.0, 141.0, 43.0, 13.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.34256935119629, -19.966489791870117, -19.590410232543945, -19.214330673217773, -18.8382511138916, -18.462173461914062, -18.08609390258789, -17.71001434326172, -17.333934783935547, -16.957855224609375, -16.581775665283203, -16.20569610595703, -15.829617500305176, -15.453537940979004, -15.077458381652832, -14.70137882232666, -14.325299263000488, -13.949219703674316, -13.573140144348145, -13.197061538696289, -12.820981979370117, -12.444902420043945, -12.068822860717773, -11.692743301391602, -11.31666374206543, -10.940584182739258, -10.564504623413086, -10.188425064086914, -9.812346458435059, -9.436266899108887, -9.060187339782715, -8.684107780456543, -8.308029174804688, -7.931949615478516, -7.555870532989502, -7.17979097366333, -6.803711891174316, -6.4276323318481445, -6.051552772521973, -5.675473213195801, -5.299394607543945, -4.923315048217773, -4.54723596572876, -4.171156406402588, -3.795077085494995, -3.4189977645874023, -3.0429182052612305, -2.6668388843536377, -2.290759325027466, -1.914680004119873, -1.5386005640029907, -1.1625211238861084, -0.7864418029785156, -0.41036248207092285, -0.03428292274475098, 0.3417963981628418, 0.7178757190704346, 1.0939550399780273, 1.4700344800949097, 1.846113920211792, 2.2221932411193848, 2.5982725620269775, 2.9743521213531494, 3.350431442260742, 3.726510763168335]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 9.0, 11.0, 6.0, 12.0, 12.0, 19.0, 16.0, 16.0, 17.0, 21.0, 28.0, 33.0, 29.0, 41.0, 44.0, 32.0, 36.0, 44.0, 26.0, 44.0, 56.0, 40.0, 43.0, 35.0, 42.0, 39.0, 30.0, 22.0, 30.0, 22.0, 23.0, 17.0, 23.0, 13.0, 11.0, 4.0, 9.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.362370491027832, -5.197085857391357, -5.031801223754883, -4.86651611328125, -4.701231479644775, -4.535946846008301, -4.370662212371826, -4.205377578735352, -4.040092468261719, -3.874807834625244, -3.7095229625701904, -3.544238328933716, -3.378953456878662, -3.2136688232421875, -3.048384189605713, -2.8830995559692383, -2.7178149223327637, -2.552530288696289, -2.3872454166412354, -2.2219607830047607, -2.056675910949707, -1.8913912773132324, -1.7261066436767578, -1.5608218908309937, -1.3955371379852295, -1.2302523851394653, -1.0649676322937012, -0.8996829986572266, -0.7343982458114624, -0.5691134929656982, -0.40382879972457886, -0.23854410648345947, -0.07325983047485352, 0.09202489256858826, 0.25730961561203003, 0.4225943386554718, 0.5878790616989136, 0.7531638145446777, 0.9184485077857971, 1.0837332010269165, 1.2490179538726807, 1.4143027067184448, 1.579587459564209, 1.7448720932006836, 1.9101568460464478, 2.075441598892212, 2.2407262325286865, 2.4060111045837402, 2.571295738220215, 2.7365803718566895, 2.901865243911743, 3.0671498775482178, 3.2324347496032715, 3.397719383239746, 3.5630040168762207, 3.7282886505126953, 3.893573522567749, 4.058858394622803, 4.224143028259277, 4.389427661895752, 4.554712295532227, 4.719997406005859, 4.885282039642334, 5.050566673278809, 5.215851306915283]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 9.0, 11.0, 21.0, 12.0, 22.0, 26.0, 27.0, 33.0, 34.0, 46.0, 85.0, 152.0, 309.0, 949.0, 4164.0, 29239.0, 485510.0, 2824249.0, 791599.0, 50141.0, 5556.0, 1206.0, 344.0, 160.0, 75.0, 44.0, 38.0, 22.0, 23.0, 20.0, 19.0, 10.0, 14.0, 8.0, 18.0, 13.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.119140625, -3.0234375, -2.927734375, -2.83203125, -2.736328125, -2.640625, -2.544921875, -2.44921875, -2.353515625, -2.2578125, -2.162109375, -2.06640625, -1.970703125, -1.875, -1.779296875, -1.68359375, -1.587890625, -1.4921875, -1.396484375, -1.30078125, -1.205078125, -1.109375, -1.013671875, -0.91796875, -0.822265625, -0.7265625, -0.630859375, -0.53515625, -0.439453125, -0.34375, -0.248046875, -0.15234375, -0.056640625, 0.0390625, 0.134765625, 0.23046875, 0.326171875, 0.421875, 0.517578125, 0.61328125, 0.708984375, 0.8046875, 0.900390625, 0.99609375, 1.091796875, 1.1875, 1.283203125, 1.37890625, 1.474609375, 1.5703125, 1.666015625, 1.76171875, 1.857421875, 1.953125, 2.048828125, 2.14453125, 2.240234375, 2.3359375, 2.431640625, 2.52734375, 2.623046875, 2.71875, 2.814453125, 2.91015625, 3.005859375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 6.0, 10.0, 14.0, 11.0, 20.0, 20.0, 24.0, 24.0, 29.0, 41.0, 46.0, 35.0, 44.0, 45.0, 57.0, 47.0, 40.0, 52.0, 50.0, 51.0, 28.0, 37.0, 37.0, 42.0, 31.0, 20.0, 26.0, 22.0, 14.0, 11.0, 15.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2531890869140625, -1.208526611328125, -1.1638641357421875, -1.11920166015625, -1.0745391845703125, -1.029876708984375, -0.9852142333984375, -0.9405517578125, -0.8958892822265625, -0.851226806640625, -0.8065643310546875, -0.76190185546875, -0.7172393798828125, -0.672576904296875, -0.6279144287109375, -0.583251953125, -0.5385894775390625, -0.493927001953125, -0.4492645263671875, -0.40460205078125, -0.3599395751953125, -0.315277099609375, -0.2706146240234375, -0.2259521484375, -0.1812896728515625, -0.136627197265625, -0.0919647216796875, -0.04730224609375, -0.0026397705078125, 0.042022705078125, 0.0866851806640625, 0.13134765625, 0.1760101318359375, 0.220672607421875, 0.2653350830078125, 0.30999755859375, 0.3546600341796875, 0.399322509765625, 0.4439849853515625, 0.4886474609375, 0.5333099365234375, 0.577972412109375, 0.6226348876953125, 0.66729736328125, 0.7119598388671875, 0.756622314453125, 0.8012847900390625, 0.845947265625, 0.8906097412109375, 0.935272216796875, 0.9799346923828125, 1.02459716796875, 1.0692596435546875, 1.113922119140625, 1.1585845947265625, 1.2032470703125, 1.2479095458984375, 1.292572021484375, 1.3372344970703125, 1.38189697265625, 1.4265594482421875, 1.471221923828125, 1.5158843994140625, 1.560546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 9.0, 10.0, 17.0, 23.0, 26.0, 55.0, 67.0, 118.0, 170.0, 277.0, 468.0, 1491.0, 179840.0, 4006209.0, 3962.0, 621.0, 329.0, 176.0, 108.0, 105.0, 60.0, 36.0, 24.0, 23.0, 17.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.46875, -11.1231689453125, -10.777587890625, -10.4320068359375, -10.08642578125, -9.7408447265625, -9.395263671875, -9.0496826171875, -8.7041015625, -8.3585205078125, -8.012939453125, -7.6673583984375, -7.32177734375, -6.9761962890625, -6.630615234375, -6.2850341796875, -5.939453125, -5.5938720703125, -5.248291015625, -4.9027099609375, -4.55712890625, -4.2115478515625, -3.865966796875, -3.5203857421875, -3.1748046875, -2.8292236328125, -2.483642578125, -2.1380615234375, -1.79248046875, -1.4468994140625, -1.101318359375, -0.7557373046875, -0.41015625, -0.0645751953125, 0.281005859375, 0.6265869140625, 0.97216796875, 1.3177490234375, 1.663330078125, 2.0089111328125, 2.3544921875, 2.7000732421875, 3.045654296875, 3.3912353515625, 3.73681640625, 4.0823974609375, 4.427978515625, 4.7735595703125, 5.119140625, 5.4647216796875, 5.810302734375, 6.1558837890625, 6.50146484375, 6.8470458984375, 7.192626953125, 7.5382080078125, 7.8837890625, 8.2293701171875, 8.574951171875, 8.9205322265625, 9.26611328125, 9.6116943359375, 9.957275390625, 10.3028564453125, 10.6484375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 15.0, 16.0, 27.0, 34.0, 40.0, 55.0, 75.0, 93.0, 132.0, 243.0, 286.0, 403.0, 475.0, 498.0, 408.0, 341.0, 251.0, 194.0, 123.0, 78.0, 50.0, 56.0, 36.0, 19.0, 21.0, 25.0, 13.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.69091796875, -0.6723518371582031, -0.6537857055664062, -0.6352195739746094, -0.6166534423828125, -0.5980873107910156, -0.5795211791992188, -0.5609550476074219, -0.542388916015625, -0.5238227844238281, -0.5052566528320312, -0.4866905212402344, -0.4681243896484375, -0.4495582580566406, -0.43099212646484375, -0.4124259948730469, -0.39385986328125, -0.3752937316894531, -0.35672760009765625, -0.3381614685058594, -0.3195953369140625, -0.3010292053222656, -0.28246307373046875, -0.2638969421386719, -0.245330810546875, -0.22676467895507812, -0.20819854736328125, -0.18963241577148438, -0.1710662841796875, -0.15250015258789062, -0.13393402099609375, -0.11536788940429688, -0.0968017578125, -0.07823562622070312, -0.05966949462890625, -0.041103363037109375, -0.0225372314453125, -0.003971099853515625, 0.01459503173828125, 0.033161163330078125, 0.051727294921875, 0.07029342651367188, 0.08885955810546875, 0.10742568969726562, 0.1259918212890625, 0.14455795288085938, 0.16312408447265625, 0.18169021606445312, 0.20025634765625, 0.21882247924804688, 0.23738861083984375, 0.2559547424316406, 0.2745208740234375, 0.2930870056152344, 0.31165313720703125, 0.3302192687988281, 0.348785400390625, 0.3673515319824219, 0.38591766357421875, 0.4044837951660156, 0.4230499267578125, 0.4416160583496094, 0.46018218994140625, 0.4787483215332031, 0.497314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 8.0, 6.0, 17.0, 32.0, 48.0, 96.0, 108.0, 109.0, 147.0, 128.0, 94.0, 77.0, 47.0, 37.0, 23.0, 11.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.035017967224121, -3.9271116256713867, -3.8192055225372314, -3.711299419403076, -3.603393077850342, -3.4954867362976074, -3.387580633163452, -3.279674530029297, -3.1717681884765625, -3.063861846923828, -2.955955743789673, -2.8480496406555176, -2.740143299102783, -2.632236957550049, -2.5243308544158936, -2.4164247512817383, -2.308518409729004, -2.2006120681762695, -2.0927059650421143, -1.9847997426986694, -1.8768935203552246, -1.7689872980117798, -1.661081075668335, -1.5531748533248901, -1.4452686309814453, -1.3373624086380005, -1.2294561862945557, -1.1215499639511108, -1.013643741607666, -0.9057375192642212, -0.7978312969207764, -0.6899250745773315, -0.5820190906524658, -0.474112868309021, -0.36620664596557617, -0.25830042362213135, -0.15039420127868652, -0.0424879789352417, 0.06541824340820312, 0.17332446575164795, 0.2812306880950928, 0.3891369104385376, 0.4970431327819824, 0.6049493551254272, 0.7128555774688721, 0.8207617998123169, 0.9286680221557617, 1.0365742444992065, 1.1444804668426514, 1.2523866891860962, 1.360292911529541, 1.4681991338729858, 1.5761053562164307, 1.6840115785598755, 1.7919178009033203, 1.8998240232467651, 2.00773024559021, 2.1156363487243652, 2.2235426902770996, 2.331449031829834, 2.4393551349639893, 2.5472612380981445, 2.655167579650879, 2.7630739212036133, 2.8709800243377686]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 9.0, 4.0, 12.0, 16.0, 7.0, 17.0, 20.0, 14.0, 20.0, 27.0, 31.0, 34.0, 40.0, 40.0, 34.0, 55.0, 46.0, 36.0, 47.0, 39.0, 31.0, 43.0, 35.0, 37.0, 31.0, 41.0, 29.0, 26.0, 26.0, 26.0, 19.0, 13.0, 16.0, 15.0, 10.0, 9.0, 5.0, 6.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-1.569925308227539, -1.5279452800750732, -1.485965371131897, -1.4439853429794312, -1.4020054340362549, -1.360025405883789, -1.3180453777313232, -1.2760653495788574, -1.2340854406356812, -1.1921054124832153, -1.150125503540039, -1.1081454753875732, -1.0661654472351074, -1.0241855382919312, -0.9822055101394653, -0.9402255415916443, -0.8982455730438232, -0.8562656044960022, -0.8142856359481812, -0.7723056077957153, -0.7303256392478943, -0.6883456707000732, -0.6463656425476074, -0.6043856739997864, -0.5624057054519653, -0.5204257369041443, -0.47844573855400085, -0.4364657402038574, -0.3944857716560364, -0.35250580310821533, -0.3105258047580719, -0.26854580640792847, -0.22656595706939697, -0.18458597362041473, -0.1426059901714325, -0.10062600672245026, -0.05864602327346802, -0.01666603982448578, 0.02531394362449646, 0.06729394197463989, 0.10927391052246094, 0.15125389397144318, 0.19323387742042542, 0.23521386086940765, 0.2771938443183899, 0.31917381286621094, 0.36115381121635437, 0.4031338095664978, 0.44511377811431885, 0.4870937466621399, 0.5290737152099609, 0.5710537433624268, 0.6130337119102478, 0.6550136804580688, 0.6969937086105347, 0.7389736771583557, 0.7809536457061768, 0.8229336142539978, 0.8649135828018188, 0.9068936109542847, 0.9488735795021057, 0.9908535480499268, 1.0328335762023926, 1.0748136043548584, 1.1167935132980347]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 19.0, 13.0, 31.0, 37.0, 65.0, 86.0, 168.0, 269.0, 563.0, 1151.0, 2755.0, 7836.0, 24588.0, 80604.0, 242409.0, 381412.0, 207698.0, 67246.0, 20421.0, 6598.0, 2449.0, 1024.0, 430.0, 250.0, 161.0, 77.0, 50.0, 33.0, 32.0, 18.0, 10.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7861328125, -0.7639389038085938, -0.7417449951171875, -0.7195510864257812, -0.697357177734375, -0.6751632690429688, -0.6529693603515625, -0.6307754516601562, -0.60858154296875, -0.5863876342773438, -0.5641937255859375, -0.5419998168945312, -0.519805908203125, -0.49761199951171875, -0.4754180908203125, -0.45322418212890625, -0.4310302734375, -0.40883636474609375, -0.3866424560546875, -0.36444854736328125, -0.342254638671875, -0.32006072998046875, -0.2978668212890625, -0.27567291259765625, -0.25347900390625, -0.23128509521484375, -0.2090911865234375, -0.18689727783203125, -0.164703369140625, -0.14250946044921875, -0.1203155517578125, -0.09812164306640625, -0.075927734375, -0.05373382568359375, -0.0315399169921875, -0.00934600830078125, 0.012847900390625, 0.03504180908203125, 0.0572357177734375, 0.07942962646484375, 0.10162353515625, 0.12381744384765625, 0.1460113525390625, 0.16820526123046875, 0.190399169921875, 0.21259307861328125, 0.2347869873046875, 0.25698089599609375, 0.2791748046875, 0.30136871337890625, 0.3235626220703125, 0.34575653076171875, 0.367950439453125, 0.39014434814453125, 0.4123382568359375, 0.43453216552734375, 0.45672607421875, 0.47891998291015625, 0.5011138916015625, 0.5233078002929688, 0.545501708984375, 0.5676956176757812, 0.5898895263671875, 0.6120834350585938, 0.63427734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 5.0, 8.0, 7.0, 14.0, 17.0, 21.0, 14.0, 21.0, 26.0, 33.0, 47.0, 41.0, 47.0, 56.0, 63.0, 38.0, 41.0, 54.0, 44.0, 42.0, 35.0, 43.0, 41.0, 36.0, 30.0, 26.0, 27.0, 19.0, 18.0, 17.0, 12.0, 11.0, 11.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.013671875, -0.9859085083007812, -0.9581451416015625, -0.9303817749023438, -0.902618408203125, -0.8748550415039062, -0.8470916748046875, -0.8193283081054688, -0.79156494140625, -0.7638015747070312, -0.7360382080078125, -0.7082748413085938, -0.680511474609375, -0.6527481079101562, -0.6249847412109375, -0.5972213745117188, -0.5694580078125, -0.5416946411132812, -0.5139312744140625, -0.48616790771484375, -0.458404541015625, -0.43064117431640625, -0.4028778076171875, -0.37511444091796875, -0.34735107421875, -0.31958770751953125, -0.2918243408203125, -0.26406097412109375, -0.236297607421875, -0.20853424072265625, -0.1807708740234375, -0.15300750732421875, -0.125244140625, -0.09748077392578125, -0.0697174072265625, -0.04195404052734375, -0.014190673828125, 0.01357269287109375, 0.0413360595703125, 0.06909942626953125, 0.09686279296875, 0.12462615966796875, 0.1523895263671875, 0.18015289306640625, 0.207916259765625, 0.23567962646484375, 0.2634429931640625, 0.29120635986328125, 0.3189697265625, 0.34673309326171875, 0.3744964599609375, 0.40225982666015625, 0.430023193359375, 0.45778656005859375, 0.4855499267578125, 0.5133132934570312, 0.54107666015625, 0.5688400268554688, 0.5966033935546875, 0.6243667602539062, 0.652130126953125, 0.6798934936523438, 0.7076568603515625, 0.7354202270507812, 0.76318359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 13.0, 15.0, 14.0, 29.0, 31.0, 52.0, 72.0, 96.0, 173.0, 265.0, 460.0, 1003.0, 2153.0, 5183.0, 14365.0, 43989.0, 138464.0, 319191.0, 318180.0, 137338.0, 43961.0, 14123.0, 4998.0, 2134.0, 984.0, 477.0, 275.0, 167.0, 115.0, 78.0, 48.0, 27.0, 25.0, 15.0, 10.0, 7.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.7490234375, -0.72930908203125, -0.7095947265625, -0.68988037109375, -0.670166015625, -0.65045166015625, -0.6307373046875, -0.61102294921875, -0.59130859375, -0.57159423828125, -0.5518798828125, -0.53216552734375, -0.512451171875, -0.49273681640625, -0.4730224609375, -0.45330810546875, -0.43359375, -0.41387939453125, -0.3941650390625, -0.37445068359375, -0.354736328125, -0.33502197265625, -0.3153076171875, -0.29559326171875, -0.27587890625, -0.25616455078125, -0.2364501953125, -0.21673583984375, -0.197021484375, -0.17730712890625, -0.1575927734375, -0.13787841796875, -0.1181640625, -0.09844970703125, -0.0787353515625, -0.05902099609375, -0.039306640625, -0.01959228515625, 0.0001220703125, 0.01983642578125, 0.03955078125, 0.05926513671875, 0.0789794921875, 0.09869384765625, 0.118408203125, 0.13812255859375, 0.1578369140625, 0.17755126953125, 0.197265625, 0.21697998046875, 0.2366943359375, 0.25640869140625, 0.276123046875, 0.29583740234375, 0.3155517578125, 0.33526611328125, 0.35498046875, 0.37469482421875, 0.3944091796875, 0.41412353515625, 0.433837890625, 0.45355224609375, 0.4732666015625, 0.49298095703125, 0.5126953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 8.0, 8.0, 21.0, 25.0, 41.0, 28.0, 55.0, 37.0, 49.0, 62.0, 81.0, 52.0, 72.0, 79.0, 69.0, 68.0, 46.0, 38.0, 31.0, 30.0, 21.0, 23.0, 7.0, 14.0, 9.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8480682373046875, -1.777191162109375, -1.7063140869140625, -1.63543701171875, -1.5645599365234375, -1.493682861328125, -1.4228057861328125, -1.3519287109375, -1.2810516357421875, -1.210174560546875, -1.1392974853515625, -1.06842041015625, -0.9975433349609375, -0.926666259765625, -0.8557891845703125, -0.784912109375, -0.7140350341796875, -0.643157958984375, -0.5722808837890625, -0.50140380859375, -0.4305267333984375, -0.359649658203125, -0.2887725830078125, -0.2178955078125, -0.1470184326171875, -0.076141357421875, -0.0052642822265625, 0.06561279296875, 0.1364898681640625, 0.207366943359375, 0.2782440185546875, 0.34912109375, 0.4199981689453125, 0.490875244140625, 0.5617523193359375, 0.63262939453125, 0.7035064697265625, 0.774383544921875, 0.8452606201171875, 0.9161376953125, 0.9870147705078125, 1.057891845703125, 1.1287689208984375, 1.19964599609375, 1.2705230712890625, 1.341400146484375, 1.4122772216796875, 1.483154296875, 1.5540313720703125, 1.624908447265625, 1.6957855224609375, 1.76666259765625, 1.8375396728515625, 1.908416748046875, 1.9792938232421875, 2.0501708984375, 2.1210479736328125, 2.191925048828125, 2.2628021240234375, 2.33367919921875, 2.4045562744140625, 2.475433349609375, 2.5463104248046875, 2.6171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 3.0, 10.0, 14.0, 20.0, 32.0, 38.0, 60.0, 77.0, 129.0, 174.0, 281.0, 542.0, 907.0, 1872.0, 3705.0, 8324.0, 20843.0, 64162.0, 215219.0, 414478.0, 216262.0, 64113.0, 21084.0, 8274.0, 3734.0, 1845.0, 974.0, 526.0, 286.0, 188.0, 108.0, 87.0, 63.0, 31.0, 25.0, 17.0, 13.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2337646484375, -0.22657203674316406, -0.21937942504882812, -0.2121868133544922, -0.20499420166015625, -0.1978015899658203, -0.19060897827148438, -0.18341636657714844, -0.1762237548828125, -0.16903114318847656, -0.16183853149414062, -0.1546459197998047, -0.14745330810546875, -0.1402606964111328, -0.13306808471679688, -0.12587547302246094, -0.118682861328125, -0.11149024963378906, -0.10429763793945312, -0.09710502624511719, -0.08991241455078125, -0.08271980285644531, -0.07552719116210938, -0.06833457946777344, -0.0611419677734375, -0.05394935607910156, -0.046756744384765625, -0.03956413269042969, -0.03237152099609375, -0.025178909301757812, -0.017986297607421875, -0.010793685913085938, -0.00360107421875, 0.0035915374755859375, 0.010784149169921875, 0.017976760864257812, 0.02516937255859375, 0.03236198425292969, 0.039554595947265625, 0.04674720764160156, 0.0539398193359375, 0.06113243103027344, 0.06832504272460938, 0.07551765441894531, 0.08271026611328125, 0.08990287780761719, 0.09709548950195312, 0.10428810119628906, 0.111480712890625, 0.11867332458496094, 0.12586593627929688, 0.1330585479736328, 0.14025115966796875, 0.1474437713623047, 0.15463638305664062, 0.16182899475097656, 0.1690216064453125, 0.17621421813964844, 0.18340682983398438, 0.1905994415283203, 0.19779205322265625, 0.2049846649169922, 0.21217727661132812, 0.21936988830566406, 0.2265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 15.0, 24.0, 31.0, 87.0, 74.0, 107.0, 135.0, 121.0, 133.0, 94.0, 67.0, 28.0, 22.0, 14.0, 12.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002570152282714844, -0.00025132112205028534, -0.0002456270158290863, -0.00023993290960788727, -0.00023423880338668823, -0.0002285446971654892, -0.00022285059094429016, -0.00021715648472309113, -0.0002114623785018921, -0.00020576827228069305, -0.00020007416605949402, -0.00019438005983829498, -0.00018868595361709595, -0.0001829918473958969, -0.00017729774117469788, -0.00017160363495349884, -0.0001659095287322998, -0.00016021542251110077, -0.00015452131628990173, -0.0001488272100687027, -0.00014313310384750366, -0.00013743899762630463, -0.0001317448914051056, -0.00012605078518390656, -0.00012035667896270752, -0.00011466257274150848, -0.00010896846652030945, -0.00010327436029911041, -9.758025407791138e-05, -9.188614785671234e-05, -8.61920416355133e-05, -8.049793541431427e-05, -7.480382919311523e-05, -6.91097229719162e-05, -6.341561675071716e-05, -5.772151052951813e-05, -5.202740430831909e-05, -4.6333298087120056e-05, -4.063919186592102e-05, -3.4945085644721985e-05, -2.925097942352295e-05, -2.3556873202323914e-05, -1.7862766981124878e-05, -1.2168660759925842e-05, -6.474554538726807e-06, -7.80448317527771e-07, 4.913657903671265e-06, 1.06077641248703e-05, 1.6301870346069336e-05, 2.199597656726837e-05, 2.7690082788467407e-05, 3.338418900966644e-05, 3.907829523086548e-05, 4.4772401452064514e-05, 5.046650767326355e-05, 5.6160613894462585e-05, 6.185472011566162e-05, 6.754882633686066e-05, 7.324293255805969e-05, 7.893703877925873e-05, 8.463114500045776e-05, 9.03252512216568e-05, 9.601935744285583e-05, 0.00010171346366405487, 0.0001074075698852539]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 1.0, 6.0, 1.0, 6.0, 9.0, 22.0, 28.0, 30.0, 37.0, 65.0, 125.0, 184.0, 393.0, 990.0, 3313.0, 17108.0, 176050.0, 711297.0, 121323.0, 13258.0, 2702.0, 840.0, 339.0, 155.0, 83.0, 57.0, 38.0, 20.0, 18.0, 13.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.487884521484375, -0.47283935546875, -0.457794189453125, -0.4427490234375, -0.427703857421875, -0.41265869140625, -0.397613525390625, -0.382568359375, -0.367523193359375, -0.35247802734375, -0.337432861328125, -0.3223876953125, -0.307342529296875, -0.29229736328125, -0.277252197265625, -0.26220703125, -0.247161865234375, -0.23211669921875, -0.217071533203125, -0.2020263671875, -0.186981201171875, -0.17193603515625, -0.156890869140625, -0.141845703125, -0.126800537109375, -0.11175537109375, -0.096710205078125, -0.0816650390625, -0.066619873046875, -0.05157470703125, -0.036529541015625, -0.021484375, -0.006439208984375, 0.00860595703125, 0.023651123046875, 0.0386962890625, 0.053741455078125, 0.06878662109375, 0.083831787109375, 0.098876953125, 0.113922119140625, 0.12896728515625, 0.144012451171875, 0.1590576171875, 0.174102783203125, 0.18914794921875, 0.204193115234375, 0.21923828125, 0.234283447265625, 0.24932861328125, 0.264373779296875, 0.2794189453125, 0.294464111328125, 0.30950927734375, 0.324554443359375, 0.339599609375, 0.354644775390625, 0.36968994140625, 0.384735107421875, 0.3997802734375, 0.414825439453125, 0.42987060546875, 0.444915771484375, 0.4599609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 9.0, 5.0, 18.0, 11.0, 23.0, 26.0, 33.0, 36.0, 54.0, 56.0, 63.0, 71.0, 67.0, 65.0, 78.0, 57.0, 65.0, 56.0, 41.0, 34.0, 24.0, 21.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061370849609375, -0.05948448181152344, -0.057598114013671875, -0.05571174621582031, -0.05382537841796875, -0.05193901062011719, -0.050052642822265625, -0.04816627502441406, -0.0462799072265625, -0.04439353942871094, -0.042507171630859375, -0.04062080383300781, -0.03873443603515625, -0.03684806823730469, -0.034961700439453125, -0.03307533264160156, -0.03118896484375, -0.029302597045898438, -0.027416229248046875, -0.025529861450195312, -0.02364349365234375, -0.021757125854492188, -0.019870758056640625, -0.017984390258789062, -0.0160980224609375, -0.014211654663085938, -0.012325286865234375, -0.010438919067382812, -0.00855255126953125, -0.0066661834716796875, -0.004779815673828125, -0.0028934478759765625, -0.001007080078125, 0.0008792877197265625, 0.002765655517578125, 0.0046520233154296875, 0.00653839111328125, 0.008424758911132812, 0.010311126708984375, 0.012197494506835938, 0.0140838623046875, 0.015970230102539062, 0.017856597900390625, 0.019742965698242188, 0.02162933349609375, 0.023515701293945312, 0.025402069091796875, 0.027288436889648438, 0.0291748046875, 0.031061172485351562, 0.032947540283203125, 0.03483390808105469, 0.03672027587890625, 0.03860664367675781, 0.040493011474609375, 0.04237937927246094, 0.0442657470703125, 0.04615211486816406, 0.048038482666015625, 0.04992485046386719, 0.05181121826171875, 0.05369758605957031, 0.055583953857421875, 0.05747032165527344, 0.059356689453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 15.0, 13.0, 39.0, 81.0, 82.0, 110.0, 115.0, 142.0, 123.0, 81.0, 62.0, 38.0, 29.0, 18.0, 18.0, 6.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0483486652374268, -1.98997163772583, -1.931594729423523, -1.8732177019119263, -1.8148406744003296, -1.7564637660980225, -1.6980867385864258, -1.639709711074829, -1.5813326835632324, -1.5229556560516357, -1.4645787477493286, -1.406201720237732, -1.3478246927261353, -1.2894477844238281, -1.2310707569122314, -1.1726937294006348, -1.1143168210983276, -1.055939793586731, -0.997562825679779, -0.9391858577728271, -0.8808088302612305, -0.8224318623542786, -0.7640548944473267, -0.70567786693573, -0.6473008990287781, -0.5889239311218262, -0.5305469036102295, -0.4721699357032776, -0.4137929379940033, -0.355415940284729, -0.2970389723777771, -0.2386619746685028, -0.18028485774993896, -0.12190786749124527, -0.06353087723255157, -0.0051538944244384766, 0.053223103284835815, 0.11160010099411011, 0.169977068901062, 0.2283540666103363, 0.2867310643196106, 0.3451080620288849, 0.4034850597381592, 0.4618620276451111, 0.520238995552063, 0.5786160230636597, 0.6369929909706116, 0.6953699588775635, 0.7537469863891602, 0.8121239542961121, 0.8705009818077087, 0.9288779497146606, 0.9872549772262573, 1.0456318855285645, 1.1040089130401611, 1.1623859405517578, 1.2207629680633545, 1.2791399955749512, 1.3375169038772583, 1.395893931388855, 1.4542709589004517, 1.5126478672027588, 1.5710248947143555, 1.6294019222259521, 1.6877788305282593]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 12.0, 7.0, 12.0, 6.0, 16.0, 14.0, 10.0, 13.0, 15.0, 15.0, 27.0, 34.0, 44.0, 41.0, 48.0, 38.0, 57.0, 45.0, 31.0, 55.0, 33.0, 21.0, 53.0, 37.0, 34.0, 36.0, 30.0, 35.0, 29.0, 20.0, 25.0, 22.0, 14.0, 16.0, 4.0, 9.0, 9.0, 9.0, 8.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8311824202537537, -0.8067749738693237, -0.7823675274848938, -0.7579600811004639, -0.7335526347160339, -0.709145188331604, -0.6847377419471741, -0.6603302955627441, -0.6359228491783142, -0.6115154027938843, -0.5871079564094543, -0.5627005100250244, -0.5382930636405945, -0.5138856172561646, -0.4894781708717346, -0.4650707244873047, -0.44066324830055237, -0.41625580191612244, -0.3918483555316925, -0.3674409091472626, -0.34303346276283264, -0.3186260163784027, -0.2942185401916504, -0.26981109380722046, -0.24540366232395172, -0.2209962159395218, -0.19658876955509186, -0.17218130826950073, -0.1477738618850708, -0.12336642295122147, -0.09895896911621094, -0.074551522731781, -0.050144076347351074, -0.025736628100275993, -0.0013291798532009125, 0.023078270256519318, 0.04748571664094925, 0.07189316302537918, 0.09630061686038971, 0.12070806324481964, 0.14511550962924957, 0.1695229560136795, 0.19393040239810944, 0.21833786368370056, 0.2427453100681305, 0.2671527564525604, 0.29156020283699036, 0.3159676492214203, 0.3403750956058502, 0.36478254199028015, 0.3891899883747101, 0.41359743475914, 0.43800488114356995, 0.4624123275279999, 0.4868198037147522, 0.5112272500991821, 0.5356346964836121, 0.560042142868042, 0.5844495892524719, 0.6088570356369019, 0.6332644820213318, 0.6576719284057617, 0.6820793747901917, 0.7064868211746216, 0.7308942675590515]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 8.0, 6.0, 17.0, 16.0, 26.0, 30.0, 45.0, 59.0, 93.0, 164.0, 263.0, 477.0, 917.0, 1967.0, 4225.0, 9298.0, 21263.0, 51639.0, 139694.0, 479150.0, 215024.0, 72435.0, 28822.0, 12243.0, 5367.0, 2493.0, 1273.0, 650.0, 334.0, 205.0, 98.0, 80.0, 34.0, 33.0, 34.0, 17.0, 11.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7646484375, -0.740509033203125, -0.71636962890625, -0.692230224609375, -0.6680908203125, -0.643951416015625, -0.61981201171875, -0.595672607421875, -0.571533203125, -0.547393798828125, -0.52325439453125, -0.499114990234375, -0.4749755859375, -0.450836181640625, -0.42669677734375, -0.402557373046875, -0.37841796875, -0.354278564453125, -0.33013916015625, -0.305999755859375, -0.2818603515625, -0.257720947265625, -0.23358154296875, -0.209442138671875, -0.185302734375, -0.161163330078125, -0.13702392578125, -0.112884521484375, -0.0887451171875, -0.064605712890625, -0.04046630859375, -0.016326904296875, 0.0078125, 0.031951904296875, 0.05609130859375, 0.080230712890625, 0.1043701171875, 0.128509521484375, 0.15264892578125, 0.176788330078125, 0.200927734375, 0.225067138671875, 0.24920654296875, 0.273345947265625, 0.2974853515625, 0.321624755859375, 0.34576416015625, 0.369903564453125, 0.39404296875, 0.418182373046875, 0.44232177734375, 0.466461181640625, 0.4906005859375, 0.514739990234375, 0.53887939453125, 0.563018798828125, 0.587158203125, 0.611297607421875, 0.63543701171875, 0.659576416015625, 0.6837158203125, 0.707855224609375, 0.73199462890625, 0.756134033203125, 0.7802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 3.0, 9.0, 11.0, 5.0, 14.0, 7.0, 13.0, 23.0, 20.0, 21.0, 26.0, 21.0, 40.0, 31.0, 43.0, 43.0, 47.0, 40.0, 42.0, 48.0, 36.0, 44.0, 41.0, 33.0, 35.0, 31.0, 23.0, 33.0, 26.0, 33.0, 17.0, 17.0, 14.0, 19.0, 12.0, 13.0, 13.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.791015625, -1.7405242919921875, -1.690032958984375, -1.6395416259765625, -1.58905029296875, -1.5385589599609375, -1.488067626953125, -1.4375762939453125, -1.3870849609375, -1.3365936279296875, -1.286102294921875, -1.2356109619140625, -1.18511962890625, -1.1346282958984375, -1.084136962890625, -1.0336456298828125, -0.983154296875, -0.9326629638671875, -0.882171630859375, -0.8316802978515625, -0.78118896484375, -0.7306976318359375, -0.680206298828125, -0.6297149658203125, -0.5792236328125, -0.5287322998046875, -0.478240966796875, -0.4277496337890625, -0.37725830078125, -0.3267669677734375, -0.276275634765625, -0.2257843017578125, -0.17529296875, -0.1248016357421875, -0.074310302734375, -0.0238189697265625, 0.02667236328125, 0.0771636962890625, 0.127655029296875, 0.1781463623046875, 0.2286376953125, 0.2791290283203125, 0.329620361328125, 0.3801116943359375, 0.43060302734375, 0.4810943603515625, 0.531585693359375, 0.5820770263671875, 0.632568359375, 0.6830596923828125, 0.733551025390625, 0.7840423583984375, 0.83453369140625, 0.8850250244140625, 0.935516357421875, 0.9860076904296875, 1.0364990234375, 1.0869903564453125, 1.137481689453125, 1.1879730224609375, 1.23846435546875, 1.2889556884765625, 1.339447021484375, 1.3899383544921875, 1.4404296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 7.0, 7.0, 13.0, 14.0, 10.0, 17.0, 22.0, 27.0, 35.0, 31.0, 37.0, 57.0, 85.0, 115.0, 411.0, 87717.0, 958613.0, 762.0, 165.0, 86.0, 58.0, 33.0, 38.0, 29.0, 35.0, 20.0, 18.0, 18.0, 18.0, 10.0, 7.0, 7.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.5823974609375, -8.297607421875, -8.0128173828125, -7.72802734375, -7.4432373046875, -7.158447265625, -6.8736572265625, -6.5888671875, -6.3040771484375, -6.019287109375, -5.7344970703125, -5.44970703125, -5.1649169921875, -4.880126953125, -4.5953369140625, -4.310546875, -4.0257568359375, -3.740966796875, -3.4561767578125, -3.17138671875, -2.8865966796875, -2.601806640625, -2.3170166015625, -2.0322265625, -1.7474365234375, -1.462646484375, -1.1778564453125, -0.89306640625, -0.6082763671875, -0.323486328125, -0.0386962890625, 0.24609375, 0.5308837890625, 0.815673828125, 1.1004638671875, 1.38525390625, 1.6700439453125, 1.954833984375, 2.2396240234375, 2.5244140625, 2.8092041015625, 3.093994140625, 3.3787841796875, 3.66357421875, 3.9483642578125, 4.233154296875, 4.5179443359375, 4.802734375, 5.0875244140625, 5.372314453125, 5.6571044921875, 5.94189453125, 6.2266845703125, 6.511474609375, 6.7962646484375, 7.0810546875, 7.3658447265625, 7.650634765625, 7.9354248046875, 8.22021484375, 8.5050048828125, 8.789794921875, 9.0745849609375, 9.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 5.0, 8.0, 11.0, 17.0, 18.0, 19.0, 26.0, 38.0, 28.0, 34.0, 37.0, 39.0, 49.0, 49.0, 43.0, 52.0, 57.0, 55.0, 51.0, 46.0, 45.0, 30.0, 32.0, 33.0, 36.0, 22.0, 20.0, 18.0, 12.0, 8.0, 16.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.01123046875, -1.9462890625, -1.88134765625, -1.81640625, -1.75146484375, -1.6865234375, -1.62158203125, -1.556640625, -1.49169921875, -1.4267578125, -1.36181640625, -1.296875, -1.23193359375, -1.1669921875, -1.10205078125, -1.037109375, -0.97216796875, -0.9072265625, -0.84228515625, -0.77734375, -0.71240234375, -0.6474609375, -0.58251953125, -0.517578125, -0.45263671875, -0.3876953125, -0.32275390625, -0.2578125, -0.19287109375, -0.1279296875, -0.06298828125, 0.001953125, 0.06689453125, 0.1318359375, 0.19677734375, 0.26171875, 0.32666015625, 0.3916015625, 0.45654296875, 0.521484375, 0.58642578125, 0.6513671875, 0.71630859375, 0.78125, 0.84619140625, 0.9111328125, 0.97607421875, 1.041015625, 1.10595703125, 1.1708984375, 1.23583984375, 1.30078125, 1.36572265625, 1.4306640625, 1.49560546875, 1.560546875, 1.62548828125, 1.6904296875, 1.75537109375, 1.8203125, 1.88525390625, 1.9501953125, 2.01513671875, 2.080078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 12.0, 25.0, 29.0, 40.0, 77.0, 277.0, 920.0, 8631.0, 936777.0, 98358.0, 2655.0, 422.0, 138.0, 68.0, 34.0, 23.0, 17.0, 9.0, 6.0, 12.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.272796630859375, -1.22528076171875, -1.177764892578125, -1.1302490234375, -1.082733154296875, -1.03521728515625, -0.987701416015625, -0.940185546875, -0.892669677734375, -0.84515380859375, -0.797637939453125, -0.7501220703125, -0.702606201171875, -0.65509033203125, -0.607574462890625, -0.56005859375, -0.512542724609375, -0.46502685546875, -0.417510986328125, -0.3699951171875, -0.322479248046875, -0.27496337890625, -0.227447509765625, -0.179931640625, -0.132415771484375, -0.08489990234375, -0.037384033203125, 0.0101318359375, 0.057647705078125, 0.10516357421875, 0.152679443359375, 0.2001953125, 0.247711181640625, 0.29522705078125, 0.342742919921875, 0.3902587890625, 0.437774658203125, 0.48529052734375, 0.532806396484375, 0.580322265625, 0.627838134765625, 0.67535400390625, 0.722869873046875, 0.7703857421875, 0.817901611328125, 0.86541748046875, 0.912933349609375, 0.96044921875, 1.007965087890625, 1.05548095703125, 1.102996826171875, 1.1505126953125, 1.198028564453125, 1.24554443359375, 1.293060302734375, 1.340576171875, 1.388092041015625, 1.43560791015625, 1.483123779296875, 1.5306396484375, 1.578155517578125, 1.62567138671875, 1.673187255859375, 1.720703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 13.0, 39.0, 58.0, 106.0, 219.0, 263.0, 122.0, 67.0, 22.0, 23.0, 14.0, 13.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.130073547363281e-05, -7.778778672218323e-05, -7.427483797073364e-05, -7.076188921928406e-05, -6.724894046783447e-05, -6.373599171638489e-05, -6.02230429649353e-05, -5.671009421348572e-05, -5.319714546203613e-05, -4.968419671058655e-05, -4.617124795913696e-05, -4.265829920768738e-05, -3.914535045623779e-05, -3.563240170478821e-05, -3.211945295333862e-05, -2.8606504201889038e-05, -2.5093555450439453e-05, -2.1580606698989868e-05, -1.8067657947540283e-05, -1.4554709196090698e-05, -1.1041760444641113e-05, -7.528811693191528e-06, -4.015862941741943e-06, -5.029141902923584e-07, 3.0100345611572266e-06, 6.5229833126068115e-06, 1.0035932064056396e-05, 1.3548880815505981e-05, 1.7061829566955566e-05, 2.057477831840515e-05, 2.4087727069854736e-05, 2.760067582130432e-05, 3.1113624572753906e-05, 3.462657332420349e-05, 3.8139522075653076e-05, 4.165247082710266e-05, 4.5165419578552246e-05, 4.867836833000183e-05, 5.2191317081451416e-05, 5.5704265832901e-05, 5.9217214584350586e-05, 6.273016333580017e-05, 6.624311208724976e-05, 6.975606083869934e-05, 7.326900959014893e-05, 7.678195834159851e-05, 8.02949070930481e-05, 8.380785584449768e-05, 8.732080459594727e-05, 9.083375334739685e-05, 9.434670209884644e-05, 9.785965085029602e-05, 0.0001013725996017456, 0.00010488554835319519, 0.00010839849710464478, 0.00011191144585609436, 0.00011542439460754395, 0.00011893734335899353, 0.00012245029211044312, 0.0001259632408618927, 0.00012947618961334229, 0.00013298913836479187, 0.00013650208711624146, 0.00014001503586769104, 0.00014352798461914062]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 9.0, 14.0, 17.0, 30.0, 47.0, 109.0, 262.0, 759.0, 3097.0, 28242.0, 914627.0, 93270.0, 6088.0, 1252.0, 386.0, 155.0, 62.0, 34.0, 30.0, 13.0, 8.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.9323272705078125, -0.899810791015625, -0.8672943115234375, -0.83477783203125, -0.8022613525390625, -0.769744873046875, -0.7372283935546875, -0.7047119140625, -0.6721954345703125, -0.639678955078125, -0.6071624755859375, -0.57464599609375, -0.5421295166015625, -0.509613037109375, -0.4770965576171875, -0.444580078125, -0.4120635986328125, -0.379547119140625, -0.3470306396484375, -0.31451416015625, -0.2819976806640625, -0.249481201171875, -0.2169647216796875, -0.1844482421875, -0.1519317626953125, -0.119415283203125, -0.0868988037109375, -0.05438232421875, -0.0218658447265625, 0.010650634765625, 0.0431671142578125, 0.07568359375, 0.1082000732421875, 0.140716552734375, 0.1732330322265625, 0.20574951171875, 0.2382659912109375, 0.270782470703125, 0.3032989501953125, 0.3358154296875, 0.3683319091796875, 0.400848388671875, 0.4333648681640625, 0.46588134765625, 0.4983978271484375, 0.530914306640625, 0.5634307861328125, 0.595947265625, 0.6284637451171875, 0.660980224609375, 0.6934967041015625, 0.72601318359375, 0.7585296630859375, 0.791046142578125, 0.8235626220703125, 0.8560791015625, 0.8885955810546875, 0.921112060546875, 0.9536285400390625, 0.98614501953125, 1.0186614990234375, 1.051177978515625, 1.0836944580078125, 1.1162109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 16.0, 29.0, 19.0, 79.0, 154.0, 316.0, 173.0, 63.0, 48.0, 20.0, 15.0, 16.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2993621826171875, -0.288909912109375, -0.2784576416015625, -0.26800537109375, -0.2575531005859375, -0.247100830078125, -0.2366485595703125, -0.2261962890625, -0.2157440185546875, -0.205291748046875, -0.1948394775390625, -0.18438720703125, -0.1739349365234375, -0.163482666015625, -0.1530303955078125, -0.142578125, -0.1321258544921875, -0.121673583984375, -0.1112213134765625, -0.10076904296875, -0.0903167724609375, -0.079864501953125, -0.0694122314453125, -0.0589599609375, -0.0485076904296875, -0.038055419921875, -0.0276031494140625, -0.01715087890625, -0.0066986083984375, 0.003753662109375, 0.0142059326171875, 0.024658203125, 0.0351104736328125, 0.045562744140625, 0.0560150146484375, 0.06646728515625, 0.0769195556640625, 0.087371826171875, 0.0978240966796875, 0.1082763671875, 0.1187286376953125, 0.129180908203125, 0.1396331787109375, 0.15008544921875, 0.1605377197265625, 0.170989990234375, 0.1814422607421875, 0.19189453125, 0.2023468017578125, 0.212799072265625, 0.2232513427734375, 0.23370361328125, 0.2441558837890625, 0.254608154296875, 0.2650604248046875, 0.2755126953125, 0.2859649658203125, 0.296417236328125, 0.3068695068359375, 0.31732177734375, 0.3277740478515625, 0.338226318359375, 0.3486785888671875, 0.359130859375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 42.0, 197.0, 384.0, 290.0, 69.0, 15.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.681331634521484, -21.291372299194336, -20.901411056518555, -20.511451721191406, -20.121490478515625, -19.731531143188477, -19.341569900512695, -18.951610565185547, -18.561649322509766, -18.171689987182617, -17.781728744506836, -17.391769409179688, -17.001808166503906, -16.611848831176758, -16.221887588500977, -15.831928253173828, -15.441967964172363, -15.052007675170898, -14.662047386169434, -14.272087097167969, -13.882126808166504, -13.492166519165039, -13.10220718383789, -12.71224594116211, -12.322286605834961, -11.932326316833496, -11.542366027832031, -11.152405738830566, -10.762445449829102, -10.372485160827637, -9.982524871826172, -9.592565536499023, -9.202604293823242, -8.812644004821777, -8.422683715820312, -8.032723426818848, -7.642763137817383, -7.252802848815918, -6.862843036651611, -6.4728827476501465, -6.082921981811523, -5.692961692810059, -5.303001403808594, -4.913041114807129, -4.523080825805664, -4.133120536804199, -3.7431607246398926, -3.3532004356384277, -2.963240385055542, -2.573280096054077, -2.1833200454711914, -1.7933597564697266, -1.4033994674682617, -1.0134391784667969, -0.6234791278839111, -0.2335188388824463, 0.15644145011901855, 0.5464016795158386, 0.9363619089126587, 1.326322078704834, 1.7162823677062988, 2.1062426567077637, 2.4962027072906494, 2.8861629962921143, 3.276123285293579]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 7.0, 4.0, 7.0, 5.0, 7.0, 17.0, 16.0, 21.0, 26.0, 24.0, 20.0, 26.0, 29.0, 25.0, 35.0, 33.0, 32.0, 34.0, 28.0, 33.0, 47.0, 46.0, 46.0, 39.0, 48.0, 37.0, 31.0, 34.0, 23.0, 41.0, 27.0, 22.0, 18.0, 17.0, 11.0, 16.0, 12.0, 6.0, 13.0, 4.0, 8.0, 10.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0], "bins": [-2.9436018466949463, -2.8690743446350098, -2.7945470809936523, -2.720019817352295, -2.6454923152923584, -2.570964813232422, -2.4964375495910645, -2.421910285949707, -2.3473827838897705, -2.272855281829834, -2.1983280181884766, -2.123800754547119, -2.0492732524871826, -1.9747458696365356, -1.9002184867858887, -1.8256911039352417, -1.7511637210845947, -1.6766363382339478, -1.6021089553833008, -1.5275815725326538, -1.4530541896820068, -1.3785268068313599, -1.303999423980713, -1.229472041130066, -1.154944658279419, -1.080417275428772, -1.005889892578125, -0.931362509727478, -0.856835126876831, -0.7823077440261841, -0.7077803611755371, -0.6332529783248901, -0.5587254762649536, -0.48419809341430664, -0.40967071056365967, -0.3351433277130127, -0.2606159448623657, -0.18608856201171875, -0.11156117916107178, -0.037033796310424805, 0.03749358654022217, 0.11202096939086914, 0.1865483522415161, 0.2610757350921631, 0.33560311794281006, 0.41013050079345703, 0.484657883644104, 0.559185266494751, 0.633712649345398, 0.7082400321960449, 0.7827674150466919, 0.8572947978973389, 0.9318221807479858, 1.0063495635986328, 1.0808769464492798, 1.1554043292999268, 1.2299317121505737, 1.3044590950012207, 1.3789864778518677, 1.4535138607025146, 1.5280412435531616, 1.6025686264038086, 1.6770960092544556, 1.7516233921051025, 1.8261507749557495]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 7.0, 11.0, 17.0, 34.0, 49.0, 73.0, 101.0, 205.0, 400.0, 801.0, 2060.0, 6292.0, 24952.0, 155174.0, 1007214.0, 2138552.0, 716245.0, 111892.0, 21589.0, 5462.0, 1764.0, 716.0, 288.0, 146.0, 93.0, 57.0, 26.0, 21.0, 9.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.33203125, -2.2743072509765625, -2.216583251953125, -2.1588592529296875, -2.10113525390625, -2.0434112548828125, -1.985687255859375, -1.9279632568359375, -1.8702392578125, -1.8125152587890625, -1.754791259765625, -1.6970672607421875, -1.63934326171875, -1.5816192626953125, -1.523895263671875, -1.4661712646484375, -1.408447265625, -1.3507232666015625, -1.292999267578125, -1.2352752685546875, -1.17755126953125, -1.1198272705078125, -1.062103271484375, -1.0043792724609375, -0.9466552734375, -0.8889312744140625, -0.831207275390625, -0.7734832763671875, -0.71575927734375, -0.6580352783203125, -0.600311279296875, -0.5425872802734375, -0.48486328125, -0.4271392822265625, -0.369415283203125, -0.3116912841796875, -0.25396728515625, -0.1962432861328125, -0.138519287109375, -0.0807952880859375, -0.0230712890625, 0.0346527099609375, 0.092376708984375, 0.1501007080078125, 0.20782470703125, 0.2655487060546875, 0.323272705078125, 0.3809967041015625, 0.438720703125, 0.4964447021484375, 0.554168701171875, 0.6118927001953125, 0.66961669921875, 0.7273406982421875, 0.785064697265625, 0.8427886962890625, 0.9005126953125, 0.9582366943359375, 1.015960693359375, 1.0736846923828125, 1.13140869140625, 1.1891326904296875, 1.246856689453125, 1.3045806884765625, 1.3623046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 18.0, 16.0, 14.0, 26.0, 24.0, 25.0, 21.0, 48.0, 43.0, 41.0, 44.0, 46.0, 46.0, 57.0, 51.0, 63.0, 58.0, 36.0, 40.0, 42.0, 37.0, 36.0, 26.0, 25.0, 19.0, 13.0, 11.0, 16.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3869781494140625, -1.343292236328125, -1.2996063232421875, -1.25592041015625, -1.2122344970703125, -1.168548583984375, -1.1248626708984375, -1.0811767578125, -1.0374908447265625, -0.993804931640625, -0.9501190185546875, -0.90643310546875, -0.8627471923828125, -0.819061279296875, -0.7753753662109375, -0.731689453125, -0.6880035400390625, -0.644317626953125, -0.6006317138671875, -0.55694580078125, -0.5132598876953125, -0.469573974609375, -0.4258880615234375, -0.3822021484375, -0.3385162353515625, -0.294830322265625, -0.2511444091796875, -0.20745849609375, -0.1637725830078125, -0.120086669921875, -0.0764007568359375, -0.03271484375, 0.0109710693359375, 0.054656982421875, 0.0983428955078125, 0.14202880859375, 0.1857147216796875, 0.229400634765625, 0.2730865478515625, 0.3167724609375, 0.3604583740234375, 0.404144287109375, 0.4478302001953125, 0.49151611328125, 0.5352020263671875, 0.578887939453125, 0.6225738525390625, 0.666259765625, 0.7099456787109375, 0.753631591796875, 0.7973175048828125, 0.84100341796875, 0.8846893310546875, 0.928375244140625, 0.9720611572265625, 1.0157470703125, 1.0594329833984375, 1.103118896484375, 1.1468048095703125, 1.19049072265625, 1.2341766357421875, 1.277862548828125, 1.3215484619140625, 1.365234375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 10.0, 11.0, 12.0, 12.0, 25.0, 46.0, 49.0, 80.0, 114.0, 247.0, 516.0, 1970.0, 12255.0, 590468.0, 3546778.0, 36671.0, 3470.0, 778.0, 275.0, 162.0, 102.0, 65.0, 42.0, 28.0, 22.0, 20.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.23150634765625, -4.0958251953125, -3.96014404296875, -3.824462890625, -3.68878173828125, -3.5531005859375, -3.41741943359375, -3.28173828125, -3.14605712890625, -3.0103759765625, -2.87469482421875, -2.739013671875, -2.60333251953125, -2.4676513671875, -2.33197021484375, -2.1962890625, -2.06060791015625, -1.9249267578125, -1.78924560546875, -1.653564453125, -1.51788330078125, -1.3822021484375, -1.24652099609375, -1.11083984375, -0.97515869140625, -0.8394775390625, -0.70379638671875, -0.568115234375, -0.43243408203125, -0.2967529296875, -0.16107177734375, -0.025390625, 0.11029052734375, 0.2459716796875, 0.38165283203125, 0.517333984375, 0.65301513671875, 0.7886962890625, 0.92437744140625, 1.06005859375, 1.19573974609375, 1.3314208984375, 1.46710205078125, 1.602783203125, 1.73846435546875, 1.8741455078125, 2.00982666015625, 2.1455078125, 2.28118896484375, 2.4168701171875, 2.55255126953125, 2.688232421875, 2.82391357421875, 2.9595947265625, 3.09527587890625, 3.23095703125, 3.36663818359375, 3.5023193359375, 3.63800048828125, 3.773681640625, 3.90936279296875, 4.0450439453125, 4.18072509765625, 4.31640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 11.0, 6.0, 15.0, 11.0, 12.0, 34.0, 45.0, 46.0, 81.0, 108.0, 187.0, 233.0, 387.0, 525.0, 586.0, 558.0, 401.0, 292.0, 181.0, 115.0, 70.0, 39.0, 38.0, 24.0, 21.0, 9.0, 13.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6299285888671875, -0.609954833984375, -0.5899810791015625, -0.57000732421875, -0.5500335693359375, -0.530059814453125, -0.5100860595703125, -0.4901123046875, -0.4701385498046875, -0.450164794921875, -0.4301910400390625, -0.41021728515625, -0.3902435302734375, -0.370269775390625, -0.3502960205078125, -0.330322265625, -0.3103485107421875, -0.290374755859375, -0.2704010009765625, -0.25042724609375, -0.2304534912109375, -0.210479736328125, -0.1905059814453125, -0.1705322265625, -0.1505584716796875, -0.130584716796875, -0.1106109619140625, -0.09063720703125, -0.0706634521484375, -0.050689697265625, -0.0307159423828125, -0.0107421875, 0.0092315673828125, 0.029205322265625, 0.0491790771484375, 0.06915283203125, 0.0891265869140625, 0.109100341796875, 0.1290740966796875, 0.1490478515625, 0.1690216064453125, 0.188995361328125, 0.2089691162109375, 0.22894287109375, 0.2489166259765625, 0.268890380859375, 0.2888641357421875, 0.308837890625, 0.3288116455078125, 0.348785400390625, 0.3687591552734375, 0.38873291015625, 0.4087066650390625, 0.428680419921875, 0.4486541748046875, 0.4686279296875, 0.4886016845703125, 0.508575439453125, 0.5285491943359375, 0.54852294921875, 0.5684967041015625, 0.588470458984375, 0.6084442138671875, 0.62841796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 16.0, 18.0, 24.0, 47.0, 63.0, 83.0, 121.0, 134.0, 121.0, 110.0, 90.0, 64.0, 35.0, 29.0, 14.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.809737205505371, -2.7159247398376465, -2.622112274169922, -2.5282998085021973, -2.4344875812530518, -2.340675115585327, -2.2468626499176025, -2.153050184249878, -2.0592379570007324, -1.9654254913330078, -1.8716131448745728, -1.7778006792068481, -1.683988332748413, -1.5901758670806885, -1.4963634014129639, -1.4025509357452393, -1.3087384700775146, -1.21492600440979, -1.121113657951355, -1.0273011922836304, -0.9334887862205505, -0.8396763801574707, -0.7458639144897461, -0.6520515084266663, -0.5582391023635864, -0.4644266963005066, -0.37061426043510437, -0.27680182456970215, -0.18298941850662231, -0.08917701244354248, 0.004635453224182129, 0.09844785928726196, 0.1922605037689209, 0.28607290983200073, 0.37988534569740295, 0.4736977815628052, 0.567510187625885, 0.6613225936889648, 0.7551350593566895, 0.8489474654197693, 0.9427598714828491, 1.0365723371505737, 1.1303846836090088, 1.2241971492767334, 1.318009614944458, 1.411821961402893, 1.5056344270706177, 1.5994467735290527, 1.6932592391967773, 1.787071704864502, 1.880884051322937, 1.9746965169906616, 2.0685088634490967, 2.1623213291168213, 2.256133794784546, 2.3499462604522705, 2.443758487701416, 2.5375709533691406, 2.6313834190368652, 2.72519588470459, 2.8190081119537354, 2.91282057762146, 3.0066330432891846, 3.100445508956909, 3.194257974624634]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 2.0, 10.0, 3.0, 9.0, 7.0, 11.0, 14.0, 13.0, 10.0, 18.0, 15.0, 25.0, 28.0, 36.0, 24.0, 40.0, 33.0, 34.0, 40.0, 42.0, 43.0, 40.0, 43.0, 33.0, 46.0, 28.0, 36.0, 33.0, 48.0, 39.0, 26.0, 31.0, 15.0, 20.0, 13.0, 15.0, 16.0, 6.0, 8.0, 10.0, 3.0, 8.0, 8.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.2898352146148682, -1.252617359161377, -1.2153996229171753, -1.178181767463684, -1.1409639120101929, -1.1037461757659912, -1.0665283203125, -1.0293104648590088, -0.9920926690101624, -0.9548748731613159, -0.9176570177078247, -0.8804392218589783, -0.8432214260101318, -0.8060035705566406, -0.7687857747077942, -0.7315679788589478, -0.6943501234054565, -0.6571323275566101, -0.6199144721031189, -0.5826966762542725, -0.5454788208007812, -0.5082610249519348, -0.4710432291030884, -0.43382540345191956, -0.39660757780075073, -0.3593897521495819, -0.3221719264984131, -0.28495413064956665, -0.24773630499839783, -0.210518479347229, -0.17330066859722137, -0.13608285784721375, -0.09886491298675537, -0.061647094786167145, -0.02442927658557892, 0.012788541615009308, 0.050006359815597534, 0.08722418546676636, 0.12444199621677399, 0.16165980696678162, 0.19887763261795044, 0.23609545826911926, 0.2733132839202881, 0.3105310797691345, 0.34774890542030334, 0.38496673107147217, 0.4221845269203186, 0.4594023525714874, 0.49662017822265625, 0.5338379740715027, 0.5710558295249939, 0.6082736253738403, 0.6454914808273315, 0.682709276676178, 0.7199270725250244, 0.7571449279785156, 0.7943627238273621, 0.8315805196762085, 0.8687983751296997, 0.9060161709785461, 0.9432339668273926, 0.9804518222808838, 1.017669677734375, 1.0548874139785767, 1.0921052694320679]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 18.0, 15.0, 33.0, 37.0, 105.0, 171.0, 334.0, 964.0, 2925.0, 11639.0, 61414.0, 388248.0, 482786.0, 80044.0, 14669.0, 3377.0, 1041.0, 385.0, 155.0, 79.0, 52.0, 34.0, 9.0, 10.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19140625, -1.1623992919921875, -1.133392333984375, -1.1043853759765625, -1.07537841796875, -1.0463714599609375, -1.017364501953125, -0.9883575439453125, -0.9593505859375, -0.9303436279296875, -0.901336669921875, -0.8723297119140625, -0.84332275390625, -0.8143157958984375, -0.785308837890625, -0.7563018798828125, -0.727294921875, -0.6982879638671875, -0.669281005859375, -0.6402740478515625, -0.61126708984375, -0.5822601318359375, -0.553253173828125, -0.5242462158203125, -0.4952392578125, -0.4662322998046875, -0.437225341796875, -0.4082183837890625, -0.37921142578125, -0.3502044677734375, -0.321197509765625, -0.2921905517578125, -0.26318359375, -0.2341766357421875, -0.205169677734375, -0.1761627197265625, -0.14715576171875, -0.1181488037109375, -0.089141845703125, -0.0601348876953125, -0.0311279296875, -0.0021209716796875, 0.026885986328125, 0.0558929443359375, 0.08489990234375, 0.1139068603515625, 0.142913818359375, 0.1719207763671875, 0.200927734375, 0.2299346923828125, 0.258941650390625, 0.2879486083984375, 0.31695556640625, 0.3459625244140625, 0.374969482421875, 0.4039764404296875, 0.4329833984375, 0.4619903564453125, 0.490997314453125, 0.5200042724609375, 0.54901123046875, 0.5780181884765625, 0.607025146484375, 0.6360321044921875, 0.6650390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 9.0, 11.0, 7.0, 10.0, 9.0, 21.0, 23.0, 23.0, 33.0, 27.0, 46.0, 54.0, 51.0, 64.0, 53.0, 57.0, 68.0, 51.0, 57.0, 43.0, 61.0, 44.0, 34.0, 38.0, 21.0, 16.0, 18.0, 11.0, 8.0, 8.0, 6.0, 9.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.181640625, -1.151092529296875, -1.12054443359375, -1.089996337890625, -1.0594482421875, -1.028900146484375, -0.99835205078125, -0.967803955078125, -0.937255859375, -0.906707763671875, -0.87615966796875, -0.845611572265625, -0.8150634765625, -0.784515380859375, -0.75396728515625, -0.723419189453125, -0.69287109375, -0.662322998046875, -0.63177490234375, -0.601226806640625, -0.5706787109375, -0.540130615234375, -0.50958251953125, -0.479034423828125, -0.448486328125, -0.417938232421875, -0.38739013671875, -0.356842041015625, -0.3262939453125, -0.295745849609375, -0.26519775390625, -0.234649658203125, -0.2041015625, -0.173553466796875, -0.14300537109375, -0.112457275390625, -0.0819091796875, -0.051361083984375, -0.02081298828125, 0.009735107421875, 0.040283203125, 0.070831298828125, 0.10137939453125, 0.131927490234375, 0.1624755859375, 0.193023681640625, 0.22357177734375, 0.254119873046875, 0.28466796875, 0.315216064453125, 0.34576416015625, 0.376312255859375, 0.4068603515625, 0.437408447265625, 0.46795654296875, 0.498504638671875, 0.529052734375, 0.559600830078125, 0.59014892578125, 0.620697021484375, 0.6512451171875, 0.681793212890625, 0.71234130859375, 0.742889404296875, 0.7734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 13.0, 21.0, 28.0, 28.0, 49.0, 63.0, 87.0, 147.0, 211.0, 362.0, 631.0, 1149.0, 2302.0, 4955.0, 11537.0, 27506.0, 69143.0, 175107.0, 338799.0, 245990.0, 101106.0, 39664.0, 16264.0, 6826.0, 3085.0, 1423.0, 813.0, 425.0, 252.0, 166.0, 114.0, 82.0, 50.0, 40.0, 17.0, 16.0, 21.0, 15.0, 2.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.461181640625, -0.4478912353515625, -0.434600830078125, -0.4213104248046875, -0.40802001953125, -0.3947296142578125, -0.381439208984375, -0.3681488037109375, -0.3548583984375, -0.3415679931640625, -0.328277587890625, -0.3149871826171875, -0.30169677734375, -0.2884063720703125, -0.275115966796875, -0.2618255615234375, -0.24853515625, -0.2352447509765625, -0.221954345703125, -0.2086639404296875, -0.19537353515625, -0.1820831298828125, -0.168792724609375, -0.1555023193359375, -0.1422119140625, -0.1289215087890625, -0.115631103515625, -0.1023406982421875, -0.08905029296875, -0.0757598876953125, -0.062469482421875, -0.0491790771484375, -0.035888671875, -0.0225982666015625, -0.009307861328125, 0.0039825439453125, 0.01727294921875, 0.0305633544921875, 0.043853759765625, 0.0571441650390625, 0.0704345703125, 0.0837249755859375, 0.097015380859375, 0.1103057861328125, 0.12359619140625, 0.1368865966796875, 0.150177001953125, 0.1634674072265625, 0.1767578125, 0.1900482177734375, 0.203338623046875, 0.2166290283203125, 0.22991943359375, 0.2432098388671875, 0.256500244140625, 0.2697906494140625, 0.2830810546875, 0.2963714599609375, 0.309661865234375, 0.3229522705078125, 0.33624267578125, 0.3495330810546875, 0.362823486328125, 0.3761138916015625, 0.389404296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 13.0, 12.0, 9.0, 20.0, 14.0, 22.0, 19.0, 37.0, 28.0, 40.0, 40.0, 38.0, 37.0, 51.0, 48.0, 46.0, 51.0, 54.0, 46.0, 58.0, 46.0, 38.0, 28.0, 27.0, 32.0, 26.0, 22.0, 15.0, 8.0, 10.0, 9.0, 8.0, 10.0, 7.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.638671875, -1.5912322998046875, -1.543792724609375, -1.4963531494140625, -1.44891357421875, -1.4014739990234375, -1.354034423828125, -1.3065948486328125, -1.2591552734375, -1.2117156982421875, -1.164276123046875, -1.1168365478515625, -1.06939697265625, -1.0219573974609375, -0.974517822265625, -0.9270782470703125, -0.879638671875, -0.8321990966796875, -0.784759521484375, -0.7373199462890625, -0.68988037109375, -0.6424407958984375, -0.595001220703125, -0.5475616455078125, -0.5001220703125, -0.4526824951171875, -0.405242919921875, -0.3578033447265625, -0.31036376953125, -0.2629241943359375, -0.215484619140625, -0.1680450439453125, -0.12060546875, -0.0731658935546875, -0.025726318359375, 0.0217132568359375, 0.06915283203125, 0.1165924072265625, 0.164031982421875, 0.2114715576171875, 0.2589111328125, 0.3063507080078125, 0.353790283203125, 0.4012298583984375, 0.44866943359375, 0.4961090087890625, 0.543548583984375, 0.5909881591796875, 0.638427734375, 0.6858673095703125, 0.733306884765625, 0.7807464599609375, 0.82818603515625, 0.8756256103515625, 0.923065185546875, 0.9705047607421875, 1.0179443359375, 1.0653839111328125, 1.112823486328125, 1.1602630615234375, 1.20770263671875, 1.2551422119140625, 1.302581787109375, 1.3500213623046875, 1.3974609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 10.0, 12.0, 24.0, 20.0, 31.0, 52.0, 72.0, 107.0, 153.0, 266.0, 364.0, 683.0, 1093.0, 1869.0, 3596.0, 6711.0, 13939.0, 31665.0, 88997.0, 279339.0, 384240.0, 147632.0, 48323.0, 19441.0, 9073.0, 4629.0, 2490.0, 1387.0, 861.0, 505.0, 310.0, 224.0, 138.0, 95.0, 60.0, 37.0, 23.0, 26.0, 12.0, 4.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.192626953125, -0.1866474151611328, -0.18066787719726562, -0.17468833923339844, -0.16870880126953125, -0.16272926330566406, -0.15674972534179688, -0.1507701873779297, -0.1447906494140625, -0.1388111114501953, -0.13283157348632812, -0.12685203552246094, -0.12087249755859375, -0.11489295959472656, -0.10891342163085938, -0.10293388366699219, -0.096954345703125, -0.09097480773925781, -0.08499526977539062, -0.07901573181152344, -0.07303619384765625, -0.06705665588378906, -0.061077117919921875, -0.05509757995605469, -0.0491180419921875, -0.04313850402832031, -0.037158966064453125, -0.031179428100585938, -0.02519989013671875, -0.019220352172851562, -0.013240814208984375, -0.0072612762451171875, -0.00128173828125, 0.0046977996826171875, 0.010677337646484375, 0.016656875610351562, 0.02263641357421875, 0.028615951538085938, 0.034595489501953125, 0.04057502746582031, 0.0465545654296875, 0.05253410339355469, 0.058513641357421875, 0.06449317932128906, 0.07047271728515625, 0.07645225524902344, 0.08243179321289062, 0.08841133117675781, 0.094390869140625, 0.10037040710449219, 0.10634994506835938, 0.11232948303222656, 0.11830902099609375, 0.12428855895996094, 0.13026809692382812, 0.1362476348876953, 0.1422271728515625, 0.1482067108154297, 0.15418624877929688, 0.16016578674316406, 0.16614532470703125, 0.17212486267089844, 0.17810440063476562, 0.1840839385986328, 0.1900634765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 14.0, 15.0, 41.0, 36.0, 64.0, 108.0, 157.0, 169.0, 143.0, 84.0, 52.0, 31.0, 29.0, 14.0, 9.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00015306472778320312, -0.0001476295292377472, -0.00014219433069229126, -0.00013675913214683533, -0.0001313239336013794, -0.00012588873505592346, -0.00012045353651046753, -0.0001150183379650116, -0.00010958313941955566, -0.00010414794087409973, -9.87127423286438e-05, -9.327754378318787e-05, -8.784234523773193e-05, -8.2407146692276e-05, -7.697194814682007e-05, -7.153674960136414e-05, -6.61015510559082e-05, -6.066635251045227e-05, -5.523115396499634e-05, -4.9795955419540405e-05, -4.436075687408447e-05, -3.892555832862854e-05, -3.349035978317261e-05, -2.8055161237716675e-05, -2.2619962692260742e-05, -1.718476414680481e-05, -1.1749565601348877e-05, -6.314367055892944e-06, -8.791685104370117e-07, 4.556030035018921e-06, 9.991228580474854e-06, 1.5426427125930786e-05, 2.086162567138672e-05, 2.629682421684265e-05, 3.1732022762298584e-05, 3.7167221307754517e-05, 4.260241985321045e-05, 4.803761839866638e-05, 5.3472816944122314e-05, 5.890801548957825e-05, 6.434321403503418e-05, 6.977841258049011e-05, 7.521361112594604e-05, 8.064880967140198e-05, 8.608400821685791e-05, 9.151920676231384e-05, 9.695440530776978e-05, 0.00010238960385322571, 0.00010782480239868164, 0.00011326000094413757, 0.0001186951994895935, 0.00012413039803504944, 0.00012956559658050537, 0.0001350007951259613, 0.00014043599367141724, 0.00014587119221687317, 0.0001513063907623291, 0.00015674158930778503, 0.00016217678785324097, 0.0001676119863986969, 0.00017304718494415283, 0.00017848238348960876, 0.0001839175820350647, 0.00018935278058052063, 0.00019478797912597656]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 25.0, 42.0, 50.0, 93.0, 135.0, 267.0, 610.0, 1506.0, 4159.0, 13943.0, 60360.0, 380559.0, 480742.0, 80184.0, 17482.0, 5116.0, 1743.0, 691.0, 335.0, 166.0, 98.0, 41.0, 32.0, 22.0, 17.0, 9.0, 10.0, 16.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.29845428466796875, -0.2878265380859375, -0.27719879150390625, -0.266571044921875, -0.25594329833984375, -0.2453155517578125, -0.23468780517578125, -0.22406005859375, -0.21343231201171875, -0.2028045654296875, -0.19217681884765625, -0.181549072265625, -0.17092132568359375, -0.1602935791015625, -0.14966583251953125, -0.1390380859375, -0.12841033935546875, -0.1177825927734375, -0.10715484619140625, -0.096527099609375, -0.08589935302734375, -0.0752716064453125, -0.06464385986328125, -0.05401611328125, -0.04338836669921875, -0.0327606201171875, -0.02213287353515625, -0.011505126953125, -0.00087738037109375, 0.0097503662109375, 0.02037811279296875, 0.031005859375, 0.04163360595703125, 0.0522613525390625, 0.06288909912109375, 0.073516845703125, 0.08414459228515625, 0.0947723388671875, 0.10540008544921875, 0.11602783203125, 0.12665557861328125, 0.1372833251953125, 0.14791107177734375, 0.158538818359375, 0.16916656494140625, 0.1797943115234375, 0.19042205810546875, 0.2010498046875, 0.21167755126953125, 0.2223052978515625, 0.23293304443359375, 0.243560791015625, 0.25418853759765625, 0.2648162841796875, 0.27544403076171875, 0.28607177734375, 0.29669952392578125, 0.3073272705078125, 0.31795501708984375, 0.328582763671875, 0.33921051025390625, 0.3498382568359375, 0.36046600341796875, 0.37109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 16.0, 14.0, 11.0, 18.0, 27.0, 23.0, 40.0, 46.0, 64.0, 62.0, 78.0, 74.0, 86.0, 69.0, 50.0, 51.0, 41.0, 32.0, 31.0, 33.0, 7.0, 20.0, 12.0, 13.0, 5.0, 7.0, 5.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.0410923957824707, -0.039429664611816406, -0.03776693344116211, -0.03610420227050781, -0.034441471099853516, -0.03277873992919922, -0.031116008758544922, -0.029453277587890625, -0.027790546417236328, -0.02612781524658203, -0.024465084075927734, -0.022802352905273438, -0.02113962173461914, -0.019476890563964844, -0.017814159393310547, -0.01615142822265625, -0.014488697052001953, -0.012825965881347656, -0.01116323471069336, -0.009500503540039062, -0.007837772369384766, -0.006175041198730469, -0.004512310028076172, -0.002849578857421875, -0.0011868476867675781, 0.00047588348388671875, 0.0021386146545410156, 0.0038013458251953125, 0.005464076995849609, 0.007126808166503906, 0.008789539337158203, 0.0104522705078125, 0.012115001678466797, 0.013777732849121094, 0.01544046401977539, 0.017103195190429688, 0.018765926361083984, 0.02042865753173828, 0.022091388702392578, 0.023754119873046875, 0.025416851043701172, 0.02707958221435547, 0.028742313385009766, 0.030405044555664062, 0.03206777572631836, 0.033730506896972656, 0.03539323806762695, 0.03705596923828125, 0.03871870040893555, 0.040381431579589844, 0.04204416275024414, 0.04370689392089844, 0.045369625091552734, 0.04703235626220703, 0.04869508743286133, 0.050357818603515625, 0.05202054977416992, 0.05368328094482422, 0.055346012115478516, 0.05700874328613281, 0.05867147445678711, 0.060334205627441406, 0.0619969367980957, 0.06365966796875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 23.0, 29.0, 59.0, 104.0, 149.0, 166.0, 131.0, 131.0, 83.0, 45.0, 23.0, 20.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2450764179229736, -2.180626153945923, -2.116175651550293, -2.051725387573242, -1.9872751235961914, -1.9228248596191406, -1.8583744764328003, -1.79392409324646, -1.7294738292694092, -1.6650235652923584, -1.600573182106018, -1.5361227989196777, -1.471672534942627, -1.4072222709655762, -1.3427718877792358, -1.2783215045928955, -1.2138712406158447, -1.149420976638794, -1.0849705934524536, -1.0205202102661133, -0.9560699462890625, -0.8916196227073669, -0.8271692991256714, -0.7627189755439758, -0.6982686519622803, -0.6338183283805847, -0.5693680047988892, -0.5049176812171936, -0.44046735763549805, -0.3760170340538025, -0.31156671047210693, -0.24711638689041138, -0.18266618251800537, -0.11821585893630981, -0.05376553535461426, 0.010684788227081299, 0.07513511180877686, 0.1395854353904724, 0.20403575897216797, 0.2684860825538635, 0.3329364061355591, 0.39738672971725464, 0.4618370532989502, 0.5262873768806458, 0.5907377004623413, 0.6551880240440369, 0.7196383476257324, 0.784088671207428, 0.8485389947891235, 0.9129893183708191, 0.9774396419525146, 1.0418899059295654, 1.1063402891159058, 1.170790672302246, 1.2352409362792969, 1.2996912002563477, 1.364141583442688, 1.4285919666290283, 1.493042230606079, 1.5574924945831299, 1.6219428777694702, 1.6863932609558105, 1.7508435249328613, 1.815293788909912, 1.8797441720962524]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 9.0, 12.0, 10.0, 7.0, 12.0, 15.0, 13.0, 15.0, 21.0, 27.0, 23.0, 45.0, 30.0, 36.0, 42.0, 38.0, 53.0, 41.0, 52.0, 37.0, 43.0, 53.0, 30.0, 49.0, 49.0, 29.0, 36.0, 31.0, 23.0, 10.0, 21.0, 17.0, 10.0, 15.0, 5.0, 7.0, 6.0, 2.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.8412993550300598, -0.8182972073554993, -0.795295000076294, -0.7722928524017334, -0.7492907047271729, -0.7262884974479675, -0.703286349773407, -0.6802841424942017, -0.6572819948196411, -0.6342798471450806, -0.6112776398658752, -0.5882754921913147, -0.5652733445167542, -0.5422711372375488, -0.5192689895629883, -0.49626681208610535, -0.4732646644115448, -0.45026248693466187, -0.4272603392601013, -0.4042581617832184, -0.38125598430633545, -0.3582538366317749, -0.33525165915489197, -0.31224948167800903, -0.2892473340034485, -0.26624515652656555, -0.2432429939508438, -0.22024083137512207, -0.19723865389823914, -0.1742364913225174, -0.15123432874679565, -0.12823215126991272, -0.10522997379302979, -0.08222780376672745, -0.05922563746571541, -0.03622347116470337, -0.013221301138401031, 0.009780868887901306, 0.03278303146362305, 0.05578520894050598, 0.07878737151622772, 0.10178954154253006, 0.1247917115688324, 0.14779387414455414, 0.17079603672027588, 0.1937982141971588, 0.21680037677288055, 0.2398025542497635, 0.26280471682548523, 0.28580689430236816, 0.3088090419769287, 0.33181121945381165, 0.3548133969306946, 0.3778155446052551, 0.40081772208213806, 0.423819899559021, 0.44682204723358154, 0.4698242247104645, 0.492826372385025, 0.515828549861908, 0.5388306975364685, 0.5618329048156738, 0.5848350524902344, 0.6078372001647949, 0.6308394074440002]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 7.0, 10.0, 9.0, 11.0, 23.0, 45.0, 49.0, 79.0, 149.0, 260.0, 505.0, 1256.0, 2892.0, 7996.0, 23085.0, 81999.0, 327430.0, 429229.0, 123624.0, 32535.0, 10454.0, 3826.0, 1603.0, 714.0, 317.0, 156.0, 98.0, 65.0, 24.0, 33.0, 18.0, 11.0, 11.0, 9.0, 7.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0560150146484375, -1.023162841796875, -0.9903106689453125, -0.95745849609375, -0.9246063232421875, -0.891754150390625, -0.8589019775390625, -0.8260498046875, -0.7931976318359375, -0.760345458984375, -0.7274932861328125, -0.69464111328125, -0.6617889404296875, -0.628936767578125, -0.5960845947265625, -0.563232421875, -0.5303802490234375, -0.497528076171875, -0.4646759033203125, -0.43182373046875, -0.3989715576171875, -0.366119384765625, -0.3332672119140625, -0.3004150390625, -0.2675628662109375, -0.234710693359375, -0.2018585205078125, -0.16900634765625, -0.1361541748046875, -0.103302001953125, -0.0704498291015625, -0.03759765625, -0.0047454833984375, 0.028106689453125, 0.0609588623046875, 0.09381103515625, 0.1266632080078125, 0.159515380859375, 0.1923675537109375, 0.2252197265625, 0.2580718994140625, 0.290924072265625, 0.3237762451171875, 0.35662841796875, 0.3894805908203125, 0.422332763671875, 0.4551849365234375, 0.488037109375, 0.5208892822265625, 0.553741455078125, 0.5865936279296875, 0.61944580078125, 0.6522979736328125, 0.685150146484375, 0.7180023193359375, 0.7508544921875, 0.7837066650390625, 0.816558837890625, 0.8494110107421875, 0.88226318359375, 0.9151153564453125, 0.947967529296875, 0.9808197021484375, 1.013671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 6.0, 11.0, 16.0, 5.0, 20.0, 14.0, 20.0, 22.0, 26.0, 25.0, 42.0, 35.0, 36.0, 27.0, 51.0, 60.0, 59.0, 37.0, 38.0, 44.0, 51.0, 39.0, 42.0, 34.0, 36.0, 32.0, 22.0, 25.0, 21.0, 14.0, 10.0, 9.0, 15.0, 8.0, 9.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.654296875, -1.6071319580078125, -1.559967041015625, -1.5128021240234375, -1.46563720703125, -1.4184722900390625, -1.371307373046875, -1.3241424560546875, -1.2769775390625, -1.2298126220703125, -1.182647705078125, -1.1354827880859375, -1.08831787109375, -1.0411529541015625, -0.993988037109375, -0.9468231201171875, -0.899658203125, -0.8524932861328125, -0.805328369140625, -0.7581634521484375, -0.71099853515625, -0.6638336181640625, -0.616668701171875, -0.5695037841796875, -0.5223388671875, -0.4751739501953125, -0.428009033203125, -0.3808441162109375, -0.33367919921875, -0.2865142822265625, -0.239349365234375, -0.1921844482421875, -0.14501953125, -0.0978546142578125, -0.050689697265625, -0.0035247802734375, 0.04364013671875, 0.0908050537109375, 0.137969970703125, 0.1851348876953125, 0.2322998046875, 0.2794647216796875, 0.326629638671875, 0.3737945556640625, 0.42095947265625, 0.4681243896484375, 0.515289306640625, 0.5624542236328125, 0.609619140625, 0.6567840576171875, 0.703948974609375, 0.7511138916015625, 0.79827880859375, 0.8454437255859375, 0.892608642578125, 0.9397735595703125, 0.9869384765625, 1.0341033935546875, 1.081268310546875, 1.1284332275390625, 1.17559814453125, 1.2227630615234375, 1.269927978515625, 1.3170928955078125, 1.3642578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 7.0, 13.0, 8.0, 15.0, 24.0, 23.0, 26.0, 26.0, 50.0, 53.0, 61.0, 81.0, 146.0, 177.0, 285.0, 1007.0, 22327.0, 958685.0, 62671.0, 1678.0, 349.0, 216.0, 136.0, 98.0, 79.0, 60.0, 39.0, 36.0, 28.0, 19.0, 12.0, 16.0, 7.0, 7.0, 13.0, 7.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-4.1484375, -4.0172119140625, -3.885986328125, -3.7547607421875, -3.62353515625, -3.4923095703125, -3.361083984375, -3.2298583984375, -3.0986328125, -2.9674072265625, -2.836181640625, -2.7049560546875, -2.57373046875, -2.4425048828125, -2.311279296875, -2.1800537109375, -2.048828125, -1.9176025390625, -1.786376953125, -1.6551513671875, -1.52392578125, -1.3927001953125, -1.261474609375, -1.1302490234375, -0.9990234375, -0.8677978515625, -0.736572265625, -0.6053466796875, -0.47412109375, -0.3428955078125, -0.211669921875, -0.0804443359375, 0.05078125, 0.1820068359375, 0.313232421875, 0.4444580078125, 0.57568359375, 0.7069091796875, 0.838134765625, 0.9693603515625, 1.1005859375, 1.2318115234375, 1.363037109375, 1.4942626953125, 1.62548828125, 1.7567138671875, 1.887939453125, 2.0191650390625, 2.150390625, 2.2816162109375, 2.412841796875, 2.5440673828125, 2.67529296875, 2.8065185546875, 2.937744140625, 3.0689697265625, 3.2001953125, 3.3314208984375, 3.462646484375, 3.5938720703125, 3.72509765625, 3.8563232421875, 3.987548828125, 4.1187744140625, 4.25]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 3.0, 6.0, 10.0, 11.0, 11.0, 11.0, 20.0, 27.0, 26.0, 40.0, 34.0, 35.0, 31.0, 37.0, 52.0, 41.0, 39.0, 48.0, 59.0, 55.0, 34.0, 52.0, 48.0, 44.0, 40.0, 38.0, 26.0, 18.0, 23.0, 14.0, 7.0, 12.0, 13.0, 3.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.90234375, -1.847564697265625, -1.79278564453125, -1.738006591796875, -1.6832275390625, -1.628448486328125, -1.57366943359375, -1.518890380859375, -1.464111328125, -1.409332275390625, -1.35455322265625, -1.299774169921875, -1.2449951171875, -1.190216064453125, -1.13543701171875, -1.080657958984375, -1.02587890625, -0.971099853515625, -0.91632080078125, -0.861541748046875, -0.8067626953125, -0.751983642578125, -0.69720458984375, -0.642425537109375, -0.587646484375, -0.532867431640625, -0.47808837890625, -0.423309326171875, -0.3685302734375, -0.313751220703125, -0.25897216796875, -0.204193115234375, -0.1494140625, -0.094635009765625, -0.03985595703125, 0.014923095703125, 0.0697021484375, 0.124481201171875, 0.17926025390625, 0.234039306640625, 0.288818359375, 0.343597412109375, 0.39837646484375, 0.453155517578125, 0.5079345703125, 0.562713623046875, 0.61749267578125, 0.672271728515625, 0.72705078125, 0.781829833984375, 0.83660888671875, 0.891387939453125, 0.9461669921875, 1.000946044921875, 1.05572509765625, 1.110504150390625, 1.165283203125, 1.220062255859375, 1.27484130859375, 1.329620361328125, 1.3843994140625, 1.439178466796875, 1.49395751953125, 1.548736572265625, 1.603515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 10.0, 15.0, 13.0, 23.0, 40.0, 60.0, 90.0, 155.0, 286.0, 631.0, 1253.0, 3240.0, 10457.0, 61093.0, 621494.0, 309585.0, 29466.0, 6505.0, 2201.0, 909.0, 438.0, 195.0, 110.0, 88.0, 54.0, 45.0, 21.0, 12.0, 12.0, 4.0, 7.0, 3.0, 3.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3806610107421875, -0.365325927734375, -0.3499908447265625, -0.33465576171875, -0.3193206787109375, -0.303985595703125, -0.2886505126953125, -0.2733154296875, -0.2579803466796875, -0.242645263671875, -0.2273101806640625, -0.21197509765625, -0.1966400146484375, -0.181304931640625, -0.1659698486328125, -0.150634765625, -0.1352996826171875, -0.119964599609375, -0.1046295166015625, -0.08929443359375, -0.0739593505859375, -0.058624267578125, -0.0432891845703125, -0.0279541015625, -0.0126190185546875, 0.002716064453125, 0.0180511474609375, 0.03338623046875, 0.0487213134765625, 0.064056396484375, 0.0793914794921875, 0.0947265625, 0.1100616455078125, 0.125396728515625, 0.1407318115234375, 0.15606689453125, 0.1714019775390625, 0.186737060546875, 0.2020721435546875, 0.2174072265625, 0.2327423095703125, 0.248077392578125, 0.2634124755859375, 0.27874755859375, 0.2940826416015625, 0.309417724609375, 0.3247528076171875, 0.340087890625, 0.3554229736328125, 0.370758056640625, 0.3860931396484375, 0.40142822265625, 0.4167633056640625, 0.432098388671875, 0.4474334716796875, 0.4627685546875, 0.4781036376953125, 0.493438720703125, 0.5087738037109375, 0.52410888671875, 0.5394439697265625, 0.554779052734375, 0.5701141357421875, 0.58544921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 12.0, 7.0, 16.0, 20.0, 22.0, 32.0, 48.0, 92.0, 114.0, 108.0, 128.0, 120.0, 76.0, 51.0, 41.0, 27.0, 14.0, 21.0, 8.0, 9.0, 8.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.282329559326172e-05, -6.074737757444382e-05, -5.8671459555625916e-05, -5.6595541536808014e-05, -5.451962351799011e-05, -5.244370549917221e-05, -5.036778748035431e-05, -4.829186946153641e-05, -4.6215951442718506e-05, -4.4140033423900604e-05, -4.20641154050827e-05, -3.99881973862648e-05, -3.79122793674469e-05, -3.5836361348629e-05, -3.3760443329811096e-05, -3.1684525310993195e-05, -2.9608607292175293e-05, -2.753268927335739e-05, -2.545677125453949e-05, -2.3380853235721588e-05, -2.1304935216903687e-05, -1.9229017198085785e-05, -1.7153099179267883e-05, -1.5077181160449982e-05, -1.300126314163208e-05, -1.0925345122814178e-05, -8.849427103996277e-06, -6.773509085178375e-06, -4.697591066360474e-06, -2.621673047542572e-06, -5.457550287246704e-07, 1.5301629900932312e-06, 3.606081008911133e-06, 5.6819990277290344e-06, 7.757917046546936e-06, 9.833835065364838e-06, 1.190975308418274e-05, 1.3985671103000641e-05, 1.6061589121818542e-05, 1.8137507140636444e-05, 2.0213425159454346e-05, 2.2289343178272247e-05, 2.436526119709015e-05, 2.644117921590805e-05, 2.8517097234725952e-05, 3.0593015253543854e-05, 3.2668933272361755e-05, 3.474485129117966e-05, 3.682076930999756e-05, 3.889668732881546e-05, 4.097260534763336e-05, 4.3048523366451263e-05, 4.5124441385269165e-05, 4.720035940408707e-05, 4.927627742290497e-05, 5.135219544172287e-05, 5.342811346054077e-05, 5.550403147935867e-05, 5.7579949498176575e-05, 5.9655867516994476e-05, 6.173178553581238e-05, 6.380770355463028e-05, 6.588362157344818e-05, 6.795953959226608e-05, 7.003545761108398e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 1.0, 7.0, 9.0, 5.0, 17.0, 14.0, 11.0, 29.0, 47.0, 65.0, 117.0, 236.0, 589.0, 1850.0, 7562.0, 52832.0, 667949.0, 288651.0, 22567.0, 4045.0, 1101.0, 388.0, 188.0, 91.0, 60.0, 25.0, 20.0, 18.0, 13.0, 10.0, 8.0, 12.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55078125, -0.5323028564453125, -0.513824462890625, -0.4953460693359375, -0.47686767578125, -0.4583892822265625, -0.439910888671875, -0.4214324951171875, -0.4029541015625, -0.3844757080078125, -0.365997314453125, -0.3475189208984375, -0.32904052734375, -0.3105621337890625, -0.292083740234375, -0.2736053466796875, -0.255126953125, -0.2366485595703125, -0.218170166015625, -0.1996917724609375, -0.18121337890625, -0.1627349853515625, -0.144256591796875, -0.1257781982421875, -0.1072998046875, -0.0888214111328125, -0.070343017578125, -0.0518646240234375, -0.03338623046875, -0.0149078369140625, 0.003570556640625, 0.0220489501953125, 0.04052734375, 0.0590057373046875, 0.077484130859375, 0.0959625244140625, 0.11444091796875, 0.1329193115234375, 0.151397705078125, 0.1698760986328125, 0.1883544921875, 0.2068328857421875, 0.225311279296875, 0.2437896728515625, 0.26226806640625, 0.2807464599609375, 0.299224853515625, 0.3177032470703125, 0.336181640625, 0.3546600341796875, 0.373138427734375, 0.3916168212890625, 0.41009521484375, 0.4285736083984375, 0.447052001953125, 0.4655303955078125, 0.4840087890625, 0.5024871826171875, 0.520965576171875, 0.5394439697265625, 0.55792236328125, 0.5764007568359375, 0.594879150390625, 0.6133575439453125, 0.6318359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 13.0, 8.0, 7.0, 14.0, 18.0, 24.0, 45.0, 51.0, 60.0, 71.0, 86.0, 98.0, 99.0, 80.0, 78.0, 58.0, 46.0, 36.0, 20.0, 19.0, 13.0, 7.0, 11.0, 3.0, 4.0, 2.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15454483032226562, -0.14917755126953125, -0.14381027221679688, -0.1384429931640625, -0.13307571411132812, -0.12770843505859375, -0.12234115600585938, -0.116973876953125, -0.11160659790039062, -0.10623931884765625, -0.10087203979492188, -0.0955047607421875, -0.09013748168945312, -0.08477020263671875, -0.07940292358398438, -0.07403564453125, -0.06866836547851562, -0.06330108642578125, -0.057933807373046875, -0.0525665283203125, -0.047199249267578125, -0.04183197021484375, -0.036464691162109375, -0.031097412109375, -0.025730133056640625, -0.02036285400390625, -0.014995574951171875, -0.0096282958984375, -0.004261016845703125, 0.00110626220703125, 0.006473541259765625, 0.0118408203125, 0.017208099365234375, 0.02257537841796875, 0.027942657470703125, 0.0333099365234375, 0.038677215576171875, 0.04404449462890625, 0.049411773681640625, 0.054779052734375, 0.060146331787109375, 0.06551361083984375, 0.07088088989257812, 0.0762481689453125, 0.08161544799804688, 0.08698272705078125, 0.09235000610351562, 0.09771728515625, 0.10308456420898438, 0.10845184326171875, 0.11381912231445312, 0.1191864013671875, 0.12455368041992188, 0.12992095947265625, 0.13528823852539062, 0.140655517578125, 0.14602279663085938, 0.15139007568359375, 0.15675735473632812, 0.1621246337890625, 0.16749191284179688, 0.17285919189453125, 0.17822647094726562, 0.18359375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 19.0, 35.0, 60.0, 116.0, 133.0, 144.0, 144.0, 118.0, 81.0, 53.0, 34.0, 11.0, 6.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.344545841217041, -4.219826698303223, -4.095107555389404, -3.970388650894165, -3.845669746398926, -3.7209506034851074, -3.596231460571289, -3.47151255607605, -3.3467936515808105, -3.222074508666992, -3.097355604171753, -2.9726364612579346, -2.8479175567626953, -2.723198413848877, -2.5984792709350586, -2.4737603664398193, -2.349041223526001, -2.2243220806121826, -2.0996031761169434, -1.974884033203125, -1.8501651287078857, -1.7254459857940674, -1.6007269620895386, -1.4760079383850098, -1.351288914680481, -1.2265698909759521, -1.1018508672714233, -0.9771317839622498, -0.852412760257721, -0.7276937365531921, -0.6029746532440186, -0.47825562953948975, -0.35353636741638184, -0.22881732881069183, -0.10409829020500183, 0.020620763301849365, 0.14533978700637817, 0.270058810710907, 0.39477789402008057, 0.5194969177246094, 0.6442159414291382, 0.768934965133667, 0.8936539888381958, 1.0183730125427246, 1.143092155456543, 1.2678110599517822, 1.3925302028656006, 1.5172492265701294, 1.6419682502746582, 1.766687273979187, 1.8914062976837158, 2.016125440597534, 2.1408443450927734, 2.265563488006592, 2.39028263092041, 2.5150015354156494, 2.6397204399108887, 2.764439582824707, 2.8891584873199463, 3.0138776302337646, 3.138596534729004, 3.2633156776428223, 3.3880348205566406, 3.51275372505188, 3.6374728679656982]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 11.0, 4.0, 11.0, 13.0, 14.0, 15.0, 21.0, 21.0, 24.0, 31.0, 29.0, 26.0, 33.0, 44.0, 46.0, 43.0, 52.0, 52.0, 51.0, 48.0, 47.0, 29.0, 46.0, 32.0, 42.0, 18.0, 33.0, 19.0, 27.0, 14.0, 24.0, 15.0, 17.0, 9.0, 4.0, 8.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.8090808391571045, -2.7263031005859375, -2.6435253620147705, -2.5607473850250244, -2.4779696464538574, -2.3951919078826904, -2.3124141693115234, -2.2296364307403564, -2.1468586921691895, -2.0640809535980225, -1.981303095817566, -1.898525357246399, -1.8157474994659424, -1.7329697608947754, -1.6501920223236084, -1.5674142837524414, -1.4846363067626953, -1.4018585681915283, -1.3190807104110718, -1.2363029718399048, -1.1535251140594482, -1.0707473754882812, -0.9879696369171143, -0.9051918387413025, -0.8224140405654907, -0.739636242389679, -0.6568584442138672, -0.5740807056427002, -0.4913029074668884, -0.40852510929107666, -0.3257473409175873, -0.2429695725440979, -0.16019177436828613, -0.07741399109363556, 0.005363792181015015, 0.08814157545566559, 0.17091935873031616, 0.25369715690612793, 0.3364749252796173, 0.4192526936531067, 0.5020304918289185, 0.5848082900047302, 0.667586088180542, 0.750363826751709, 0.8331416249275208, 0.9159194231033325, 0.9986971616744995, 1.081475019454956, 1.164252758026123, 1.24703049659729, 1.3298083543777466, 1.4125860929489136, 1.4953639507293701, 1.578141689300537, 1.660919427871704, 1.743697166442871, 1.8264750242233276, 1.9092527627944946, 1.9920306205749512, 2.074808359146118, 2.157586097717285, 2.2403640747070312, 2.3231418132781982, 2.4059195518493652, 2.4886972904205322]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 10.0, 8.0, 7.0, 6.0, 12.0, 18.0, 25.0, 33.0, 37.0, 50.0, 81.0, 126.0, 241.0, 496.0, 1175.0, 3010.0, 10224.0, 52328.0, 423901.0, 2222635.0, 1269760.0, 173115.0, 27468.0, 5915.0, 1946.0, 748.0, 349.0, 183.0, 121.0, 59.0, 49.0, 33.0, 23.0, 15.0, 15.0, 12.0, 7.0, 10.0, 6.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.72900390625, -1.6689453125, -1.60888671875, -1.548828125, -1.48876953125, -1.4287109375, -1.36865234375, -1.30859375, -1.24853515625, -1.1884765625, -1.12841796875, -1.068359375, -1.00830078125, -0.9482421875, -0.88818359375, -0.828125, -0.76806640625, -0.7080078125, -0.64794921875, -0.587890625, -0.52783203125, -0.4677734375, -0.40771484375, -0.34765625, -0.28759765625, -0.2275390625, -0.16748046875, -0.107421875, -0.04736328125, 0.0126953125, 0.07275390625, 0.1328125, 0.19287109375, 0.2529296875, 0.31298828125, 0.373046875, 0.43310546875, 0.4931640625, 0.55322265625, 0.61328125, 0.67333984375, 0.7333984375, 0.79345703125, 0.853515625, 0.91357421875, 0.9736328125, 1.03369140625, 1.09375, 1.15380859375, 1.2138671875, 1.27392578125, 1.333984375, 1.39404296875, 1.4541015625, 1.51416015625, 1.57421875, 1.63427734375, 1.6943359375, 1.75439453125, 1.814453125, 1.87451171875, 1.9345703125, 1.99462890625, 2.0546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 2.0, 12.0, 5.0, 16.0, 10.0, 19.0, 22.0, 15.0, 23.0, 29.0, 28.0, 30.0, 41.0, 44.0, 39.0, 31.0, 53.0, 49.0, 50.0, 63.0, 45.0, 34.0, 41.0, 32.0, 32.0, 27.0, 26.0, 21.0, 28.0, 16.0, 15.0, 14.0, 15.0, 10.0, 9.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0], "bins": [-1.2548828125, -1.2197799682617188, -1.1846771240234375, -1.1495742797851562, -1.114471435546875, -1.0793685913085938, -1.0442657470703125, -1.0091629028320312, -0.97406005859375, -0.9389572143554688, -0.9038543701171875, -0.8687515258789062, -0.833648681640625, -0.7985458374023438, -0.7634429931640625, -0.7283401489257812, -0.6932373046875, -0.6581344604492188, -0.6230316162109375, -0.5879287719726562, -0.552825927734375, -0.5177230834960938, -0.4826202392578125, -0.44751739501953125, -0.41241455078125, -0.37731170654296875, -0.3422088623046875, -0.30710601806640625, -0.272003173828125, -0.23690032958984375, -0.2017974853515625, -0.16669464111328125, -0.131591796875, -0.09648895263671875, -0.0613861083984375, -0.02628326416015625, 0.008819580078125, 0.04392242431640625, 0.0790252685546875, 0.11412811279296875, 0.14923095703125, 0.18433380126953125, 0.2194366455078125, 0.25453948974609375, 0.289642333984375, 0.32474517822265625, 0.3598480224609375, 0.39495086669921875, 0.4300537109375, 0.46515655517578125, 0.5002593994140625, 0.5353622436523438, 0.570465087890625, 0.6055679321289062, 0.6406707763671875, 0.6757736206054688, 0.71087646484375, 0.7459793090820312, 0.7810821533203125, 0.8161849975585938, 0.851287841796875, 0.8863906860351562, 0.9214935302734375, 0.9565963745117188, 0.99169921875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 15.0, 12.0, 24.0, 40.0, 44.0, 63.0, 92.0, 147.0, 311.0, 859.0, 8474.0, 3812617.0, 367463.0, 2920.0, 552.0, 234.0, 119.0, 82.0, 48.0, 53.0, 38.0, 15.0, 14.0, 3.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.39453125, -6.19976806640625, -6.0050048828125, -5.81024169921875, -5.615478515625, -5.42071533203125, -5.2259521484375, -5.03118896484375, -4.83642578125, -4.64166259765625, -4.4468994140625, -4.25213623046875, -4.057373046875, -3.86260986328125, -3.6678466796875, -3.47308349609375, -3.2783203125, -3.08355712890625, -2.8887939453125, -2.69403076171875, -2.499267578125, -2.30450439453125, -2.1097412109375, -1.91497802734375, -1.72021484375, -1.52545166015625, -1.3306884765625, -1.13592529296875, -0.941162109375, -0.74639892578125, -0.5516357421875, -0.35687255859375, -0.162109375, 0.03265380859375, 0.2274169921875, 0.42218017578125, 0.616943359375, 0.81170654296875, 1.0064697265625, 1.20123291015625, 1.39599609375, 1.59075927734375, 1.7855224609375, 1.98028564453125, 2.175048828125, 2.36981201171875, 2.5645751953125, 2.75933837890625, 2.9541015625, 3.14886474609375, 3.3436279296875, 3.53839111328125, 3.733154296875, 3.92791748046875, 4.1226806640625, 4.31744384765625, 4.51220703125, 4.70697021484375, 4.9017333984375, 5.09649658203125, 5.291259765625, 5.48602294921875, 5.6807861328125, 5.87554931640625, 6.0703125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 8.0, 4.0, 14.0, 17.0, 29.0, 31.0, 33.0, 48.0, 72.0, 99.0, 147.0, 177.0, 251.0, 348.0, 475.0, 470.0, 473.0, 343.0, 301.0, 204.0, 148.0, 103.0, 69.0, 50.0, 31.0, 24.0, 27.0, 22.0, 13.0, 10.0, 5.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39501953125, -0.3811798095703125, -0.367340087890625, -0.3535003662109375, -0.33966064453125, -0.3258209228515625, -0.311981201171875, -0.2981414794921875, -0.2843017578125, -0.2704620361328125, -0.256622314453125, -0.2427825927734375, -0.22894287109375, -0.2151031494140625, -0.201263427734375, -0.1874237060546875, -0.173583984375, -0.1597442626953125, -0.145904541015625, -0.1320648193359375, -0.11822509765625, -0.1043853759765625, -0.090545654296875, -0.0767059326171875, -0.0628662109375, -0.0490264892578125, -0.035186767578125, -0.0213470458984375, -0.00750732421875, 0.0063323974609375, 0.020172119140625, 0.0340118408203125, 0.0478515625, 0.0616912841796875, 0.075531005859375, 0.0893707275390625, 0.10321044921875, 0.1170501708984375, 0.130889892578125, 0.1447296142578125, 0.1585693359375, 0.1724090576171875, 0.186248779296875, 0.2000885009765625, 0.21392822265625, 0.2277679443359375, 0.241607666015625, 0.2554473876953125, 0.269287109375, 0.2831268310546875, 0.296966552734375, 0.3108062744140625, 0.32464599609375, 0.3384857177734375, 0.352325439453125, 0.3661651611328125, 0.3800048828125, 0.3938446044921875, 0.407684326171875, 0.4215240478515625, 0.43536376953125, 0.4492034912109375, 0.463043212890625, 0.4768829345703125, 0.49072265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 8.0, 10.0, 8.0, 20.0, 27.0, 60.0, 71.0, 114.0, 160.0, 134.0, 134.0, 110.0, 56.0, 44.0, 22.0, 14.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1752493381500244, -3.0769264698028564, -2.9786033630371094, -2.8802804946899414, -2.7819576263427734, -2.6836347579956055, -2.5853118896484375, -2.4869887828826904, -2.3886659145355225, -2.2903430461883545, -2.1920199394226074, -2.0936970710754395, -1.9953742027282715, -1.8970513343811035, -1.798728346824646, -1.7004053592681885, -1.6020824909210205, -1.5037596225738525, -1.405436635017395, -1.3071136474609375, -1.2087907791137695, -1.1104679107666016, -1.012144923210144, -0.9138219952583313, -0.8154990673065186, -0.7171761393547058, -0.6188532114028931, -0.5205302834510803, -0.4222073554992676, -0.32388442754745483, -0.2255614995956421, -0.12723857164382935, -0.0289154052734375, 0.06940752267837524, 0.167730450630188, 0.26605337858200073, 0.3643763065338135, 0.4626992344856262, 0.561022162437439, 0.6593450903892517, 0.7576680183410645, 0.8559909462928772, 0.9543138742446899, 1.0526368618011475, 1.1509597301483154, 1.2492825984954834, 1.347605586051941, 1.4459285736083984, 1.5442514419555664, 1.6425743103027344, 1.740897297859192, 1.8392202854156494, 1.9375431537628174, 2.0358660221099854, 2.1341891288757324, 2.2325119972229004, 2.3308348655700684, 2.4291577339172363, 2.5274806022644043, 2.6258037090301514, 2.7241265773773193, 2.8224494457244873, 2.9207725524902344, 3.0190954208374023, 3.1174182891845703]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 4.0, 5.0, 4.0, 7.0, 7.0, 6.0, 10.0, 9.0, 14.0, 16.0, 21.0, 25.0, 27.0, 27.0, 18.0, 32.0, 34.0, 33.0, 28.0, 37.0, 35.0, 45.0, 39.0, 37.0, 47.0, 36.0, 30.0, 39.0, 30.0, 34.0, 31.0, 28.0, 25.0, 24.0, 16.0, 17.0, 17.0, 15.0, 12.0, 12.0, 7.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.2031254768371582, -1.170365810394287, -1.137606143951416, -1.104846477508545, -1.0720868110656738, -1.0393271446228027, -1.0065674781799316, -0.9738078117370605, -0.9410481452941895, -0.9082884788513184, -0.8755288124084473, -0.8427691459655762, -0.8100094795227051, -0.777249813079834, -0.7444901466369629, -0.7117304801940918, -0.6789708137512207, -0.6462111473083496, -0.6134514808654785, -0.5806918144226074, -0.5479321479797363, -0.5151724815368652, -0.48241281509399414, -0.44965314865112305, -0.41689348220825195, -0.38413381576538086, -0.35137414932250977, -0.31861448287963867, -0.2858548164367676, -0.2530951499938965, -0.2203354835510254, -0.1875758171081543, -0.15481621026992798, -0.12205654382705688, -0.08929687738418579, -0.0565372109413147, -0.023777544498443604, 0.00898212194442749, 0.041741788387298584, 0.07450145483016968, 0.10726112127304077, 0.14002078771591187, 0.17278045415878296, 0.20554012060165405, 0.23829978704452515, 0.27105945348739624, 0.30381911993026733, 0.3365787863731384, 0.3693384528160095, 0.4020981192588806, 0.4348577857017517, 0.4676174521446228, 0.5003771185874939, 0.533136785030365, 0.5658964514732361, 0.5986561179161072, 0.6314157843589783, 0.6641754508018494, 0.6969351172447205, 0.7296947836875916, 0.7624544501304626, 0.7952141165733337, 0.8279737830162048, 0.8607334494590759, 0.893493115901947]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 6.0, 9.0, 7.0, 20.0, 34.0, 40.0, 65.0, 128.0, 216.0, 416.0, 769.0, 1751.0, 4728.0, 14130.0, 50591.0, 215598.0, 510488.0, 185466.0, 44124.0, 12497.0, 4235.0, 1635.0, 762.0, 362.0, 168.0, 115.0, 68.0, 37.0, 19.0, 20.0, 12.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4518890380859375, -0.436004638671875, -0.4201202392578125, -0.40423583984375, -0.3883514404296875, -0.372467041015625, -0.3565826416015625, -0.3406982421875, -0.3248138427734375, -0.308929443359375, -0.2930450439453125, -0.27716064453125, -0.2612762451171875, -0.245391845703125, -0.2295074462890625, -0.213623046875, -0.1977386474609375, -0.181854248046875, -0.1659698486328125, -0.15008544921875, -0.1342010498046875, -0.118316650390625, -0.1024322509765625, -0.0865478515625, -0.0706634521484375, -0.054779052734375, -0.0388946533203125, -0.02301025390625, -0.0071258544921875, 0.008758544921875, 0.0246429443359375, 0.04052734375, 0.0564117431640625, 0.072296142578125, 0.0881805419921875, 0.10406494140625, 0.1199493408203125, 0.135833740234375, 0.1517181396484375, 0.1676025390625, 0.1834869384765625, 0.199371337890625, 0.2152557373046875, 0.23114013671875, 0.2470245361328125, 0.262908935546875, 0.2787933349609375, 0.294677734375, 0.3105621337890625, 0.326446533203125, 0.3423309326171875, 0.35821533203125, 0.3740997314453125, 0.389984130859375, 0.4058685302734375, 0.4217529296875, 0.4376373291015625, 0.453521728515625, 0.4694061279296875, 0.48529052734375, 0.5011749267578125, 0.517059326171875, 0.5329437255859375, 0.548828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 6.0, 9.0, 7.0, 6.0, 4.0, 11.0, 20.0, 28.0, 19.0, 33.0, 37.0, 45.0, 29.0, 33.0, 36.0, 55.0, 42.0, 47.0, 61.0, 54.0, 44.0, 31.0, 33.0, 41.0, 38.0, 31.0, 26.0, 26.0, 15.0, 18.0, 16.0, 14.0, 13.0, 10.0, 5.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.86328125, -0.8398056030273438, -0.8163299560546875, -0.7928543090820312, -0.769378662109375, -0.7459030151367188, -0.7224273681640625, -0.6989517211914062, -0.67547607421875, -0.6520004272460938, -0.6285247802734375, -0.6050491333007812, -0.581573486328125, -0.5580978393554688, -0.5346221923828125, -0.5111465454101562, -0.4876708984375, -0.46419525146484375, -0.4407196044921875, -0.41724395751953125, -0.393768310546875, -0.37029266357421875, -0.3468170166015625, -0.32334136962890625, -0.29986572265625, -0.27639007568359375, -0.2529144287109375, -0.22943878173828125, -0.205963134765625, -0.18248748779296875, -0.1590118408203125, -0.13553619384765625, -0.112060546875, -0.08858489990234375, -0.0651092529296875, -0.04163360595703125, -0.018157958984375, 0.00531768798828125, 0.0287933349609375, 0.05226898193359375, 0.07574462890625, 0.09922027587890625, 0.1226959228515625, 0.14617156982421875, 0.169647216796875, 0.19312286376953125, 0.2165985107421875, 0.24007415771484375, 0.2635498046875, 0.28702545166015625, 0.3105010986328125, 0.33397674560546875, 0.357452392578125, 0.38092803955078125, 0.4044036865234375, 0.42787933349609375, 0.45135498046875, 0.47483062744140625, 0.4983062744140625, 0.5217819213867188, 0.545257568359375, 0.5687332153320312, 0.5922088623046875, 0.6156845092773438, 0.63916015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 11.0, 7.0, 11.0, 16.0, 27.0, 24.0, 48.0, 57.0, 87.0, 133.0, 207.0, 323.0, 549.0, 1030.0, 2109.0, 4743.0, 11339.0, 29674.0, 79582.0, 208538.0, 359452.0, 215936.0, 82030.0, 30967.0, 12064.0, 4842.0, 2177.0, 1013.0, 576.0, 330.0, 188.0, 109.0, 90.0, 74.0, 36.0, 36.0, 31.0, 16.0, 8.0, 10.0, 9.0, 11.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.359375, -0.3483238220214844, -0.33727264404296875, -0.3262214660644531, -0.3151702880859375, -0.3041191101074219, -0.29306793212890625, -0.2820167541503906, -0.270965576171875, -0.2599143981933594, -0.24886322021484375, -0.23781204223632812, -0.2267608642578125, -0.21570968627929688, -0.20465850830078125, -0.19360733032226562, -0.18255615234375, -0.17150497436523438, -0.16045379638671875, -0.14940261840820312, -0.1383514404296875, -0.12730026245117188, -0.11624908447265625, -0.10519790649414062, -0.094146728515625, -0.08309555053710938, -0.07204437255859375, -0.060993194580078125, -0.0499420166015625, -0.038890838623046875, -0.02783966064453125, -0.016788482666015625, -0.0057373046875, 0.005313873291015625, 0.01636505126953125, 0.027416229248046875, 0.0384674072265625, 0.049518585205078125, 0.06056976318359375, 0.07162094116210938, 0.082672119140625, 0.09372329711914062, 0.10477447509765625, 0.11582565307617188, 0.1268768310546875, 0.13792800903320312, 0.14897918701171875, 0.16003036499023438, 0.17108154296875, 0.18213272094726562, 0.19318389892578125, 0.20423507690429688, 0.2152862548828125, 0.22633743286132812, 0.23738861083984375, 0.24843978881835938, 0.259490966796875, 0.2705421447753906, 0.28159332275390625, 0.2926445007324219, 0.3036956787109375, 0.3147468566894531, 0.32579803466796875, 0.3368492126464844, 0.347900390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 11.0, 19.0, 27.0, 13.0, 23.0, 24.0, 26.0, 38.0, 37.0, 40.0, 57.0, 55.0, 38.0, 47.0, 64.0, 53.0, 54.0, 55.0, 46.0, 49.0, 26.0, 25.0, 20.0, 16.0, 14.0, 16.0, 14.0, 14.0, 14.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.48828125, -1.4355926513671875, -1.382904052734375, -1.3302154541015625, -1.27752685546875, -1.2248382568359375, -1.172149658203125, -1.1194610595703125, -1.0667724609375, -1.0140838623046875, -0.961395263671875, -0.9087066650390625, -0.85601806640625, -0.8033294677734375, -0.750640869140625, -0.6979522705078125, -0.645263671875, -0.5925750732421875, -0.539886474609375, -0.4871978759765625, -0.43450927734375, -0.3818206787109375, -0.329132080078125, -0.2764434814453125, -0.2237548828125, -0.1710662841796875, -0.118377685546875, -0.0656890869140625, -0.01300048828125, 0.0396881103515625, 0.092376708984375, 0.1450653076171875, 0.19775390625, 0.2504425048828125, 0.303131103515625, 0.3558197021484375, 0.40850830078125, 0.4611968994140625, 0.513885498046875, 0.5665740966796875, 0.6192626953125, 0.6719512939453125, 0.724639892578125, 0.7773284912109375, 0.83001708984375, 0.8827056884765625, 0.935394287109375, 0.9880828857421875, 1.040771484375, 1.0934600830078125, 1.146148681640625, 1.1988372802734375, 1.25152587890625, 1.3042144775390625, 1.356903076171875, 1.4095916748046875, 1.4622802734375, 1.5149688720703125, 1.567657470703125, 1.6203460693359375, 1.67303466796875, 1.7257232666015625, 1.778411865234375, 1.8311004638671875, 1.8837890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 14.0, 16.0, 32.0, 55.0, 89.0, 171.0, 313.0, 730.0, 1837.0, 5362.0, 21754.0, 213525.0, 719323.0, 68492.0, 11265.0, 3202.0, 1211.0, 530.0, 277.0, 126.0, 91.0, 45.0, 29.0, 14.0, 10.0, 10.0, 9.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2935752868652344, -0.28148651123046875, -0.2693977355957031, -0.2573089599609375, -0.24522018432617188, -0.23313140869140625, -0.22104263305664062, -0.208953857421875, -0.19686508178710938, -0.18477630615234375, -0.17268753051757812, -0.1605987548828125, -0.14850997924804688, -0.13642120361328125, -0.12433242797851562, -0.11224365234375, -0.10015487670898438, -0.08806610107421875, -0.07597732543945312, -0.0638885498046875, -0.051799774169921875, -0.03971099853515625, -0.027622222900390625, -0.015533447265625, -0.003444671630859375, 0.00864410400390625, 0.020732879638671875, 0.0328216552734375, 0.044910430908203125, 0.05699920654296875, 0.06908798217773438, 0.0811767578125, 0.09326553344726562, 0.10535430908203125, 0.11744308471679688, 0.1295318603515625, 0.14162063598632812, 0.15370941162109375, 0.16579818725585938, 0.177886962890625, 0.18997573852539062, 0.20206451416015625, 0.21415328979492188, 0.2262420654296875, 0.23833084106445312, 0.25041961669921875, 0.2625083923339844, 0.27459716796875, 0.2866859436035156, 0.29877471923828125, 0.3108634948730469, 0.3229522705078125, 0.3350410461425781, 0.34712982177734375, 0.3592185974121094, 0.371307373046875, 0.3833961486816406, 0.39548492431640625, 0.4075736999511719, 0.4196624755859375, 0.4317512512207031, 0.44384002685546875, 0.4559288024902344, 0.468017578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 9.0, 21.0, 20.0, 37.0, 42.0, 74.0, 108.0, 109.0, 138.0, 128.0, 82.0, 45.0, 40.0, 38.0, 21.0, 13.0, 12.0, 11.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010085105895996094, -9.781122207641602e-05, -9.47713851928711e-05, -9.173154830932617e-05, -8.869171142578125e-05, -8.565187454223633e-05, -8.26120376586914e-05, -7.957220077514648e-05, -7.653236389160156e-05, -7.349252700805664e-05, -7.045269012451172e-05, -6.74128532409668e-05, -6.437301635742188e-05, -6.133317947387695e-05, -5.829334259033203e-05, -5.525350570678711e-05, -5.221366882324219e-05, -4.9173831939697266e-05, -4.6133995056152344e-05, -4.309415817260742e-05, -4.00543212890625e-05, -3.701448440551758e-05, -3.3974647521972656e-05, -3.0934810638427734e-05, -2.7894973754882812e-05, -2.485513687133789e-05, -2.181529998779297e-05, -1.8775463104248047e-05, -1.5735626220703125e-05, -1.2695789337158203e-05, -9.655952453613281e-06, -6.616115570068359e-06, -3.5762786865234375e-06, -5.364418029785156e-07, 2.5033950805664062e-06, 5.543231964111328e-06, 8.58306884765625e-06, 1.1622905731201172e-05, 1.4662742614746094e-05, 1.7702579498291016e-05, 2.0742416381835938e-05, 2.378225326538086e-05, 2.682209014892578e-05, 2.9861927032470703e-05, 3.2901763916015625e-05, 3.594160079956055e-05, 3.898143768310547e-05, 4.202127456665039e-05, 4.506111145019531e-05, 4.8100948333740234e-05, 5.1140785217285156e-05, 5.418062210083008e-05, 5.7220458984375e-05, 6.026029586791992e-05, 6.330013275146484e-05, 6.633996963500977e-05, 6.937980651855469e-05, 7.241964340209961e-05, 7.545948028564453e-05, 7.849931716918945e-05, 8.153915405273438e-05, 8.45789909362793e-05, 8.761882781982422e-05, 9.065866470336914e-05, 9.369850158691406e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 10.0, 3.0, 10.0, 17.0, 13.0, 21.0, 36.0, 40.0, 69.0, 126.0, 321.0, 688.0, 2255.0, 11477.0, 143290.0, 804978.0, 74876.0, 7550.0, 1669.0, 537.0, 246.0, 118.0, 66.0, 41.0, 17.0, 21.0, 15.0, 10.0, 10.0, 13.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.443603515625, -0.42990875244140625, -0.4162139892578125, -0.40251922607421875, -0.388824462890625, -0.37512969970703125, -0.3614349365234375, -0.34774017333984375, -0.33404541015625, -0.32035064697265625, -0.3066558837890625, -0.29296112060546875, -0.279266357421875, -0.26557159423828125, -0.2518768310546875, -0.23818206787109375, -0.2244873046875, -0.21079254150390625, -0.1970977783203125, -0.18340301513671875, -0.169708251953125, -0.15601348876953125, -0.1423187255859375, -0.12862396240234375, -0.11492919921875, -0.10123443603515625, -0.0875396728515625, -0.07384490966796875, -0.060150146484375, -0.04645538330078125, -0.0327606201171875, -0.01906585693359375, -0.00537109375, 0.00832366943359375, 0.0220184326171875, 0.03571319580078125, 0.049407958984375, 0.06310272216796875, 0.0767974853515625, 0.09049224853515625, 0.10418701171875, 0.11788177490234375, 0.1315765380859375, 0.14527130126953125, 0.158966064453125, 0.17266082763671875, 0.1863555908203125, 0.20005035400390625, 0.2137451171875, 0.22743988037109375, 0.2411346435546875, 0.25482940673828125, 0.268524169921875, 0.28221893310546875, 0.2959136962890625, 0.30960845947265625, 0.32330322265625, 0.33699798583984375, 0.3506927490234375, 0.36438751220703125, 0.378082275390625, 0.39177703857421875, 0.4054718017578125, 0.41916656494140625, 0.432861328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 12.0, 9.0, 15.0, 14.0, 25.0, 31.0, 58.0, 53.0, 84.0, 97.0, 115.0, 111.0, 86.0, 66.0, 45.0, 49.0, 33.0, 15.0, 14.0, 11.0, 7.0, 2.0, 12.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07176780700683594, -0.06956100463867188, -0.06735420227050781, -0.06514739990234375, -0.06294059753417969, -0.060733795166015625, -0.05852699279785156, -0.0563201904296875, -0.05411338806152344, -0.051906585693359375, -0.04969978332519531, -0.04749298095703125, -0.04528617858886719, -0.043079376220703125, -0.04087257385253906, -0.038665771484375, -0.03645896911621094, -0.034252166748046875, -0.03204536437988281, -0.02983856201171875, -0.027631759643554688, -0.025424957275390625, -0.023218154907226562, -0.0210113525390625, -0.018804550170898438, -0.016597747802734375, -0.014390945434570312, -0.01218414306640625, -0.009977340698242188, -0.007770538330078125, -0.0055637359619140625, -0.00335693359375, -0.0011501312255859375, 0.001056671142578125, 0.0032634735107421875, 0.00547027587890625, 0.0076770782470703125, 0.009883880615234375, 0.012090682983398438, 0.0142974853515625, 0.016504287719726562, 0.018711090087890625, 0.020917892456054688, 0.02312469482421875, 0.025331497192382812, 0.027538299560546875, 0.029745101928710938, 0.031951904296875, 0.03415870666503906, 0.036365509033203125, 0.03857231140136719, 0.04077911376953125, 0.04298591613769531, 0.045192718505859375, 0.04739952087402344, 0.0496063232421875, 0.05181312561035156, 0.054019927978515625, 0.05622673034667969, 0.05843353271484375, 0.06064033508300781, 0.06284713745117188, 0.06505393981933594, 0.0672607421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 11.0, 11.0, 19.0, 29.0, 51.0, 106.0, 163.0, 177.0, 164.0, 111.0, 65.0, 51.0, 18.0, 8.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3199594020843506, -2.2529542446136475, -2.1859488487243652, -2.118943691253662, -2.05193829536438, -1.9849331378936768, -1.917927861213684, -1.8509225845336914, -1.7839174270629883, -1.7169121503829956, -1.649906873703003, -1.5829017162322998, -1.5158964395523071, -1.4488911628723145, -1.3818858861923218, -1.314880609512329, -1.2478753328323364, -1.1808700561523438, -1.113864779472351, -1.0468595027923584, -0.9798543453216553, -0.9128490686416626, -0.8458437919616699, -0.7788385152816772, -0.7118332982063293, -0.6448280215263367, -0.5778228044509888, -0.5108175277709961, -0.4438122808933258, -0.3768070340156555, -0.30980175733566284, -0.24279651045799255, -0.17579138278961182, -0.10878612846136093, -0.041780874133110046, 0.025224387645721436, 0.09222963452339172, 0.159234881401062, 0.2262401580810547, 0.293245404958725, 0.36025065183639526, 0.42725589871406555, 0.49426114559173584, 0.5612664222717285, 0.6282716989517212, 0.6952769160270691, 0.7622821927070618, 0.8292874097824097, 0.8962926864624023, 0.963297963142395, 1.0303032398223877, 1.0973083972930908, 1.1643136739730835, 1.2313189506530762, 1.2983242273330688, 1.3653295040130615, 1.4323346614837646, 1.4993399381637573, 1.56634521484375, 1.6333503723144531, 1.7003556489944458, 1.7673609256744385, 1.8343662023544312, 1.9013714790344238, 1.9683767557144165]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 12.0, 10.0, 4.0, 12.0, 15.0, 18.0, 23.0, 30.0, 30.0, 49.0, 53.0, 58.0, 45.0, 58.0, 74.0, 58.0, 56.0, 61.0, 52.0, 40.0, 49.0, 38.0, 26.0, 32.0, 16.0, 21.0, 16.0, 16.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.267939567565918, -1.23697030544281, -1.2060011625289917, -1.1750319004058838, -1.1440626382827759, -1.113093376159668, -1.0821242332458496, -1.0511549711227417, -1.0201857089996338, -0.9892165064811707, -0.9582472443580627, -0.9272780418395996, -0.8963087797164917, -0.8653395771980286, -0.8343703746795654, -0.8034011125564575, -0.7724319100379944, -0.7414627075195312, -0.7104934453964233, -0.6795242428779602, -0.6485549807548523, -0.6175857782363892, -0.5866165161132812, -0.5556473135948181, -0.524678111076355, -0.49370887875556946, -0.46273964643478394, -0.4317704439163208, -0.4008011817932129, -0.36983197927474976, -0.33886274695396423, -0.3078935146331787, -0.2769242525100708, -0.24595502018928528, -0.21498578786849976, -0.18401657044887543, -0.1530473381280899, -0.12207810580730438, -0.09110888838768005, -0.06013965606689453, -0.02917042374610901, 0.0017988048493862152, 0.03276803344488144, 0.06373725831508636, 0.09470649063587189, 0.1256757229566574, 0.15664494037628174, 0.18761417269706726, 0.21858340501785278, 0.2495526373386383, 0.28052186965942383, 0.31149107217788696, 0.3424603343009949, 0.373429536819458, 0.40439876914024353, 0.43536800146102905, 0.4663372337818146, 0.4973064661026001, 0.5282756686210632, 0.5592449307441711, 0.5902141332626343, 0.6211833953857422, 0.6521525979042053, 0.6831218004226685, 0.7140910625457764]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 9.0, 16.0, 22.0, 31.0, 44.0, 91.0, 187.0, 3338.0, 765579.0, 277519.0, 1356.0, 135.0, 82.0, 45.0, 34.0, 23.0, 12.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.17578125, -6.031768798828125, -5.88775634765625, -5.743743896484375, -5.5997314453125, -5.455718994140625, -5.31170654296875, -5.167694091796875, -5.023681640625, -4.879669189453125, -4.73565673828125, -4.591644287109375, -4.4476318359375, -4.303619384765625, -4.15960693359375, -4.015594482421875, -3.87158203125, -3.727569580078125, -3.58355712890625, -3.439544677734375, -3.2955322265625, -3.151519775390625, -3.00750732421875, -2.863494873046875, -2.719482421875, -2.575469970703125, -2.43145751953125, -2.287445068359375, -2.1434326171875, -1.999420166015625, -1.85540771484375, -1.711395263671875, -1.5673828125, -1.423370361328125, -1.27935791015625, -1.135345458984375, -0.9913330078125, -0.847320556640625, -0.70330810546875, -0.559295654296875, -0.415283203125, -0.271270751953125, -0.12725830078125, 0.016754150390625, 0.1607666015625, 0.304779052734375, 0.44879150390625, 0.592803955078125, 0.73681640625, 0.880828857421875, 1.02484130859375, 1.168853759765625, 1.3128662109375, 1.456878662109375, 1.60089111328125, 1.744903564453125, 1.888916015625, 2.032928466796875, 2.17694091796875, 2.320953369140625, 2.4649658203125, 2.608978271484375, 2.75299072265625, 2.897003173828125, 3.041015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 9.0, 17.0, 20.0, 33.0, 38.0, 63.0, 70.0, 111.0, 83.0, 106.0, 95.0, 108.0, 62.0, 49.0, 40.0, 33.0, 24.0, 11.0, 11.0, 7.0, 7.0], "bins": [-5.59765625, -5.4905242919921875, -5.383392333984375, -5.2762603759765625, -5.16912841796875, -5.0619964599609375, -4.954864501953125, -4.8477325439453125, -4.7406005859375, -4.6334686279296875, -4.526336669921875, -4.4192047119140625, -4.31207275390625, -4.2049407958984375, -4.097808837890625, -3.9906768798828125, -3.883544921875, -3.7764129638671875, -3.669281005859375, -3.5621490478515625, -3.45501708984375, -3.3478851318359375, -3.240753173828125, -3.1336212158203125, -3.0264892578125, -2.9193572998046875, -2.812225341796875, -2.7050933837890625, -2.59796142578125, -2.4908294677734375, -2.383697509765625, -2.2765655517578125, -2.16943359375, -2.0623016357421875, -1.955169677734375, -1.8480377197265625, -1.74090576171875, -1.6337738037109375, -1.526641845703125, -1.4195098876953125, -1.3123779296875, -1.2052459716796875, -1.098114013671875, -0.9909820556640625, -0.88385009765625, -0.7767181396484375, -0.669586181640625, -0.5624542236328125, -0.455322265625, -0.3481903076171875, -0.241058349609375, -0.1339263916015625, -0.02679443359375, 0.0803375244140625, 0.187469482421875, 0.2946014404296875, 0.4017333984375, 0.5088653564453125, 0.615997314453125, 0.7231292724609375, 0.83026123046875, 0.9373931884765625, 1.044525146484375, 1.1516571044921875, 1.2587890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 13.0, 14.0, 10.0, 24.0, 22.0, 33.0, 30.0, 54.0, 53.0, 71.0, 83.0, 94.0, 143.0, 165.0, 208.0, 323.0, 688.0, 4927.0, 130685.0, 838407.0, 67404.0, 3239.0, 574.0, 294.0, 187.0, 136.0, 126.0, 109.0, 79.0, 75.0, 61.0, 43.0, 33.0, 33.0, 28.0, 19.0, 11.0, 9.0, 8.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-2.453125, -2.3818359375, -2.310546875, -2.2392578125, -2.16796875, -2.0966796875, -2.025390625, -1.9541015625, -1.8828125, -1.8115234375, -1.740234375, -1.6689453125, -1.59765625, -1.5263671875, -1.455078125, -1.3837890625, -1.3125, -1.2412109375, -1.169921875, -1.0986328125, -1.02734375, -0.9560546875, -0.884765625, -0.8134765625, -0.7421875, -0.6708984375, -0.599609375, -0.5283203125, -0.45703125, -0.3857421875, -0.314453125, -0.2431640625, -0.171875, -0.1005859375, -0.029296875, 0.0419921875, 0.11328125, 0.1845703125, 0.255859375, 0.3271484375, 0.3984375, 0.4697265625, 0.541015625, 0.6123046875, 0.68359375, 0.7548828125, 0.826171875, 0.8974609375, 0.96875, 1.0400390625, 1.111328125, 1.1826171875, 1.25390625, 1.3251953125, 1.396484375, 1.4677734375, 1.5390625, 1.6103515625, 1.681640625, 1.7529296875, 1.82421875, 1.8955078125, 1.966796875, 2.0380859375, 2.109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 5.0, 13.0, 15.0, 13.0, 18.0, 19.0, 20.0, 18.0, 16.0, 37.0, 30.0, 23.0, 47.0, 38.0, 28.0, 33.0, 38.0, 32.0, 45.0, 46.0, 48.0, 48.0, 45.0, 37.0, 24.0, 33.0, 30.0, 21.0, 31.0, 21.0, 15.0, 15.0, 11.0, 12.0, 8.0, 8.0, 12.0, 6.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.470703125, -1.4264984130859375, -1.382293701171875, -1.3380889892578125, -1.29388427734375, -1.2496795654296875, -1.205474853515625, -1.1612701416015625, -1.1170654296875, -1.0728607177734375, -1.028656005859375, -0.9844512939453125, -0.94024658203125, -0.8960418701171875, -0.851837158203125, -0.8076324462890625, -0.763427734375, -0.7192230224609375, -0.675018310546875, -0.6308135986328125, -0.58660888671875, -0.5424041748046875, -0.498199462890625, -0.4539947509765625, -0.4097900390625, -0.3655853271484375, -0.321380615234375, -0.2771759033203125, -0.23297119140625, -0.1887664794921875, -0.144561767578125, -0.1003570556640625, -0.05615234375, -0.0119476318359375, 0.032257080078125, 0.0764617919921875, 0.12066650390625, 0.1648712158203125, 0.209075927734375, 0.2532806396484375, 0.2974853515625, 0.3416900634765625, 0.385894775390625, 0.4300994873046875, 0.47430419921875, 0.5185089111328125, 0.562713623046875, 0.6069183349609375, 0.651123046875, 0.6953277587890625, 0.739532470703125, 0.7837371826171875, 0.82794189453125, 0.8721466064453125, 0.916351318359375, 0.9605560302734375, 1.0047607421875, 1.0489654541015625, 1.093170166015625, 1.1373748779296875, 1.18157958984375, 1.2257843017578125, 1.269989013671875, 1.3141937255859375, 1.3583984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 17.0, 14.0, 31.0, 38.0, 52.0, 77.0, 150.0, 290.0, 955.0, 4834.0, 51830.0, 695051.0, 276462.0, 15529.0, 2167.0, 534.0, 197.0, 93.0, 60.0, 41.0, 30.0, 32.0, 16.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5264053344726562, -0.5108184814453125, -0.49523162841796875, -0.479644775390625, -0.46405792236328125, -0.4484710693359375, -0.43288421630859375, -0.41729736328125, -0.40171051025390625, -0.3861236572265625, -0.37053680419921875, -0.354949951171875, -0.33936309814453125, -0.3237762451171875, -0.30818939208984375, -0.2926025390625, -0.27701568603515625, -0.2614288330078125, -0.24584197998046875, -0.230255126953125, -0.21466827392578125, -0.1990814208984375, -0.18349456787109375, -0.16790771484375, -0.15232086181640625, -0.1367340087890625, -0.12114715576171875, -0.105560302734375, -0.08997344970703125, -0.0743865966796875, -0.05879974365234375, -0.043212890625, -0.02762603759765625, -0.0120391845703125, 0.00354766845703125, 0.019134521484375, 0.03472137451171875, 0.0503082275390625, 0.06589508056640625, 0.08148193359375, 0.09706878662109375, 0.1126556396484375, 0.12824249267578125, 0.143829345703125, 0.15941619873046875, 0.1750030517578125, 0.19058990478515625, 0.2061767578125, 0.22176361083984375, 0.2373504638671875, 0.25293731689453125, 0.268524169921875, 0.28411102294921875, 0.2996978759765625, 0.31528472900390625, 0.33087158203125, 0.34645843505859375, 0.3620452880859375, 0.37763214111328125, 0.393218994140625, 0.40880584716796875, 0.4243927001953125, 0.43997955322265625, 0.45556640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 10.0, 8.0, 15.0, 13.0, 14.0, 27.0, 33.0, 36.0, 47.0, 58.0, 59.0, 69.0, 66.0, 86.0, 72.0, 67.0, 64.0, 43.0, 42.0, 34.0, 37.0, 14.0, 19.0, 10.0, 12.0, 8.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.190206527709961e-05, -4.078354686498642e-05, -3.966502845287323e-05, -3.854651004076004e-05, -3.742799162864685e-05, -3.630947321653366e-05, -3.519095480442047e-05, -3.407243639230728e-05, -3.295391798019409e-05, -3.18353995680809e-05, -3.071688115596771e-05, -2.9598362743854523e-05, -2.8479844331741333e-05, -2.7361325919628143e-05, -2.6242807507514954e-05, -2.5124289095401764e-05, -2.4005770683288574e-05, -2.2887252271175385e-05, -2.1768733859062195e-05, -2.0650215446949005e-05, -1.9531697034835815e-05, -1.8413178622722626e-05, -1.7294660210609436e-05, -1.6176141798496246e-05, -1.5057623386383057e-05, -1.3939104974269867e-05, -1.2820586562156677e-05, -1.1702068150043488e-05, -1.0583549737930298e-05, -9.465031325817108e-06, -8.346512913703918e-06, -7.227994501590729e-06, -6.109476089477539e-06, -4.990957677364349e-06, -3.87243926525116e-06, -2.75392085313797e-06, -1.6354024410247803e-06, -5.168840289115906e-07, 6.016343832015991e-07, 1.7201527953147888e-06, 2.8386712074279785e-06, 3.957189619541168e-06, 5.075708031654358e-06, 6.194226443767548e-06, 7.312744855880737e-06, 8.431263267993927e-06, 9.549781680107117e-06, 1.0668300092220306e-05, 1.1786818504333496e-05, 1.2905336916446686e-05, 1.4023855328559875e-05, 1.5142373740673065e-05, 1.6260892152786255e-05, 1.7379410564899445e-05, 1.8497928977012634e-05, 1.9616447389125824e-05, 2.0734965801239014e-05, 2.1853484213352203e-05, 2.2972002625465393e-05, 2.4090521037578583e-05, 2.5209039449691772e-05, 2.6327557861804962e-05, 2.7446076273918152e-05, 2.856459468603134e-05, 2.968311309814453e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 8.0, 11.0, 11.0, 25.0, 22.0, 45.0, 56.0, 124.0, 257.0, 721.0, 3291.0, 43525.0, 898314.0, 96028.0, 4573.0, 864.0, 288.0, 154.0, 86.0, 56.0, 34.0, 16.0, 17.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7004547119140625, -0.676788330078125, -0.6531219482421875, -0.62945556640625, -0.6057891845703125, -0.582122802734375, -0.5584564208984375, -0.5347900390625, -0.5111236572265625, -0.487457275390625, -0.4637908935546875, -0.44012451171875, -0.4164581298828125, -0.392791748046875, -0.3691253662109375, -0.345458984375, -0.3217926025390625, -0.298126220703125, -0.2744598388671875, -0.25079345703125, -0.2271270751953125, -0.203460693359375, -0.1797943115234375, -0.1561279296875, -0.1324615478515625, -0.108795166015625, -0.0851287841796875, -0.06146240234375, -0.0377960205078125, -0.014129638671875, 0.0095367431640625, 0.033203125, 0.0568695068359375, 0.080535888671875, 0.1042022705078125, 0.12786865234375, 0.1515350341796875, 0.175201416015625, 0.1988677978515625, 0.2225341796875, 0.2462005615234375, 0.269866943359375, 0.2935333251953125, 0.31719970703125, 0.3408660888671875, 0.364532470703125, 0.3881988525390625, 0.411865234375, 0.4355316162109375, 0.459197998046875, 0.4828643798828125, 0.50653076171875, 0.5301971435546875, 0.553863525390625, 0.5775299072265625, 0.6011962890625, 0.6248626708984375, 0.648529052734375, 0.6721954345703125, 0.69586181640625, 0.7195281982421875, 0.743194580078125, 0.7668609619140625, 0.79052734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 13.0, 18.0, 21.0, 29.0, 34.0, 50.0, 65.0, 115.0, 107.0, 113.0, 106.0, 86.0, 71.0, 46.0, 38.0, 28.0, 10.0, 11.0, 7.0, 10.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2230224609375, -0.21706771850585938, -0.21111297607421875, -0.20515823364257812, -0.1992034912109375, -0.19324874877929688, -0.18729400634765625, -0.18133926391601562, -0.175384521484375, -0.16942977905273438, -0.16347503662109375, -0.15752029418945312, -0.1515655517578125, -0.14561080932617188, -0.13965606689453125, -0.13370132446289062, -0.12774658203125, -0.12179183959960938, -0.11583709716796875, -0.10988235473632812, -0.1039276123046875, -0.09797286987304688, -0.09201812744140625, -0.08606338500976562, -0.080108642578125, -0.07415390014648438, -0.06819915771484375, -0.062244415283203125, -0.0562896728515625, -0.050334930419921875, -0.04438018798828125, -0.038425445556640625, -0.032470703125, -0.026515960693359375, -0.02056121826171875, -0.014606475830078125, -0.0086517333984375, -0.002696990966796875, 0.00325775146484375, 0.009212493896484375, 0.015167236328125, 0.021121978759765625, 0.02707672119140625, 0.033031463623046875, 0.0389862060546875, 0.044940948486328125, 0.05089569091796875, 0.056850433349609375, 0.06280517578125, 0.06875991821289062, 0.07471466064453125, 0.08066940307617188, 0.0866241455078125, 0.09257888793945312, 0.09853363037109375, 0.10448837280273438, 0.110443115234375, 0.11639785766601562, 0.12235260009765625, 0.12830734252929688, 0.1342620849609375, 0.14021682739257812, 0.14617156982421875, 0.15212631225585938, 0.1580810546875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 6.0, 27.0, 31.0, 60.0, 110.0, 147.0, 186.0, 143.0, 120.0, 69.0, 47.0, 18.0, 11.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33904504776001, -4.20599889755249, -4.072952747344971, -3.9399068355560303, -3.80686092376709, -3.6738147735595703, -3.540768623352051, -3.4077227115631104, -3.27467679977417, -3.1416306495666504, -3.00858473777771, -2.8755385875701904, -2.74249267578125, -2.6094465255737305, -2.476400375366211, -2.3433544635772705, -2.210308313369751, -2.0772621631622314, -1.944216251373291, -1.8111701011657715, -1.678124189376831, -1.5450780391693115, -1.4120320081710815, -1.2789859771728516, -1.1459399461746216, -1.0128939151763916, -0.8798478841781616, -0.7468017935752869, -0.6137557625770569, -0.4807097315788269, -0.34766364097595215, -0.21461760997772217, -0.08157157897949219, 0.05147446691989899, 0.18452051281929016, 0.31756657361984253, 0.4506126046180725, 0.5836586356163025, 0.7167047262191772, 0.8497507572174072, 0.9827967882156372, 1.1158428192138672, 1.2488888502120972, 1.3819348812103271, 1.5149810314178467, 1.648026943206787, 1.7810730934143066, 1.9141191244125366, 2.0471651554107666, 2.180211305618286, 2.3132572174072266, 2.446303367614746, 2.5793492794036865, 2.712395429611206, 2.8454413414001465, 2.978487491607666, 3.1115336418151855, 3.244579792022705, 3.3776257038116455, 3.510671854019165, 3.6437177658081055, 3.776763916015625, 3.9098100662231445, 4.042856216430664, 4.175901889801025]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 14.0, 13.0, 11.0, 23.0, 22.0, 38.0, 45.0, 39.0, 56.0, 74.0, 52.0, 66.0, 73.0, 76.0, 71.0, 75.0, 49.0, 52.0, 34.0, 33.0, 31.0, 21.0, 15.0, 13.0, 6.0, 2.0, 2.0, 6.0, 2.0], "bins": [-6.718866348266602, -6.577828407287598, -6.436790943145752, -6.295753002166748, -6.154715061187744, -6.013677597045898, -5.8726396560668945, -5.731601715087891, -5.590563774108887, -5.449525833129883, -5.308488368988037, -5.167450428009033, -5.026412487030029, -4.885375022888184, -4.74433708190918, -4.603299140930176, -4.46226167678833, -4.321223735809326, -4.1801862716674805, -4.039148330688477, -3.8981103897094727, -3.757072687149048, -3.616034984588623, -3.474997043609619, -3.3339593410491943, -3.1929216384887695, -3.0518836975097656, -2.910845994949341, -2.769808292388916, -2.628770351409912, -2.4877326488494873, -2.3466949462890625, -2.2056565284729004, -2.0646188259124756, -1.9235808849334717, -1.7825431823730469, -1.6415053606033325, -1.5004675388336182, -1.3594298362731934, -1.218392014503479, -1.0773541927337646, -0.9363163709640503, -0.7952786087989807, -0.6542408466339111, -0.5132030248641968, -0.3721652030944824, -0.23112744092941284, -0.09008967876434326, 0.050948143005371094, 0.19198593497276306, 0.33302372694015503, 0.474061518907547, 0.615099310874939, 0.7561371326446533, 0.8971748948097229, 1.0382126569747925, 1.1792504787445068, 1.3202883005142212, 1.4613261222839355, 1.6023638248443604, 1.7434016466140747, 1.884439468383789, 2.025477170944214, 2.1665148735046387, 2.3075528144836426]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 19.0, 24.0, 43.0, 59.0, 92.0, 111.0, 168.0, 294.0, 476.0, 789.0, 1514.0, 3257.0, 7631.0, 23083.0, 91941.0, 477992.0, 1794871.0, 1378635.0, 313107.0, 68599.0, 18957.0, 6426.0, 2806.0, 1399.0, 777.0, 397.0, 257.0, 143.0, 112.0, 79.0, 53.0, 30.0, 30.0, 22.0, 16.0, 12.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2142333984375, -1.173583984375, -1.1329345703125, -1.09228515625, -1.0516357421875, -1.010986328125, -0.9703369140625, -0.9296875, -0.8890380859375, -0.848388671875, -0.8077392578125, -0.76708984375, -0.7264404296875, -0.685791015625, -0.6451416015625, -0.6044921875, -0.5638427734375, -0.523193359375, -0.4825439453125, -0.44189453125, -0.4012451171875, -0.360595703125, -0.3199462890625, -0.279296875, -0.2386474609375, -0.197998046875, -0.1573486328125, -0.11669921875, -0.0760498046875, -0.035400390625, 0.0052490234375, 0.0458984375, 0.0865478515625, 0.127197265625, 0.1678466796875, 0.20849609375, 0.2491455078125, 0.289794921875, 0.3304443359375, 0.37109375, 0.4117431640625, 0.452392578125, 0.4930419921875, 0.53369140625, 0.5743408203125, 0.614990234375, 0.6556396484375, 0.6962890625, 0.7369384765625, 0.777587890625, 0.8182373046875, 0.85888671875, 0.8995361328125, 0.940185546875, 0.9808349609375, 1.021484375, 1.0621337890625, 1.102783203125, 1.1434326171875, 1.18408203125, 1.2247314453125, 1.265380859375, 1.3060302734375, 1.3466796875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 2.0, 4.0, 14.0, 19.0, 18.0, 18.0, 29.0, 33.0, 32.0, 40.0, 39.0, 41.0, 48.0, 42.0, 54.0, 47.0, 47.0, 64.0, 46.0, 52.0, 45.0, 35.0, 24.0, 34.0, 30.0, 16.0, 20.0, 23.0, 13.0, 17.0, 7.0, 6.0, 11.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1643524169921875, -1.126556396484375, -1.0887603759765625, -1.05096435546875, -1.0131683349609375, -0.975372314453125, -0.9375762939453125, -0.8997802734375, -0.8619842529296875, -0.824188232421875, -0.7863922119140625, -0.74859619140625, -0.7108001708984375, -0.673004150390625, -0.6352081298828125, -0.597412109375, -0.5596160888671875, -0.521820068359375, -0.4840240478515625, -0.44622802734375, -0.4084320068359375, -0.370635986328125, -0.3328399658203125, -0.2950439453125, -0.2572479248046875, -0.219451904296875, -0.1816558837890625, -0.14385986328125, -0.1060638427734375, -0.068267822265625, -0.0304718017578125, 0.00732421875, 0.0451202392578125, 0.082916259765625, 0.1207122802734375, 0.15850830078125, 0.1963043212890625, 0.234100341796875, 0.2718963623046875, 0.3096923828125, 0.3474884033203125, 0.385284423828125, 0.4230804443359375, 0.46087646484375, 0.4986724853515625, 0.536468505859375, 0.5742645263671875, 0.612060546875, 0.6498565673828125, 0.687652587890625, 0.7254486083984375, 0.76324462890625, 0.8010406494140625, 0.838836669921875, 0.8766326904296875, 0.9144287109375, 0.9522247314453125, 0.990020751953125, 1.0278167724609375, 1.06561279296875, 1.1034088134765625, 1.141204833984375, 1.1790008544921875, 1.216796875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 25.0, 52.0, 106.0, 170.0, 418.0, 1240.0, 13067.0, 4072636.0, 102994.0, 2419.0, 571.0, 250.0, 145.0, 74.0, 40.0, 22.0, 14.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.775726318359375, -8.57489013671875, -8.374053955078125, -8.1732177734375, -7.972381591796875, -7.77154541015625, -7.570709228515625, -7.369873046875, -7.169036865234375, -6.96820068359375, -6.767364501953125, -6.5665283203125, -6.365692138671875, -6.16485595703125, -5.964019775390625, -5.76318359375, -5.562347412109375, -5.36151123046875, -5.160675048828125, -4.9598388671875, -4.759002685546875, -4.55816650390625, -4.357330322265625, -4.156494140625, -3.955657958984375, -3.75482177734375, -3.553985595703125, -3.3531494140625, -3.152313232421875, -2.95147705078125, -2.750640869140625, -2.5498046875, -2.348968505859375, -2.14813232421875, -1.947296142578125, -1.7464599609375, -1.545623779296875, -1.34478759765625, -1.143951416015625, -0.943115234375, -0.742279052734375, -0.54144287109375, -0.340606689453125, -0.1397705078125, 0.061065673828125, 0.26190185546875, 0.462738037109375, 0.66357421875, 0.864410400390625, 1.06524658203125, 1.266082763671875, 1.4669189453125, 1.667755126953125, 1.86859130859375, 2.069427490234375, 2.270263671875, 2.471099853515625, 2.67193603515625, 2.872772216796875, 3.0736083984375, 3.274444580078125, 3.47528076171875, 3.676116943359375, 3.876953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 6.0, 3.0, 5.0, 10.0, 16.0, 17.0, 30.0, 31.0, 47.0, 64.0, 128.0, 161.0, 284.0, 471.0, 628.0, 661.0, 519.0, 377.0, 229.0, 130.0, 86.0, 46.0, 41.0, 26.0, 20.0, 12.0, 11.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5411605834960938, -0.5232391357421875, -0.5053176879882812, -0.487396240234375, -0.46947479248046875, -0.4515533447265625, -0.43363189697265625, -0.41571044921875, -0.39778900146484375, -0.3798675537109375, -0.36194610595703125, -0.344024658203125, -0.32610321044921875, -0.3081817626953125, -0.29026031494140625, -0.2723388671875, -0.25441741943359375, -0.2364959716796875, -0.21857452392578125, -0.200653076171875, -0.18273162841796875, -0.1648101806640625, -0.14688873291015625, -0.12896728515625, -0.11104583740234375, -0.0931243896484375, -0.07520294189453125, -0.057281494140625, -0.03936004638671875, -0.0214385986328125, -0.00351715087890625, 0.014404296875, 0.03232574462890625, 0.0502471923828125, 0.06816864013671875, 0.086090087890625, 0.10401153564453125, 0.1219329833984375, 0.13985443115234375, 0.15777587890625, 0.17569732666015625, 0.1936187744140625, 0.21154022216796875, 0.229461669921875, 0.24738311767578125, 0.2653045654296875, 0.28322601318359375, 0.3011474609375, 0.31906890869140625, 0.3369903564453125, 0.35491180419921875, 0.372833251953125, 0.39075469970703125, 0.4086761474609375, 0.42659759521484375, 0.44451904296875, 0.46244049072265625, 0.4803619384765625, 0.49828338623046875, 0.516204833984375, 0.5341262817382812, 0.5520477294921875, 0.5699691772460938, 0.587890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 12.0, 26.0, 36.0, 47.0, 53.0, 79.0, 104.0, 116.0, 135.0, 117.0, 89.0, 55.0, 44.0, 32.0, 17.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.475778818130493, -2.396470785140991, -2.3171629905700684, -2.2378549575805664, -2.1585469245910645, -2.0792391300201416, -1.9999310970306396, -1.9206231832504272, -1.8413152694702148, -1.7620073556900024, -1.68269944190979, -1.603391408920288, -1.5240834951400757, -1.4447755813598633, -1.3654675483703613, -1.286159634590149, -1.2068517208099365, -1.1275438070297241, -1.0482358932495117, -0.9689278602600098, -0.8896199464797974, -0.810312032699585, -0.7310040593147278, -0.6516960859298706, -0.5723881721496582, -0.4930802285671234, -0.4137722849845886, -0.33446434140205383, -0.25515639781951904, -0.17584845423698425, -0.09654051065444946, -0.017232537269592285, 0.06207537651062012, 0.1413833200931549, 0.2206912636756897, 0.2999992072582245, 0.3793071508407593, 0.45861509442329407, 0.5379230380058289, 0.617231011390686, 0.6965389251708984, 0.7758468389511108, 0.855154812335968, 0.9344627857208252, 1.0137706995010376, 1.09307861328125, 1.172386646270752, 1.2516945600509644, 1.3310024738311768, 1.4103103876113892, 1.4896183013916016, 1.5689263343811035, 1.648234248161316, 1.7275421619415283, 1.8068501949310303, 1.8861581087112427, 1.965466022491455, 2.044774055480957, 2.12408185005188, 2.203389883041382, 2.2826976776123047, 2.3620057106018066, 2.4413137435913086, 2.5206217765808105, 2.5999295711517334]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 17.0, 12.0, 24.0, 26.0, 26.0, 20.0, 24.0, 30.0, 30.0, 33.0, 31.0, 39.0, 32.0, 47.0, 39.0, 42.0, 41.0, 43.0, 37.0, 27.0, 37.0, 31.0, 29.0, 18.0, 36.0, 27.0, 26.0, 14.0, 17.0, 12.0, 10.0, 11.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.0165743827819824, -0.9838593602180481, -0.9511443376541138, -0.9184293150901794, -0.8857142925262451, -0.8529993295669556, -0.8202843070030212, -0.7875692844390869, -0.7548542618751526, -0.7221392393112183, -0.6894242167472839, -0.6567091941833496, -0.6239942312240601, -0.591279149055481, -0.5585641860961914, -0.5258491635322571, -0.49313414096832275, -0.4604191184043884, -0.4277040958404541, -0.39498910307884216, -0.36227408051490784, -0.3295590579509735, -0.2968440651893616, -0.26412904262542725, -0.23141402006149292, -0.1986989974975586, -0.16598398983478546, -0.13326898217201233, -0.100553959608078, -0.06783893704414368, -0.035123929381370544, -0.002408921718597412, 0.030306100845336914, 0.06302111595869064, 0.09573613107204437, 0.1284511387348175, 0.16116616129875183, 0.19388118386268616, 0.2265961915254593, 0.2593111991882324, 0.29202622175216675, 0.3247412443161011, 0.3574562668800354, 0.39017125964164734, 0.42288628220558167, 0.455601304769516, 0.48831629753112793, 0.5210313200950623, 0.5537463426589966, 0.5864613652229309, 0.6191763877868652, 0.6518914103507996, 0.6846064329147339, 0.7173213958740234, 0.7500364184379578, 0.7827514410018921, 0.8154664635658264, 0.8481814861297607, 0.8808965086936951, 0.9136115312576294, 0.946326494216919, 0.979041576385498, 1.0117565393447876, 1.0444715023040771, 1.0771865844726562]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 15.0, 10.0, 11.0, 29.0, 77.0, 209.0, 724.0, 2950.0, 15396.0, 119165.0, 830441.0, 66373.0, 10299.0, 2046.0, 520.0, 146.0, 54.0, 25.0, 23.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1875, -1.1548614501953125, -1.122222900390625, -1.0895843505859375, -1.05694580078125, -1.0243072509765625, -0.991668701171875, -0.9590301513671875, -0.9263916015625, -0.8937530517578125, -0.861114501953125, -0.8284759521484375, -0.79583740234375, -0.7631988525390625, -0.730560302734375, -0.6979217529296875, -0.665283203125, -0.6326446533203125, -0.600006103515625, -0.5673675537109375, -0.53472900390625, -0.5020904541015625, -0.469451904296875, -0.4368133544921875, -0.4041748046875, -0.3715362548828125, -0.338897705078125, -0.3062591552734375, -0.27362060546875, -0.2409820556640625, -0.208343505859375, -0.1757049560546875, -0.14306640625, -0.1104278564453125, -0.077789306640625, -0.0451507568359375, -0.01251220703125, 0.0201263427734375, 0.052764892578125, 0.0854034423828125, 0.1180419921875, 0.1506805419921875, 0.183319091796875, 0.2159576416015625, 0.24859619140625, 0.2812347412109375, 0.313873291015625, 0.3465118408203125, 0.379150390625, 0.4117889404296875, 0.444427490234375, 0.4770660400390625, 0.50970458984375, 0.5423431396484375, 0.574981689453125, 0.6076202392578125, 0.6402587890625, 0.6728973388671875, 0.705535888671875, 0.7381744384765625, 0.77081298828125, 0.8034515380859375, 0.836090087890625, 0.8687286376953125, 0.9013671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 4.0, 7.0, 16.0, 30.0, 25.0, 45.0, 66.0, 88.0, 95.0, 83.0, 101.0, 102.0, 92.0, 85.0, 50.0, 42.0, 31.0, 12.0, 10.0, 10.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.65234375, -2.5973129272460938, -2.5422821044921875, -2.4872512817382812, -2.432220458984375, -2.3771896362304688, -2.3221588134765625, -2.2671279907226562, -2.21209716796875, -2.1570663452148438, -2.1020355224609375, -2.0470046997070312, -1.991973876953125, -1.9369430541992188, -1.8819122314453125, -1.8268814086914062, -1.7718505859375, -1.7168197631835938, -1.6617889404296875, -1.6067581176757812, -1.551727294921875, -1.4966964721679688, -1.4416656494140625, -1.3866348266601562, -1.33160400390625, -1.2765731811523438, -1.2215423583984375, -1.1665115356445312, -1.111480712890625, -1.0564498901367188, -1.0014190673828125, -0.9463882446289062, -0.891357421875, -0.8363265991210938, -0.7812957763671875, -0.7262649536132812, -0.671234130859375, -0.6162033081054688, -0.5611724853515625, -0.5061416625976562, -0.45111083984375, -0.39608001708984375, -0.3410491943359375, -0.28601837158203125, -0.230987548828125, -0.17595672607421875, -0.1209259033203125, -0.06589508056640625, -0.0108642578125, 0.04416656494140625, 0.0991973876953125, 0.15422821044921875, 0.209259033203125, 0.26428985595703125, 0.3193206787109375, 0.37435150146484375, 0.42938232421875, 0.48441314697265625, 0.5394439697265625, 0.5944747924804688, 0.649505615234375, 0.7045364379882812, 0.7595672607421875, 0.8145980834960938, 0.86962890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 12.0, 20.0, 26.0, 46.0, 80.0, 107.0, 227.0, 507.0, 1273.0, 3446.0, 10933.0, 37918.0, 271273.0, 618266.0, 76824.0, 18459.0, 5656.0, 1955.0, 754.0, 322.0, 175.0, 88.0, 54.0, 39.0, 26.0, 15.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6245269775390625, -0.604522705078125, -0.5845184326171875, -0.56451416015625, -0.5445098876953125, -0.524505615234375, -0.5045013427734375, -0.4844970703125, -0.4644927978515625, -0.444488525390625, -0.4244842529296875, -0.40447998046875, -0.3844757080078125, -0.364471435546875, -0.3444671630859375, -0.324462890625, -0.3044586181640625, -0.284454345703125, -0.2644500732421875, -0.24444580078125, -0.2244415283203125, -0.204437255859375, -0.1844329833984375, -0.1644287109375, -0.1444244384765625, -0.124420166015625, -0.1044158935546875, -0.08441162109375, -0.0644073486328125, -0.044403076171875, -0.0243988037109375, -0.00439453125, 0.0156097412109375, 0.035614013671875, 0.0556182861328125, 0.07562255859375, 0.0956268310546875, 0.115631103515625, 0.1356353759765625, 0.1556396484375, 0.1756439208984375, 0.195648193359375, 0.2156524658203125, 0.23565673828125, 0.2556610107421875, 0.275665283203125, 0.2956695556640625, 0.315673828125, 0.3356781005859375, 0.355682373046875, 0.3756866455078125, 0.39569091796875, 0.4156951904296875, 0.435699462890625, 0.4557037353515625, 0.4757080078125, 0.4957122802734375, 0.515716552734375, 0.5357208251953125, 0.55572509765625, 0.5757293701171875, 0.595733642578125, 0.6157379150390625, 0.6357421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 8.0, 10.0, 16.0, 17.0, 39.0, 42.0, 47.0, 56.0, 56.0, 77.0, 64.0, 69.0, 89.0, 75.0, 63.0, 53.0, 49.0, 32.0, 30.0, 31.0, 17.0, 19.0, 19.0, 7.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.481048583984375, -2.39764404296875, -2.314239501953125, -2.2308349609375, -2.147430419921875, -2.06402587890625, -1.980621337890625, -1.897216796875, -1.813812255859375, -1.73040771484375, -1.647003173828125, -1.5635986328125, -1.480194091796875, -1.39678955078125, -1.313385009765625, -1.22998046875, -1.146575927734375, -1.06317138671875, -0.979766845703125, -0.8963623046875, -0.812957763671875, -0.72955322265625, -0.646148681640625, -0.562744140625, -0.479339599609375, -0.39593505859375, -0.312530517578125, -0.2291259765625, -0.145721435546875, -0.06231689453125, 0.021087646484375, 0.1044921875, 0.187896728515625, 0.27130126953125, 0.354705810546875, 0.4381103515625, 0.521514892578125, 0.60491943359375, 0.688323974609375, 0.771728515625, 0.855133056640625, 0.93853759765625, 1.021942138671875, 1.1053466796875, 1.188751220703125, 1.27215576171875, 1.355560302734375, 1.43896484375, 1.522369384765625, 1.60577392578125, 1.689178466796875, 1.7725830078125, 1.855987548828125, 1.93939208984375, 2.022796630859375, 2.106201171875, 2.189605712890625, 2.27301025390625, 2.356414794921875, 2.4398193359375, 2.523223876953125, 2.60662841796875, 2.690032958984375, 2.7734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 11.0, 12.0, 17.0, 20.0, 33.0, 69.0, 83.0, 109.0, 189.0, 328.0, 560.0, 979.0, 1907.0, 3897.0, 8186.0, 20404.0, 59893.0, 265173.0, 502428.0, 124395.0, 35269.0, 13175.0, 5669.0, 2571.0, 1420.0, 714.0, 398.0, 230.0, 159.0, 71.0, 55.0, 45.0, 22.0, 26.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.17529296875, -0.17032241821289062, -0.16535186767578125, -0.16038131713867188, -0.1554107666015625, -0.15044021606445312, -0.14546966552734375, -0.14049911499023438, -0.135528564453125, -0.13055801391601562, -0.12558746337890625, -0.12061691284179688, -0.1156463623046875, -0.11067581176757812, -0.10570526123046875, -0.10073471069335938, -0.09576416015625, -0.09079360961914062, -0.08582305908203125, -0.08085250854492188, -0.0758819580078125, -0.07091140747070312, -0.06594085693359375, -0.060970306396484375, -0.055999755859375, -0.051029205322265625, -0.04605865478515625, -0.041088104248046875, -0.0361175537109375, -0.031147003173828125, -0.02617645263671875, -0.021205902099609375, -0.0162353515625, -0.011264801025390625, -0.00629425048828125, -0.001323699951171875, 0.0036468505859375, 0.008617401123046875, 0.01358795166015625, 0.018558502197265625, 0.023529052734375, 0.028499603271484375, 0.03347015380859375, 0.038440704345703125, 0.0434112548828125, 0.048381805419921875, 0.05335235595703125, 0.058322906494140625, 0.06329345703125, 0.06826400756835938, 0.07323455810546875, 0.07820510864257812, 0.0831756591796875, 0.08814620971679688, 0.09311676025390625, 0.09808731079101562, 0.103057861328125, 0.10802841186523438, 0.11299896240234375, 0.11796951293945312, 0.1229400634765625, 0.12791061401367188, 0.13288116455078125, 0.13785171508789062, 0.142822265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 9.0, 7.0, 11.0, 19.0, 34.0, 41.0, 60.0, 113.0, 135.0, 136.0, 112.0, 95.0, 65.0, 38.0, 25.0, 15.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.347894668579102e-05, -6.106030195951462e-05, -5.864165723323822e-05, -5.622301250696182e-05, -5.3804367780685425e-05, -5.138572305440903e-05, -4.896707832813263e-05, -4.654843360185623e-05, -4.4129788875579834e-05, -4.1711144149303436e-05, -3.929249942302704e-05, -3.687385469675064e-05, -3.445520997047424e-05, -3.2036565244197845e-05, -2.9617920517921448e-05, -2.719927579164505e-05, -2.4780631065368652e-05, -2.2361986339092255e-05, -1.9943341612815857e-05, -1.752469688653946e-05, -1.5106052160263062e-05, -1.2687407433986664e-05, -1.0268762707710266e-05, -7.850117981433868e-06, -5.431473255157471e-06, -3.012828528881073e-06, -5.941838026046753e-07, 1.8244609236717224e-06, 4.24310564994812e-06, 6.661750376224518e-06, 9.080395102500916e-06, 1.1499039828777313e-05, 1.3917684555053711e-05, 1.633632928133011e-05, 1.8754974007606506e-05, 2.1173618733882904e-05, 2.3592263460159302e-05, 2.60109081864357e-05, 2.8429552912712097e-05, 3.0848197638988495e-05, 3.326684236526489e-05, 3.568548709154129e-05, 3.810413181781769e-05, 4.0522776544094086e-05, 4.2941421270370483e-05, 4.536006599664688e-05, 4.777871072292328e-05, 5.0197355449199677e-05, 5.2616000175476074e-05, 5.503464490175247e-05, 5.745328962802887e-05, 5.987193435430527e-05, 6.229057908058167e-05, 6.470922380685806e-05, 6.712786853313446e-05, 6.954651325941086e-05, 7.196515798568726e-05, 7.438380271196365e-05, 7.680244743824005e-05, 7.922109216451645e-05, 8.163973689079285e-05, 8.405838161706924e-05, 8.647702634334564e-05, 8.889567106962204e-05, 9.131431579589844e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 11.0, 12.0, 8.0, 12.0, 23.0, 37.0, 45.0, 79.0, 127.0, 316.0, 852.0, 3103.0, 13080.0, 73565.0, 711691.0, 211341.0, 26249.0, 5649.0, 1377.0, 487.0, 183.0, 98.0, 45.0, 33.0, 25.0, 12.0, 18.0, 6.0, 8.0, 8.0, 2.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2792816162109375, -0.270477294921875, -0.2616729736328125, -0.25286865234375, -0.2440643310546875, -0.235260009765625, -0.2264556884765625, -0.2176513671875, -0.2088470458984375, -0.200042724609375, -0.1912384033203125, -0.18243408203125, -0.1736297607421875, -0.164825439453125, -0.1560211181640625, -0.147216796875, -0.1384124755859375, -0.129608154296875, -0.1208038330078125, -0.11199951171875, -0.1031951904296875, -0.094390869140625, -0.0855865478515625, -0.0767822265625, -0.0679779052734375, -0.059173583984375, -0.0503692626953125, -0.04156494140625, -0.0327606201171875, -0.023956298828125, -0.0151519775390625, -0.00634765625, 0.0024566650390625, 0.011260986328125, 0.0200653076171875, 0.02886962890625, 0.0376739501953125, 0.046478271484375, 0.0552825927734375, 0.0640869140625, 0.0728912353515625, 0.081695556640625, 0.0904998779296875, 0.09930419921875, 0.1081085205078125, 0.116912841796875, 0.1257171630859375, 0.134521484375, 0.1433258056640625, 0.152130126953125, 0.1609344482421875, 0.16973876953125, 0.1785430908203125, 0.187347412109375, 0.1961517333984375, 0.2049560546875, 0.2137603759765625, 0.222564697265625, 0.2313690185546875, 0.24017333984375, 0.2489776611328125, 0.257781982421875, 0.2665863037109375, 0.275390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 5.0, 7.0, 11.0, 6.0, 13.0, 20.0, 21.0, 51.0, 38.0, 66.0, 81.0, 85.0, 104.0, 95.0, 87.0, 78.0, 46.0, 30.0, 29.0, 25.0, 20.0, 17.0, 6.0, 7.0, 3.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03960466384887695, -0.038224220275878906, -0.03684377670288086, -0.03546333312988281, -0.034082889556884766, -0.03270244598388672, -0.03132200241088867, -0.029941558837890625, -0.028561115264892578, -0.02718067169189453, -0.025800228118896484, -0.024419784545898438, -0.02303934097290039, -0.021658897399902344, -0.020278453826904297, -0.01889801025390625, -0.017517566680908203, -0.016137123107910156, -0.01475667953491211, -0.013376235961914062, -0.011995792388916016, -0.010615348815917969, -0.009234905242919922, -0.007854461669921875, -0.006474018096923828, -0.005093574523925781, -0.0037131309509277344, -0.0023326873779296875, -0.0009522438049316406, 0.00042819976806640625, 0.0018086433410644531, 0.0031890869140625, 0.004569530487060547, 0.005949974060058594, 0.007330417633056641, 0.008710861206054688, 0.010091304779052734, 0.011471748352050781, 0.012852191925048828, 0.014232635498046875, 0.015613079071044922, 0.01699352264404297, 0.018373966217041016, 0.019754409790039062, 0.02113485336303711, 0.022515296936035156, 0.023895740509033203, 0.02527618408203125, 0.026656627655029297, 0.028037071228027344, 0.02941751480102539, 0.030797958374023438, 0.032178401947021484, 0.03355884552001953, 0.03493928909301758, 0.036319732666015625, 0.03770017623901367, 0.03908061981201172, 0.040461063385009766, 0.04184150695800781, 0.04322195053100586, 0.044602394104003906, 0.04598283767700195, 0.04736328125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 15.0, 34.0, 36.0, 65.0, 87.0, 148.0, 174.0, 153.0, 99.0, 71.0, 42.0, 25.0, 15.0, 11.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8319793939590454, -1.7723743915557861, -1.7127693891525269, -1.6531643867492676, -1.5935593843460083, -1.533954381942749, -1.4743494987487793, -1.41474449634552, -1.3551394939422607, -1.2955344915390015, -1.2359294891357422, -1.176324486732483, -1.1167194843292236, -1.057114601135254, -0.9975095391273499, -0.9379045963287354, -0.8782995343208313, -0.818694531917572, -0.7590895295143127, -0.6994845867156982, -0.639879584312439, -0.5802745819091797, -0.5206695795059204, -0.4610646069049835, -0.40145960450172424, -0.34185460209846497, -0.2822496294975281, -0.2226446270942688, -0.16303963959217072, -0.10343465209007263, -0.043829649686813354, 0.015775322914123535, 0.07538032531738281, 0.1349853128194809, 0.19459030032157898, 0.25419530272483826, 0.31380027532577515, 0.3734052777290344, 0.4330102801322937, 0.4926152527332306, 0.5522202253341675, 0.6118252277374268, 0.671430230140686, 0.7310352325439453, 0.7906401753425598, 0.8502451777458191, 0.9098501801490784, 0.9694551229476929, 1.0290601253509521, 1.0886651277542114, 1.1482701301574707, 1.20787513256073, 1.2674801349639893, 1.327085018157959, 1.3866901397705078, 1.4462950229644775, 1.5059001445770264, 1.5655051469802856, 1.625110149383545, 1.6847151517868042, 1.7443201541900635, 1.8039250373840332, 1.863530158996582, 1.9231350421905518, 1.982740044593811]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 5.0, 9.0, 15.0, 27.0, 26.0, 37.0, 48.0, 61.0, 56.0, 70.0, 85.0, 82.0, 62.0, 81.0, 69.0, 57.0, 55.0, 40.0, 34.0, 16.0, 17.0, 12.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7790000438690186, -1.7380934953689575, -1.697186827659607, -1.656280279159546, -1.6153736114501953, -1.5744670629501343, -1.5335603952407837, -1.4926538467407227, -1.451747179031372, -1.410840630531311, -1.3699339628219604, -1.3290274143218994, -1.2881207466125488, -1.2472141981124878, -1.2063075304031372, -1.1654009819030762, -1.1244944334030151, -1.083587884902954, -1.0426812171936035, -1.0017746686935425, -0.9608680009841919, -0.9199614524841309, -0.879054844379425, -0.8381482362747192, -0.7972416281700134, -0.7563350200653076, -0.7154284119606018, -0.674521803855896, -0.633615255355835, -0.5927085876464844, -0.5518020391464233, -0.5108954310417175, -0.46998870372772217, -0.42908209562301636, -0.38817548751831055, -0.3472689092159271, -0.3063623011112213, -0.2654556930065155, -0.2245490998029709, -0.18364250659942627, -0.14273589849472046, -0.10182929784059525, -0.06092269718647003, -0.020016096532344818, 0.020890504121780396, 0.061797112226486206, 0.10270370543003082, 0.14361029863357544, 0.18451690673828125, 0.22542351484298706, 0.26633012294769287, 0.3072367012500763, 0.3481433093547821, 0.3890499174594879, 0.42995649576187134, 0.47086310386657715, 0.511769711971283, 0.5526763200759888, 0.5935829281806946, 0.6344895362854004, 0.6753960847854614, 0.716302752494812, 0.757209300994873, 0.7981159090995789, 0.8390225172042847]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 1.0, 7.0, 2.0, 7.0, 12.0, 12.0, 21.0, 11.0, 37.0, 53.0, 97.0, 522.0, 9425.0, 963256.0, 73322.0, 1356.0, 179.0, 62.0, 34.0, 35.0, 23.0, 19.0, 11.0, 15.0, 5.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.15625, -5.029571533203125, -4.90289306640625, -4.776214599609375, -4.6495361328125, -4.522857666015625, -4.39617919921875, -4.269500732421875, -4.142822265625, -4.016143798828125, -3.88946533203125, -3.762786865234375, -3.6361083984375, -3.509429931640625, -3.38275146484375, -3.256072998046875, -3.12939453125, -3.002716064453125, -2.87603759765625, -2.749359130859375, -2.6226806640625, -2.496002197265625, -2.36932373046875, -2.242645263671875, -2.115966796875, -1.989288330078125, -1.86260986328125, -1.735931396484375, -1.6092529296875, -1.482574462890625, -1.35589599609375, -1.229217529296875, -1.1025390625, -0.975860595703125, -0.84918212890625, -0.722503662109375, -0.5958251953125, -0.469146728515625, -0.34246826171875, -0.215789794921875, -0.089111328125, 0.037567138671875, 0.16424560546875, 0.290924072265625, 0.4176025390625, 0.544281005859375, 0.67095947265625, 0.797637939453125, 0.92431640625, 1.050994873046875, 1.17767333984375, 1.304351806640625, 1.4310302734375, 1.557708740234375, 1.68438720703125, 1.811065673828125, 1.937744140625, 2.064422607421875, 2.19110107421875, 2.317779541015625, 2.4444580078125, 2.571136474609375, 2.69781494140625, 2.824493408203125, 2.951171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 13.0, 14.0, 35.0, 72.0, 109.0, 166.0, 193.0, 161.0, 117.0, 69.0, 35.0, 18.0, 8.0, 6.0], "bins": [-10.8671875, -10.674575805664062, -10.481964111328125, -10.289352416992188, -10.09674072265625, -9.904129028320312, -9.711517333984375, -9.518905639648438, -9.3262939453125, -9.133682250976562, -8.941070556640625, -8.748458862304688, -8.55584716796875, -8.363235473632812, -8.170623779296875, -7.9780120849609375, -7.785400390625, -7.5927886962890625, -7.400177001953125, -7.2075653076171875, -7.01495361328125, -6.8223419189453125, -6.629730224609375, -6.4371185302734375, -6.2445068359375, -6.0518951416015625, -5.859283447265625, -5.6666717529296875, -5.47406005859375, -5.2814483642578125, -5.088836669921875, -4.8962249755859375, -4.70361328125, -4.5110015869140625, -4.318389892578125, -4.1257781982421875, -3.93316650390625, -3.7405548095703125, -3.547943115234375, -3.3553314208984375, -3.1627197265625, -2.9701080322265625, -2.777496337890625, -2.5848846435546875, -2.39227294921875, -2.1996612548828125, -2.007049560546875, -1.8144378662109375, -1.621826171875, -1.4292144775390625, -1.236602783203125, -1.0439910888671875, -0.85137939453125, -0.6587677001953125, -0.466156005859375, -0.2735443115234375, -0.0809326171875, 0.1116790771484375, 0.304290771484375, 0.4969024658203125, 0.68951416015625, 0.8821258544921875, 1.074737548828125, 1.2673492431640625, 1.4599609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 13.0, 10.0, 16.0, 19.0, 25.0, 37.0, 41.0, 60.0, 52.0, 94.0, 104.0, 147.0, 209.0, 406.0, 1317.0, 10130.0, 334266.0, 677923.0, 20222.0, 2002.0, 533.0, 249.0, 177.0, 125.0, 75.0, 64.0, 59.0, 37.0, 26.0, 19.0, 20.0, 17.0, 6.0, 12.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.967864990234375, -1.90252685546875, -1.837188720703125, -1.7718505859375, -1.706512451171875, -1.64117431640625, -1.575836181640625, -1.510498046875, -1.445159912109375, -1.37982177734375, -1.314483642578125, -1.2491455078125, -1.183807373046875, -1.11846923828125, -1.053131103515625, -0.98779296875, -0.922454833984375, -0.85711669921875, -0.791778564453125, -0.7264404296875, -0.661102294921875, -0.59576416015625, -0.530426025390625, -0.465087890625, -0.399749755859375, -0.33441162109375, -0.269073486328125, -0.2037353515625, -0.138397216796875, -0.07305908203125, -0.007720947265625, 0.0576171875, 0.122955322265625, 0.18829345703125, 0.253631591796875, 0.3189697265625, 0.384307861328125, 0.44964599609375, 0.514984130859375, 0.580322265625, 0.645660400390625, 0.71099853515625, 0.776336669921875, 0.8416748046875, 0.907012939453125, 0.97235107421875, 1.037689208984375, 1.10302734375, 1.168365478515625, 1.23370361328125, 1.299041748046875, 1.3643798828125, 1.429718017578125, 1.49505615234375, 1.560394287109375, 1.625732421875, 1.691070556640625, 1.75640869140625, 1.821746826171875, 1.8870849609375, 1.952423095703125, 2.01776123046875, 2.083099365234375, 2.1484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 8.0, 9.0, 7.0, 19.0, 12.0, 18.0, 18.0, 19.0, 21.0, 22.0, 21.0, 35.0, 34.0, 28.0, 42.0, 29.0, 47.0, 44.0, 43.0, 49.0, 42.0, 45.0, 31.0, 38.0, 37.0, 40.0, 28.0, 26.0, 29.0, 26.0, 18.0, 14.0, 17.0, 18.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8203125, -1.765899658203125, -1.71148681640625, -1.657073974609375, -1.6026611328125, -1.548248291015625, -1.49383544921875, -1.439422607421875, -1.385009765625, -1.330596923828125, -1.27618408203125, -1.221771240234375, -1.1673583984375, -1.112945556640625, -1.05853271484375, -1.004119873046875, -0.94970703125, -0.895294189453125, -0.84088134765625, -0.786468505859375, -0.7320556640625, -0.677642822265625, -0.62322998046875, -0.568817138671875, -0.514404296875, -0.459991455078125, -0.40557861328125, -0.351165771484375, -0.2967529296875, -0.242340087890625, -0.18792724609375, -0.133514404296875, -0.0791015625, -0.024688720703125, 0.02972412109375, 0.084136962890625, 0.1385498046875, 0.192962646484375, 0.24737548828125, 0.301788330078125, 0.356201171875, 0.410614013671875, 0.46502685546875, 0.519439697265625, 0.5738525390625, 0.628265380859375, 0.68267822265625, 0.737091064453125, 0.79150390625, 0.845916748046875, 0.90032958984375, 0.954742431640625, 1.0091552734375, 1.063568115234375, 1.11798095703125, 1.172393798828125, 1.226806640625, 1.281219482421875, 1.33563232421875, 1.390045166015625, 1.4444580078125, 1.498870849609375, 1.55328369140625, 1.607696533203125, 1.662109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 2.0, 8.0, 7.0, 19.0, 21.0, 38.0, 68.0, 147.0, 481.0, 2379.0, 41845.0, 958264.0, 42085.0, 2381.0, 466.0, 160.0, 71.0, 46.0, 22.0, 13.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1338272094726562, -1.1035919189453125, -1.0733566284179688, -1.043121337890625, -1.0128860473632812, -0.9826507568359375, -0.9524154663085938, -0.92218017578125, -0.8919448852539062, -0.8617095947265625, -0.8314743041992188, -0.801239013671875, -0.7710037231445312, -0.7407684326171875, -0.7105331420898438, -0.6802978515625, -0.6500625610351562, -0.6198272705078125, -0.5895919799804688, -0.559356689453125, -0.5291213989257812, -0.4988861083984375, -0.46865081787109375, -0.43841552734375, -0.40818023681640625, -0.3779449462890625, -0.34770965576171875, -0.317474365234375, -0.28723907470703125, -0.2570037841796875, -0.22676849365234375, -0.196533203125, -0.16629791259765625, -0.1360626220703125, -0.10582733154296875, -0.075592041015625, -0.04535675048828125, -0.0151214599609375, 0.01511383056640625, 0.04534912109375, 0.07558441162109375, 0.1058197021484375, 0.13605499267578125, 0.166290283203125, 0.19652557373046875, 0.2267608642578125, 0.25699615478515625, 0.2872314453125, 0.31746673583984375, 0.3477020263671875, 0.37793731689453125, 0.408172607421875, 0.43840789794921875, 0.4686431884765625, 0.49887847900390625, 0.52911376953125, 0.5593490600585938, 0.5895843505859375, 0.6198196411132812, 0.650054931640625, 0.6802902221679688, 0.7105255126953125, 0.7407608032226562, 0.77099609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 12.0, 25.0, 47.0, 91.0, 124.0, 166.0, 150.0, 113.0, 92.0, 64.0, 33.0, 20.0, 12.0, 11.0, 7.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.56978988647461e-05, -7.308833301067352e-05, -7.047876715660095e-05, -6.786920130252838e-05, -6.525963544845581e-05, -6.265006959438324e-05, -6.004050374031067e-05, -5.74309378862381e-05, -5.482137203216553e-05, -5.2211806178092957e-05, -4.9602240324020386e-05, -4.6992674469947815e-05, -4.4383108615875244e-05, -4.177354276180267e-05, -3.91639769077301e-05, -3.655441105365753e-05, -3.394484519958496e-05, -3.133527934551239e-05, -2.872571349143982e-05, -2.611614763736725e-05, -2.3506581783294678e-05, -2.0897015929222107e-05, -1.8287450075149536e-05, -1.5677884221076965e-05, -1.3068318367004395e-05, -1.0458752512931824e-05, -7.849186658859253e-06, -5.239620804786682e-06, -2.6300549507141113e-06, -2.0489096641540527e-08, 2.5890767574310303e-06, 5.198642611503601e-06, 7.808208465576172e-06, 1.0417774319648743e-05, 1.3027340173721313e-05, 1.5636906027793884e-05, 1.8246471881866455e-05, 2.0856037735939026e-05, 2.3465603590011597e-05, 2.6075169444084167e-05, 2.8684735298156738e-05, 3.129430115222931e-05, 3.390386700630188e-05, 3.651343286037445e-05, 3.912299871444702e-05, 4.173256456851959e-05, 4.434213042259216e-05, 4.6951696276664734e-05, 4.9561262130737305e-05, 5.2170827984809875e-05, 5.4780393838882446e-05, 5.738995969295502e-05, 5.999952554702759e-05, 6.260909140110016e-05, 6.521865725517273e-05, 6.78282231092453e-05, 7.043778896331787e-05, 7.304735481739044e-05, 7.565692067146301e-05, 7.826648652553558e-05, 8.087605237960815e-05, 8.348561823368073e-05, 8.60951840877533e-05, 8.870474994182587e-05, 9.131431579589844e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 17.0, 19.0, 20.0, 52.0, 88.0, 183.0, 479.0, 1822.0, 19189.0, 930105.0, 91323.0, 3876.0, 808.0, 283.0, 106.0, 74.0, 28.0, 19.0, 13.0, 9.0, 8.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1684646606445312, -1.1347808837890625, -1.1010971069335938, -1.067413330078125, -1.0337295532226562, -1.0000457763671875, -0.9663619995117188, -0.93267822265625, -0.8989944458007812, -0.8653106689453125, -0.8316268920898438, -0.797943115234375, -0.7642593383789062, -0.7305755615234375, -0.6968917846679688, -0.6632080078125, -0.6295242309570312, -0.5958404541015625, -0.5621566772460938, -0.528472900390625, -0.49478912353515625, -0.4611053466796875, -0.42742156982421875, -0.39373779296875, -0.36005401611328125, -0.3263702392578125, -0.29268646240234375, -0.259002685546875, -0.22531890869140625, -0.1916351318359375, -0.15795135498046875, -0.124267578125, -0.09058380126953125, -0.0569000244140625, -0.02321624755859375, 0.010467529296875, 0.04415130615234375, 0.0778350830078125, 0.11151885986328125, 0.14520263671875, 0.17888641357421875, 0.2125701904296875, 0.24625396728515625, 0.279937744140625, 0.31362152099609375, 0.3473052978515625, 0.38098907470703125, 0.4146728515625, 0.44835662841796875, 0.4820404052734375, 0.5157241821289062, 0.549407958984375, 0.5830917358398438, 0.6167755126953125, 0.6504592895507812, 0.68414306640625, 0.7178268432617188, 0.7515106201171875, 0.7851943969726562, 0.818878173828125, 0.8525619506835938, 0.8862457275390625, 0.9199295043945312, 0.95361328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 11.0, 16.0, 15.0, 24.0, 38.0, 60.0, 64.0, 112.0, 125.0, 129.0, 104.0, 82.0, 67.0, 49.0, 26.0, 16.0, 15.0, 16.0, 7.0, 2.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1781005859375, -0.17127418518066406, -0.16444778442382812, -0.1576213836669922, -0.15079498291015625, -0.1439685821533203, -0.13714218139648438, -0.13031578063964844, -0.1234893798828125, -0.11666297912597656, -0.10983657836914062, -0.10301017761230469, -0.09618377685546875, -0.08935737609863281, -0.08253097534179688, -0.07570457458496094, -0.068878173828125, -0.06205177307128906, -0.055225372314453125, -0.04839897155761719, -0.04157257080078125, -0.03474617004394531, -0.027919769287109375, -0.021093368530273438, -0.0142669677734375, -0.0074405670166015625, -0.000614166259765625, 0.0062122344970703125, 0.01303863525390625, 0.019865036010742188, 0.026691436767578125, 0.03351783752441406, 0.04034423828125, 0.04717063903808594, 0.053997039794921875, 0.06082344055175781, 0.06764984130859375, 0.07447624206542969, 0.08130264282226562, 0.08812904357910156, 0.0949554443359375, 0.10178184509277344, 0.10860824584960938, 0.11543464660644531, 0.12226104736328125, 0.1290874481201172, 0.13591384887695312, 0.14274024963378906, 0.149566650390625, 0.15639305114746094, 0.16321945190429688, 0.1700458526611328, 0.17687225341796875, 0.1836986541748047, 0.19052505493164062, 0.19735145568847656, 0.2041778564453125, 0.21100425720214844, 0.21783065795898438, 0.2246570587158203, 0.23148345947265625, 0.2383098602294922, 0.24513626098632812, 0.25196266174316406, 0.2587890625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 14.0, 27.0, 60.0, 106.0, 183.0, 190.0, 189.0, 111.0, 46.0, 34.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.292221784591675, -3.1399030685424805, -2.987584352493286, -2.835265636444092, -2.6829471588134766, -2.5306284427642822, -2.378309726715088, -2.2259912490844727, -2.073672294616699, -1.9213535785675049, -1.7690349817276, -1.6167162656784058, -1.464397668838501, -1.3120789527893066, -1.1597602367401123, -1.0074416399002075, -0.8551230430603027, -0.7028043866157532, -0.5504857301712036, -0.3981670141220093, -0.24584835767745972, -0.09352970123291016, 0.05878901481628418, 0.21110761165618896, 0.3634263277053833, 0.5157449841499329, 0.6680636405944824, 0.8203823566436768, 0.9727010130882263, 1.1250196695327759, 1.2773383855819702, 1.429656982421875, 1.5819754600524902, 1.7342941761016846, 1.8866127729415894, 2.038931369781494, 2.1912500858306885, 2.343568801879883, 2.495887517929077, 2.6482062339782715, 2.8005247116088867, 2.952843427658081, 3.1051621437072754, 3.2574806213378906, 3.409799337387085, 3.5621180534362793, 3.7144367694854736, 3.866755485534668, 4.019074440002441, 4.171392917633057, 4.32371187210083, 4.476030349731445, 4.628349304199219, 4.780667781829834, 4.932986259460449, 5.085305213928223, 5.237623691558838, 5.389942169189453, 5.542261123657227, 5.694579601287842, 5.846898555755615, 5.9992170333862305, 6.151535987854004, 6.303854465484619, 6.456172943115234]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 16.0, 13.0, 29.0, 31.0, 28.0, 40.0, 47.0, 60.0, 58.0, 98.0, 83.0, 65.0, 71.0, 69.0, 59.0, 59.0, 37.0, 39.0, 37.0, 25.0, 23.0, 9.0, 8.0, 7.0], "bins": [-8.575007438659668, -8.407403945922852, -8.239800453186035, -8.072196960449219, -7.904592990875244, -7.736989498138428, -7.569386005401611, -7.401782512664795, -7.2341790199279785, -7.066575527191162, -6.898972034454346, -6.731368064880371, -6.563764572143555, -6.396161079406738, -6.228557586669922, -6.0609540939331055, -5.893350601196289, -5.725747108459473, -5.558143615722656, -5.39054012298584, -5.222936153411865, -5.055332660675049, -4.887729167938232, -4.720125675201416, -4.552521705627441, -4.384918212890625, -4.217314720153809, -4.049711227416992, -3.8821074962615967, -3.714503765106201, -3.5469002723693848, -3.3792967796325684, -3.211693048477173, -3.0440895557403564, -2.876485824584961, -2.7088823318481445, -2.541278839111328, -2.3736753463745117, -2.206071615219116, -2.0384681224823, -1.8708645105361938, -1.703260898590088, -1.5356574058532715, -1.3680537939071655, -1.2004501819610596, -1.0328466892242432, -0.8652430772781372, -0.6976395845413208, -0.5300359725952148, -0.36243242025375366, -0.1948288381099701, -0.027225255966186523, 0.14037829637527466, 0.30798184871673584, 0.4755854606628418, 0.6431889533996582, 0.8107925653457642, 0.9783961176872253, 1.1459996700286865, 1.3136032819747925, 1.4812068939208984, 1.6488103866577148, 1.8164139986038208, 1.9840174913406372, 2.151621103286743]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 17.0, 24.0, 34.0, 65.0, 84.0, 132.0, 242.0, 437.0, 878.0, 1783.0, 4099.0, 11850.0, 45513.0, 269701.0, 1576463.0, 1862057.0, 343067.0, 55804.0, 13166.0, 4503.0, 2023.0, 1026.0, 521.0, 310.0, 173.0, 103.0, 62.0, 39.0, 20.0, 20.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6923828125, -1.646728515625, -1.60107421875, -1.555419921875, -1.509765625, -1.464111328125, -1.41845703125, -1.372802734375, -1.3271484375, -1.281494140625, -1.23583984375, -1.190185546875, -1.14453125, -1.098876953125, -1.05322265625, -1.007568359375, -0.9619140625, -0.916259765625, -0.87060546875, -0.824951171875, -0.779296875, -0.733642578125, -0.68798828125, -0.642333984375, -0.5966796875, -0.551025390625, -0.50537109375, -0.459716796875, -0.4140625, -0.368408203125, -0.32275390625, -0.277099609375, -0.2314453125, -0.185791015625, -0.14013671875, -0.094482421875, -0.048828125, -0.003173828125, 0.04248046875, 0.088134765625, 0.1337890625, 0.179443359375, 0.22509765625, 0.270751953125, 0.31640625, 0.362060546875, 0.40771484375, 0.453369140625, 0.4990234375, 0.544677734375, 0.59033203125, 0.635986328125, 0.681640625, 0.727294921875, 0.77294921875, 0.818603515625, 0.8642578125, 0.909912109375, 0.95556640625, 1.001220703125, 1.046875, 1.092529296875, 1.13818359375, 1.183837890625, 1.2294921875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 16.0, 11.0, 18.0, 26.0, 21.0, 22.0, 35.0, 31.0, 42.0, 35.0, 41.0, 55.0, 52.0, 59.0, 68.0, 46.0, 56.0, 43.0, 48.0, 31.0, 34.0, 39.0, 41.0, 17.0, 19.0, 7.0, 11.0, 13.0, 7.0, 5.0, 10.0, 3.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0846405029296875, -1.047210693359375, -1.0097808837890625, -0.97235107421875, -0.9349212646484375, -0.897491455078125, -0.8600616455078125, -0.8226318359375, -0.7852020263671875, -0.747772216796875, -0.7103424072265625, -0.67291259765625, -0.6354827880859375, -0.598052978515625, -0.5606231689453125, -0.523193359375, -0.4857635498046875, -0.448333740234375, -0.4109039306640625, -0.37347412109375, -0.3360443115234375, -0.298614501953125, -0.2611846923828125, -0.2237548828125, -0.1863250732421875, -0.148895263671875, -0.1114654541015625, -0.07403564453125, -0.0366058349609375, 0.000823974609375, 0.0382537841796875, 0.07568359375, 0.1131134033203125, 0.150543212890625, 0.1879730224609375, 0.22540283203125, 0.2628326416015625, 0.300262451171875, 0.3376922607421875, 0.3751220703125, 0.4125518798828125, 0.449981689453125, 0.4874114990234375, 0.52484130859375, 0.5622711181640625, 0.599700927734375, 0.6371307373046875, 0.674560546875, 0.7119903564453125, 0.749420166015625, 0.7868499755859375, 0.82427978515625, 0.8617095947265625, 0.899139404296875, 0.9365692138671875, 0.9739990234375, 1.0114288330078125, 1.048858642578125, 1.0862884521484375, 1.12371826171875, 1.1611480712890625, 1.198577880859375, 1.2360076904296875, 1.2734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 7.0, 15.0, 9.0, 15.0, 26.0, 41.0, 52.0, 69.0, 119.0, 166.0, 306.0, 631.0, 1410.0, 4793.0, 29436.0, 744288.0, 3313587.0, 85640.0, 9419.0, 2329.0, 840.0, 376.0, 212.0, 138.0, 78.0, 64.0, 50.0, 38.0, 36.0, 18.0, 11.0, 9.0, 9.0, 9.0, 8.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.1953125, -2.120147705078125, -2.04498291015625, -1.969818115234375, -1.8946533203125, -1.819488525390625, -1.74432373046875, -1.669158935546875, -1.593994140625, -1.518829345703125, -1.44366455078125, -1.368499755859375, -1.2933349609375, -1.218170166015625, -1.14300537109375, -1.067840576171875, -0.99267578125, -0.917510986328125, -0.84234619140625, -0.767181396484375, -0.6920166015625, -0.616851806640625, -0.54168701171875, -0.466522216796875, -0.391357421875, -0.316192626953125, -0.24102783203125, -0.165863037109375, -0.0906982421875, -0.015533447265625, 0.05963134765625, 0.134796142578125, 0.2099609375, 0.285125732421875, 0.36029052734375, 0.435455322265625, 0.5106201171875, 0.585784912109375, 0.66094970703125, 0.736114501953125, 0.811279296875, 0.886444091796875, 0.96160888671875, 1.036773681640625, 1.1119384765625, 1.187103271484375, 1.26226806640625, 1.337432861328125, 1.41259765625, 1.487762451171875, 1.56292724609375, 1.638092041015625, 1.7132568359375, 1.788421630859375, 1.86358642578125, 1.938751220703125, 2.013916015625, 2.089080810546875, 2.16424560546875, 2.239410400390625, 2.3145751953125, 2.389739990234375, 2.46490478515625, 2.540069580078125, 2.615234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 9.0, 12.0, 10.0, 21.0, 28.0, 29.0, 43.0, 42.0, 63.0, 94.0, 148.0, 204.0, 332.0, 426.0, 495.0, 517.0, 438.0, 329.0, 273.0, 153.0, 99.0, 68.0, 55.0, 42.0, 23.0, 25.0, 16.0, 9.0, 16.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.4384193420410156, -0.42517852783203125, -0.4119377136230469, -0.3986968994140625, -0.3854560852050781, -0.37221527099609375, -0.3589744567871094, -0.345733642578125, -0.3324928283691406, -0.31925201416015625, -0.3060111999511719, -0.2927703857421875, -0.2795295715332031, -0.26628875732421875, -0.2530479431152344, -0.23980712890625, -0.22656631469726562, -0.21332550048828125, -0.20008468627929688, -0.1868438720703125, -0.17360305786132812, -0.16036224365234375, -0.14712142944335938, -0.133880615234375, -0.12063980102539062, -0.10739898681640625, -0.09415817260742188, -0.0809173583984375, -0.06767654418945312, -0.05443572998046875, -0.041194915771484375, -0.0279541015625, -0.014713287353515625, -0.00147247314453125, 0.011768341064453125, 0.0250091552734375, 0.038249969482421875, 0.05149078369140625, 0.06473159790039062, 0.077972412109375, 0.09121322631835938, 0.10445404052734375, 0.11769485473632812, 0.1309356689453125, 0.14417648315429688, 0.15741729736328125, 0.17065811157226562, 0.18389892578125, 0.19713973999023438, 0.21038055419921875, 0.22362136840820312, 0.2368621826171875, 0.2501029968261719, 0.26334381103515625, 0.2765846252441406, 0.289825439453125, 0.3030662536621094, 0.31630706787109375, 0.3295478820800781, 0.3427886962890625, 0.3560295104980469, 0.36927032470703125, 0.3825111389160156, 0.395751953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 20.0, 23.0, 35.0, 43.0, 73.0, 94.0, 101.0, 125.0, 135.0, 98.0, 78.0, 56.0, 39.0, 25.0, 16.0, 12.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3336222171783447, -2.2580389976501465, -2.1824557781219482, -2.10687255859375, -2.031289577484131, -1.955706238746643, -1.8801231384277344, -1.8045399188995361, -1.728956699371338, -1.6533734798431396, -1.5777902603149414, -1.5022071599960327, -1.4266239404678345, -1.3510407209396362, -1.2754576206207275, -1.1998744010925293, -1.124291181564331, -1.0487079620361328, -0.9731248021125793, -0.8975416421890259, -0.8219584226608276, -0.7463752031326294, -0.6707920432090759, -0.5952088832855225, -0.5196256637573242, -0.44404247403144836, -0.3684592843055725, -0.29287609457969666, -0.2172929048538208, -0.14170971512794495, -0.06612652540206909, 0.009456634521484375, 0.08504009246826172, 0.16062328219413757, 0.23620647192001343, 0.3117896616458893, 0.38737285137176514, 0.462956041097641, 0.5385392308235168, 0.6141223907470703, 0.6897056102752686, 0.7652888298034668, 0.8408719897270203, 0.9164551496505737, 0.992038369178772, 1.0676215887069702, 1.143204689025879, 1.2187879085540771, 1.2943711280822754, 1.3699543476104736, 1.4455375671386719, 1.5211206674575806, 1.5967038869857788, 1.672287106513977, 1.7478702068328857, 1.823453426361084, 1.8990366458892822, 1.9746198654174805, 2.0502030849456787, 2.125786304473877, 2.201369285583496, 2.2769525051116943, 2.3525357246398926, 2.428118944168091, 2.503702163696289]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 4.0, 13.0, 19.0, 15.0, 20.0, 21.0, 26.0, 35.0, 25.0, 36.0, 37.0, 38.0, 42.0, 39.0, 41.0, 57.0, 43.0, 49.0, 44.0, 51.0, 46.0, 41.0, 36.0, 27.0, 27.0, 28.0, 25.0, 17.0, 13.0, 13.0, 4.0, 7.0, 11.0, 5.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.130346655845642, -1.093722939491272, -1.0570991039276123, -1.0204753875732422, -0.9838516712188721, -0.9472278952598572, -0.9106041193008423, -0.8739804029464722, -0.8373566269874573, -0.8007328510284424, -0.7641091346740723, -0.7274853587150574, -0.6908615827560425, -0.6542378664016724, -0.6176140904426575, -0.5809903144836426, -0.5443665981292725, -0.5077428221702576, -0.47111910581588745, -0.43449532985687256, -0.39787158370018005, -0.36124783754348755, -0.32462406158447266, -0.28800031542778015, -0.25137656927108765, -0.21475282311439514, -0.17812906205654144, -0.14150530099868774, -0.10488155484199524, -0.06825780868530273, -0.031634047627449036, 0.004989713430404663, 0.04161334037780762, 0.07823709398508072, 0.11486084759235382, 0.15148460865020752, 0.18810835480690002, 0.22473210096359253, 0.2613558769226074, 0.2979796230792999, 0.33460336923599243, 0.37122711539268494, 0.40785086154937744, 0.44447463750839233, 0.48109838366508484, 0.5177221298217773, 0.5543459057807922, 0.5909696817398071, 0.6275933980941772, 0.6642171740531921, 0.7008408904075623, 0.7374646663665771, 0.7740883827209473, 0.8107121586799622, 0.847335934638977, 0.8839596509933472, 0.9205834269523621, 0.957207202911377, 0.9938309192657471, 1.0304546356201172, 1.0670784711837769, 1.103702187538147, 1.140325903892517, 1.1769497394561768, 1.2135734558105469]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 14.0, 11.0, 20.0, 29.0, 51.0, 84.0, 97.0, 155.0, 237.0, 417.0, 640.0, 1137.0, 1949.0, 3824.0, 7274.0, 14821.0, 31996.0, 72921.0, 164020.0, 285878.0, 243800.0, 119427.0, 52732.0, 23576.0, 10899.0, 5572.0, 2964.0, 1659.0, 867.0, 485.0, 323.0, 199.0, 142.0, 101.0, 55.0, 38.0, 31.0, 26.0, 15.0, 17.0, 11.0, 2.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.19634056091308594, -0.19016647338867188, -0.1839923858642578, -0.17781829833984375, -0.1716442108154297, -0.16547012329101562, -0.15929603576660156, -0.1531219482421875, -0.14694786071777344, -0.14077377319335938, -0.1345996856689453, -0.12842559814453125, -0.12225151062011719, -0.11607742309570312, -0.10990333557128906, -0.103729248046875, -0.09755516052246094, -0.09138107299804688, -0.08520698547363281, -0.07903289794921875, -0.07285881042480469, -0.06668472290039062, -0.06051063537597656, -0.0543365478515625, -0.04816246032714844, -0.041988372802734375, -0.03581428527832031, -0.02964019775390625, -0.023466110229492188, -0.017292022705078125, -0.011117935180664062, -0.00494384765625, 0.0012302398681640625, 0.007404327392578125, 0.013578414916992188, 0.01975250244140625, 0.025926589965820312, 0.032100677490234375, 0.03827476501464844, 0.0444488525390625, 0.05062294006347656, 0.056797027587890625, 0.06297111511230469, 0.06914520263671875, 0.07531929016113281, 0.08149337768554688, 0.08766746520996094, 0.093841552734375, 0.10001564025878906, 0.10618972778320312, 0.11236381530761719, 0.11853790283203125, 0.12471199035644531, 0.13088607788085938, 0.13706016540527344, 0.1432342529296875, 0.14940834045410156, 0.15558242797851562, 0.1617565155029297, 0.16793060302734375, 0.1741046905517578, 0.18027877807617188, 0.18645286560058594, 0.192626953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 5.0, 7.0, 13.0, 11.0, 17.0, 26.0, 21.0, 27.0, 33.0, 35.0, 39.0, 41.0, 48.0, 48.0, 60.0, 56.0, 46.0, 53.0, 59.0, 56.0, 42.0, 33.0, 38.0, 33.0, 25.0, 22.0, 27.0, 15.0, 7.0, 6.0, 11.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6525802612304688, -0.6264495849609375, -0.6003189086914062, -0.574188232421875, -0.5480575561523438, -0.5219268798828125, -0.49579620361328125, -0.46966552734375, -0.44353485107421875, -0.4174041748046875, -0.39127349853515625, -0.365142822265625, -0.33901214599609375, -0.3128814697265625, -0.28675079345703125, -0.2606201171875, -0.23448944091796875, -0.2083587646484375, -0.18222808837890625, -0.156097412109375, -0.12996673583984375, -0.1038360595703125, -0.07770538330078125, -0.05157470703125, -0.02544403076171875, 0.0006866455078125, 0.02681732177734375, 0.052947998046875, 0.07907867431640625, 0.1052093505859375, 0.13134002685546875, 0.157470703125, 0.18360137939453125, 0.2097320556640625, 0.23586273193359375, 0.261993408203125, 0.28812408447265625, 0.3142547607421875, 0.34038543701171875, 0.36651611328125, 0.39264678955078125, 0.4187774658203125, 0.44490814208984375, 0.471038818359375, 0.49716949462890625, 0.5233001708984375, 0.5494308471679688, 0.5755615234375, 0.6016921997070312, 0.6278228759765625, 0.6539535522460938, 0.680084228515625, 0.7062149047851562, 0.7323455810546875, 0.7584762573242188, 0.78460693359375, 0.8107376098632812, 0.8368682861328125, 0.8629989624023438, 0.889129638671875, 0.9152603149414062, 0.9413909912109375, 0.9675216674804688, 0.99365234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 11.0, 23.0, 32.0, 53.0, 105.0, 184.0, 292.0, 476.0, 865.0, 1946.0, 4544.0, 12581.0, 38918.0, 126202.0, 331036.0, 338264.0, 130951.0, 40239.0, 13015.0, 4716.0, 1940.0, 933.0, 486.0, 259.0, 170.0, 99.0, 80.0, 36.0, 22.0, 24.0, 8.0, 3.0, 9.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.244873046875, -0.23613357543945312, -0.22739410400390625, -0.21865463256835938, -0.2099151611328125, -0.20117568969726562, -0.19243621826171875, -0.18369674682617188, -0.174957275390625, -0.16621780395507812, -0.15747833251953125, -0.14873886108398438, -0.1399993896484375, -0.13125991821289062, -0.12252044677734375, -0.11378097534179688, -0.10504150390625, -0.09630203247070312, -0.08756256103515625, -0.07882308959960938, -0.0700836181640625, -0.061344146728515625, -0.05260467529296875, -0.043865203857421875, -0.035125732421875, -0.026386260986328125, -0.01764678955078125, -0.008907318115234375, -0.0001678466796875, 0.008571624755859375, 0.01731109619140625, 0.026050567626953125, 0.0347900390625, 0.043529510498046875, 0.05226898193359375, 0.061008453369140625, 0.0697479248046875, 0.07848739624023438, 0.08722686767578125, 0.09596633911132812, 0.104705810546875, 0.11344528198242188, 0.12218475341796875, 0.13092422485351562, 0.1396636962890625, 0.14840316772460938, 0.15714263916015625, 0.16588211059570312, 0.17462158203125, 0.18336105346679688, 0.19210052490234375, 0.20083999633789062, 0.2095794677734375, 0.21831893920898438, 0.22705841064453125, 0.23579788208007812, 0.244537353515625, 0.2532768249511719, 0.26201629638671875, 0.2707557678222656, 0.2794952392578125, 0.2882347106933594, 0.29697418212890625, 0.3057136535644531, 0.314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 5.0, 14.0, 14.0, 17.0, 18.0, 21.0, 24.0, 24.0, 36.0, 43.0, 48.0, 53.0, 51.0, 55.0, 65.0, 66.0, 49.0, 52.0, 50.0, 55.0, 33.0, 35.0, 22.0, 21.0, 25.0, 21.0, 11.0, 18.0, 10.0, 13.0, 8.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.080078125, -2.0226593017578125, -1.965240478515625, -1.9078216552734375, -1.85040283203125, -1.7929840087890625, -1.735565185546875, -1.6781463623046875, -1.6207275390625, -1.5633087158203125, -1.505889892578125, -1.4484710693359375, -1.39105224609375, -1.3336334228515625, -1.276214599609375, -1.2187957763671875, -1.161376953125, -1.1039581298828125, -1.046539306640625, -0.9891204833984375, -0.93170166015625, -0.8742828369140625, -0.816864013671875, -0.7594451904296875, -0.7020263671875, -0.6446075439453125, -0.587188720703125, -0.5297698974609375, -0.47235107421875, -0.4149322509765625, -0.357513427734375, -0.3000946044921875, -0.24267578125, -0.1852569580078125, -0.127838134765625, -0.0704193115234375, -0.01300048828125, 0.0444183349609375, 0.101837158203125, 0.1592559814453125, 0.2166748046875, 0.2740936279296875, 0.331512451171875, 0.3889312744140625, 0.44635009765625, 0.5037689208984375, 0.561187744140625, 0.6186065673828125, 0.676025390625, 0.7334442138671875, 0.790863037109375, 0.8482818603515625, 0.90570068359375, 0.9631195068359375, 1.020538330078125, 1.0779571533203125, 1.1353759765625, 1.1927947998046875, 1.250213623046875, 1.3076324462890625, 1.36505126953125, 1.4224700927734375, 1.479888916015625, 1.5373077392578125, 1.5947265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 10.0, 13.0, 18.0, 36.0, 47.0, 69.0, 103.0, 162.0, 285.0, 501.0, 940.0, 2034.0, 4681.0, 13961.0, 61460.0, 334073.0, 485199.0, 110870.0, 22008.0, 6683.0, 2636.0, 1198.0, 616.0, 326.0, 226.0, 122.0, 75.0, 50.0, 39.0, 38.0, 23.0, 14.0, 8.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14208984375, -0.13753128051757812, -0.13297271728515625, -0.12841415405273438, -0.1238555908203125, -0.11929702758789062, -0.11473846435546875, -0.11017990112304688, -0.105621337890625, -0.10106277465820312, -0.09650421142578125, -0.09194564819335938, -0.0873870849609375, -0.08282852172851562, -0.07826995849609375, -0.07371139526367188, -0.06915283203125, -0.06459426879882812, -0.06003570556640625, -0.055477142333984375, -0.0509185791015625, -0.046360015869140625, -0.04180145263671875, -0.037242889404296875, -0.032684326171875, -0.028125762939453125, -0.02356719970703125, -0.019008636474609375, -0.0144500732421875, -0.009891510009765625, -0.00533294677734375, -0.000774383544921875, 0.0037841796875, 0.008342742919921875, 0.01290130615234375, 0.017459869384765625, 0.0220184326171875, 0.026576995849609375, 0.03113555908203125, 0.035694122314453125, 0.040252685546875, 0.044811248779296875, 0.04936981201171875, 0.053928375244140625, 0.0584869384765625, 0.06304550170898438, 0.06760406494140625, 0.07216262817382812, 0.07672119140625, 0.08127975463867188, 0.08583831787109375, 0.09039688110351562, 0.0949554443359375, 0.09951400756835938, 0.10407257080078125, 0.10863113403320312, 0.113189697265625, 0.11774826049804688, 0.12230682373046875, 0.12686538696289062, 0.1314239501953125, 0.13598251342773438, 0.14054107666015625, 0.14509963989257812, 0.149658203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 7.0, 14.0, 16.0, 27.0, 43.0, 64.0, 72.0, 96.0, 97.0, 125.0, 117.0, 98.0, 66.0, 56.0, 34.0, 18.0, 12.0, 10.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87973403930664e-05, -7.68834725022316e-05, -7.496960461139679e-05, -7.305573672056198e-05, -7.114186882972717e-05, -6.922800093889236e-05, -6.731413304805756e-05, -6.540026515722275e-05, -6.348639726638794e-05, -6.157252937555313e-05, -5.965866148471832e-05, -5.7744793593883514e-05, -5.5830925703048706e-05, -5.39170578122139e-05, -5.200318992137909e-05, -5.008932203054428e-05, -4.817545413970947e-05, -4.6261586248874664e-05, -4.4347718358039856e-05, -4.243385046720505e-05, -4.051998257637024e-05, -3.860611468553543e-05, -3.669224679470062e-05, -3.4778378903865814e-05, -3.2864511013031006e-05, -3.09506431221962e-05, -2.903677523136139e-05, -2.712290734052658e-05, -2.5209039449691772e-05, -2.3295171558856964e-05, -2.1381303668022156e-05, -1.9467435777187347e-05, -1.755356788635254e-05, -1.563969999551773e-05, -1.3725832104682922e-05, -1.1811964213848114e-05, -9.898096323013306e-06, -7.984228432178497e-06, -6.070360541343689e-06, -4.156492650508881e-06, -2.2426247596740723e-06, -3.287568688392639e-07, 1.5851110219955444e-06, 3.4989789128303528e-06, 5.412846803665161e-06, 7.3267146944999695e-06, 9.240582585334778e-06, 1.1154450476169586e-05, 1.3068318367004395e-05, 1.4982186257839203e-05, 1.689605414867401e-05, 1.880992203950882e-05, 2.0723789930343628e-05, 2.2637657821178436e-05, 2.4551525712013245e-05, 2.6465393602848053e-05, 2.837926149368286e-05, 3.029312938451767e-05, 3.220699727535248e-05, 3.4120865166187286e-05, 3.6034733057022095e-05, 3.79486009478569e-05, 3.986246883869171e-05, 4.177633672952652e-05, 4.369020462036133e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 0.0, 6.0, 4.0, 13.0, 9.0, 11.0, 9.0, 11.0, 19.0, 22.0, 36.0, 67.0, 95.0, 143.0, 262.0, 616.0, 1472.0, 5574.0, 27218.0, 191105.0, 627930.0, 162501.0, 23734.0, 4973.0, 1439.0, 588.0, 287.0, 155.0, 72.0, 60.0, 37.0, 18.0, 19.0, 16.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2294921875, -0.22336578369140625, -0.2172393798828125, -0.21111297607421875, -0.204986572265625, -0.19886016845703125, -0.1927337646484375, -0.18660736083984375, -0.18048095703125, -0.17435455322265625, -0.1682281494140625, -0.16210174560546875, -0.155975341796875, -0.14984893798828125, -0.1437225341796875, -0.13759613037109375, -0.1314697265625, -0.12534332275390625, -0.1192169189453125, -0.11309051513671875, -0.106964111328125, -0.10083770751953125, -0.0947113037109375, -0.08858489990234375, -0.08245849609375, -0.07633209228515625, -0.0702056884765625, -0.06407928466796875, -0.057952880859375, -0.05182647705078125, -0.0457000732421875, -0.03957366943359375, -0.033447265625, -0.02732086181640625, -0.0211944580078125, -0.01506805419921875, -0.008941650390625, -0.00281524658203125, 0.0033111572265625, 0.00943756103515625, 0.01556396484375, 0.02169036865234375, 0.0278167724609375, 0.03394317626953125, 0.040069580078125, 0.04619598388671875, 0.0523223876953125, 0.05844879150390625, 0.0645751953125, 0.07070159912109375, 0.0768280029296875, 0.08295440673828125, 0.089080810546875, 0.09520721435546875, 0.1013336181640625, 0.10746002197265625, 0.11358642578125, 0.11971282958984375, 0.1258392333984375, 0.13196563720703125, 0.138092041015625, 0.14421844482421875, 0.1503448486328125, 0.15647125244140625, 0.16259765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 11.0, 7.0, 13.0, 14.0, 16.0, 25.0, 26.0, 50.0, 40.0, 68.0, 56.0, 80.0, 82.0, 80.0, 87.0, 71.0, 66.0, 35.0, 40.0, 25.0, 20.0, 25.0, 13.0, 8.0, 8.0, 5.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0304107666015625, -0.02928328514099121, -0.028155803680419922, -0.027028322219848633, -0.025900840759277344, -0.024773359298706055, -0.023645877838134766, -0.022518396377563477, -0.021390914916992188, -0.0202634334564209, -0.01913595199584961, -0.01800847053527832, -0.01688098907470703, -0.015753507614135742, -0.014626026153564453, -0.013498544692993164, -0.012371063232421875, -0.011243581771850586, -0.010116100311279297, -0.008988618850708008, -0.007861137390136719, -0.00673365592956543, -0.005606174468994141, -0.0044786930084228516, -0.0033512115478515625, -0.0022237300872802734, -0.0010962486267089844, 3.123283386230469e-05, 0.0011587142944335938, 0.002286195755004883, 0.003413677215576172, 0.004541158676147461, 0.00566864013671875, 0.006796121597290039, 0.007923603057861328, 0.009051084518432617, 0.010178565979003906, 0.011306047439575195, 0.012433528900146484, 0.013561010360717773, 0.014688491821289062, 0.01581597328186035, 0.01694345474243164, 0.01807093620300293, 0.01919841766357422, 0.020325899124145508, 0.021453380584716797, 0.022580862045288086, 0.023708343505859375, 0.024835824966430664, 0.025963306427001953, 0.027090787887573242, 0.02821826934814453, 0.02934575080871582, 0.03047323226928711, 0.0316007137298584, 0.03272819519042969, 0.03385567665100098, 0.034983158111572266, 0.036110639572143555, 0.037238121032714844, 0.03836560249328613, 0.03949308395385742, 0.04062056541442871, 0.041748046875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 14.0, 29.0, 40.0, 90.0, 127.0, 170.0, 199.0, 122.0, 91.0, 49.0, 30.0, 15.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.035905599594116, -1.9725351333618164, -1.9091647863388062, -1.8457943201065063, -1.782423973083496, -1.7190535068511963, -1.6556830406188965, -1.5923125743865967, -1.5289422273635864, -1.4655717611312866, -1.4022014141082764, -1.3388309478759766, -1.2754604816436768, -1.2120901346206665, -1.1487196683883667, -1.0853493213653564, -1.0219788551330566, -0.9586084485054016, -0.8952380418777466, -0.8318675756454468, -0.7684971690177917, -0.7051267623901367, -0.6417562961578369, -0.5783858895301819, -0.5150154829025269, -0.4516450762748718, -0.3882746398448944, -0.324904203414917, -0.26153379678726196, -0.19816339015960693, -0.13479295372962952, -0.0714225172996521, -0.00805211067199707, 0.05531831085681915, 0.11868873238563538, 0.1820591539144516, 0.24542957544326782, 0.30879998207092285, 0.37217041850090027, 0.4355408549308777, 0.4989112615585327, 0.5622816681861877, 0.6256520748138428, 0.6890225410461426, 0.7523929476737976, 0.8157633543014526, 0.8791338205337524, 0.9425042271614075, 1.0058746337890625, 1.0692451000213623, 1.1326154470443726, 1.1959859132766724, 1.2593562602996826, 1.3227267265319824, 1.3860971927642822, 1.449467658996582, 1.5128380060195923, 1.576208472251892, 1.6395788192749023, 1.7029492855072021, 1.766319751739502, 1.8296900987625122, 1.893060564994812, 1.9564309120178223, 2.019801378250122]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 7.0, 8.0, 12.0, 17.0, 10.0, 15.0, 21.0, 30.0, 33.0, 37.0, 34.0, 38.0, 54.0, 45.0, 48.0, 51.0, 66.0, 46.0, 55.0, 55.0, 45.0, 48.0, 29.0, 24.0, 39.0, 26.0, 13.0, 18.0, 16.0, 4.0, 8.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6306495070457458, -0.6057257056236267, -0.5808018445968628, -0.5558780431747437, -0.5309542417526245, -0.5060304403305054, -0.48110657930374146, -0.4561827778816223, -0.4312589466571808, -0.40633511543273926, -0.3814113140106201, -0.3564874827861786, -0.33156365156173706, -0.3066398501396179, -0.2817160189151764, -0.25679218769073486, -0.23186838626861572, -0.2069445699453354, -0.18202075362205505, -0.15709692239761353, -0.1321731060743332, -0.10724928975105286, -0.08232545852661133, -0.057401642203330994, -0.03247782588005066, -0.007554005831480026, 0.017369814217090607, 0.04229363799095154, 0.06721745431423187, 0.09214127063751221, 0.11706510186195374, 0.14198891818523407, 0.1669127345085144, 0.19183655083179474, 0.21676036715507507, 0.2416841983795166, 0.26660799980163574, 0.29153183102607727, 0.3164556622505188, 0.34137946367263794, 0.36630329489707947, 0.391227126121521, 0.41615092754364014, 0.44107475876808167, 0.4659985899925232, 0.49092239141464233, 0.5158462524414062, 0.5407700538635254, 0.5656938552856445, 0.5906176567077637, 0.6155415177345276, 0.6404653191566467, 0.6653891205787659, 0.6903129816055298, 0.7152367830276489, 0.7401605844497681, 0.7650843858718872, 0.7900081872940063, 0.8149320483207703, 0.8398558497428894, 0.8647796511650085, 0.8897035121917725, 0.9146273136138916, 0.9395511150360107, 0.9644749760627747]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 9.0, 6.0, 22.0, 22.0, 39.0, 46.0, 84.0, 123.0, 219.0, 474.0, 877.0, 1762.0, 4290.0, 11457.0, 36329.0, 143029.0, 517698.0, 247705.0, 56627.0, 16903.0, 5923.0, 2484.0, 1146.0, 557.0, 254.0, 188.0, 117.0, 57.0, 39.0, 20.0, 15.0, 11.0, 12.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0107421875, -0.9858932495117188, -0.9610443115234375, -0.9361953735351562, -0.911346435546875, -0.8864974975585938, -0.8616485595703125, -0.8367996215820312, -0.81195068359375, -0.7871017456054688, -0.7622528076171875, -0.7374038696289062, -0.712554931640625, -0.6877059936523438, -0.6628570556640625, -0.6380081176757812, -0.6131591796875, -0.5883102416992188, -0.5634613037109375, -0.5386123657226562, -0.513763427734375, -0.48891448974609375, -0.4640655517578125, -0.43921661376953125, -0.41436767578125, -0.38951873779296875, -0.3646697998046875, -0.33982086181640625, -0.314971923828125, -0.29012298583984375, -0.2652740478515625, -0.24042510986328125, -0.215576171875, -0.19072723388671875, -0.1658782958984375, -0.14102935791015625, -0.116180419921875, -0.09133148193359375, -0.0664825439453125, -0.04163360595703125, -0.01678466796875, 0.00806427001953125, 0.0329132080078125, 0.05776214599609375, 0.082611083984375, 0.10746002197265625, 0.1323089599609375, 0.15715789794921875, 0.1820068359375, 0.20685577392578125, 0.2317047119140625, 0.25655364990234375, 0.281402587890625, 0.30625152587890625, 0.3311004638671875, 0.35594940185546875, 0.38079833984375, 0.40564727783203125, 0.4304962158203125, 0.45534515380859375, 0.480194091796875, 0.5050430297851562, 0.5298919677734375, 0.5547409057617188, 0.57958984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 12.0, 18.0, 14.0, 23.0, 28.0, 42.0, 47.0, 50.0, 46.0, 66.0, 57.0, 70.0, 67.0, 54.0, 68.0, 66.0, 48.0, 48.0, 25.0, 19.0, 32.0, 16.0, 18.0, 9.0, 6.0, 8.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2624053955078125, -1.199615478515625, -1.1368255615234375, -1.07403564453125, -1.0112457275390625, -0.948455810546875, -0.8856658935546875, -0.8228759765625, -0.7600860595703125, -0.697296142578125, -0.6345062255859375, -0.57171630859375, -0.5089263916015625, -0.446136474609375, -0.3833465576171875, -0.320556640625, -0.2577667236328125, -0.194976806640625, -0.1321868896484375, -0.06939697265625, -0.0066070556640625, 0.056182861328125, 0.1189727783203125, 0.1817626953125, 0.2445526123046875, 0.307342529296875, 0.3701324462890625, 0.43292236328125, 0.4957122802734375, 0.558502197265625, 0.6212921142578125, 0.68408203125, 0.7468719482421875, 0.809661865234375, 0.8724517822265625, 0.93524169921875, 0.9980316162109375, 1.060821533203125, 1.1236114501953125, 1.1864013671875, 1.2491912841796875, 1.311981201171875, 1.3747711181640625, 1.43756103515625, 1.5003509521484375, 1.563140869140625, 1.6259307861328125, 1.688720703125, 1.7515106201171875, 1.814300537109375, 1.8770904541015625, 1.93988037109375, 2.0026702880859375, 2.065460205078125, 2.1282501220703125, 2.1910400390625, 2.2538299560546875, 2.316619873046875, 2.3794097900390625, 2.44219970703125, 2.5049896240234375, 2.567779541015625, 2.6305694580078125, 2.693359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 8.0, 3.0, 9.0, 8.0, 9.0, 23.0, 26.0, 36.0, 64.0, 74.0, 84.0, 151.0, 241.0, 465.0, 1097.0, 7606.0, 199562.0, 805890.0, 29121.0, 2409.0, 695.0, 325.0, 224.0, 117.0, 78.0, 58.0, 48.0, 25.0, 18.0, 17.0, 13.0, 15.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8480682373046875, -1.788909912109375, -1.7297515869140625, -1.67059326171875, -1.6114349365234375, -1.552276611328125, -1.4931182861328125, -1.4339599609375, -1.3748016357421875, -1.315643310546875, -1.2564849853515625, -1.19732666015625, -1.1381683349609375, -1.079010009765625, -1.0198516845703125, -0.960693359375, -0.9015350341796875, -0.842376708984375, -0.7832183837890625, -0.72406005859375, -0.6649017333984375, -0.605743408203125, -0.5465850830078125, -0.4874267578125, -0.4282684326171875, -0.369110107421875, -0.3099517822265625, -0.25079345703125, -0.1916351318359375, -0.132476806640625, -0.0733184814453125, -0.01416015625, 0.0449981689453125, 0.104156494140625, 0.1633148193359375, 0.22247314453125, 0.2816314697265625, 0.340789794921875, 0.3999481201171875, 0.4591064453125, 0.5182647705078125, 0.577423095703125, 0.6365814208984375, 0.69573974609375, 0.7548980712890625, 0.814056396484375, 0.8732147216796875, 0.932373046875, 0.9915313720703125, 1.050689697265625, 1.1098480224609375, 1.16900634765625, 1.2281646728515625, 1.287322998046875, 1.3464813232421875, 1.4056396484375, 1.4647979736328125, 1.523956298828125, 1.5831146240234375, 1.64227294921875, 1.7014312744140625, 1.760589599609375, 1.8197479248046875, 1.87890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 3.0, 6.0, 5.0, 7.0, 17.0, 16.0, 24.0, 16.0, 26.0, 31.0, 24.0, 28.0, 27.0, 40.0, 37.0, 47.0, 54.0, 45.0, 39.0, 38.0, 50.0, 48.0, 47.0, 40.0, 28.0, 32.0, 31.0, 30.0, 34.0, 18.0, 13.0, 15.0, 11.0, 7.0, 12.0, 10.0, 6.0, 12.0, 2.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6767578125, -1.624114990234375, -1.57147216796875, -1.518829345703125, -1.4661865234375, -1.413543701171875, -1.36090087890625, -1.308258056640625, -1.255615234375, -1.202972412109375, -1.15032958984375, -1.097686767578125, -1.0450439453125, -0.992401123046875, -0.93975830078125, -0.887115478515625, -0.83447265625, -0.781829833984375, -0.72918701171875, -0.676544189453125, -0.6239013671875, -0.571258544921875, -0.51861572265625, -0.465972900390625, -0.413330078125, -0.360687255859375, -0.30804443359375, -0.255401611328125, -0.2027587890625, -0.150115966796875, -0.09747314453125, -0.044830322265625, 0.0078125, 0.060455322265625, 0.11309814453125, 0.165740966796875, 0.2183837890625, 0.271026611328125, 0.32366943359375, 0.376312255859375, 0.428955078125, 0.481597900390625, 0.53424072265625, 0.586883544921875, 0.6395263671875, 0.692169189453125, 0.74481201171875, 0.797454833984375, 0.85009765625, 0.902740478515625, 0.95538330078125, 1.008026123046875, 1.0606689453125, 1.113311767578125, 1.16595458984375, 1.218597412109375, 1.271240234375, 1.323883056640625, 1.37652587890625, 1.429168701171875, 1.4818115234375, 1.534454345703125, 1.58709716796875, 1.639739990234375, 1.6923828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 0.0, 9.0, 11.0, 17.0, 28.0, 49.0, 59.0, 123.0, 254.0, 813.0, 3290.0, 41345.0, 904692.0, 91334.0, 4793.0, 994.0, 351.0, 141.0, 84.0, 50.0, 30.0, 19.0, 15.0, 13.0, 12.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.66546630859375, -0.6444091796875, -0.62335205078125, -0.602294921875, -0.58123779296875, -0.5601806640625, -0.53912353515625, -0.51806640625, -0.49700927734375, -0.4759521484375, -0.45489501953125, -0.433837890625, -0.41278076171875, -0.3917236328125, -0.37066650390625, -0.349609375, -0.32855224609375, -0.3074951171875, -0.28643798828125, -0.265380859375, -0.24432373046875, -0.2232666015625, -0.20220947265625, -0.18115234375, -0.16009521484375, -0.1390380859375, -0.11798095703125, -0.096923828125, -0.07586669921875, -0.0548095703125, -0.03375244140625, -0.0126953125, 0.00836181640625, 0.0294189453125, 0.05047607421875, 0.071533203125, 0.09259033203125, 0.1136474609375, 0.13470458984375, 0.15576171875, 0.17681884765625, 0.1978759765625, 0.21893310546875, 0.239990234375, 0.26104736328125, 0.2821044921875, 0.30316162109375, 0.32421875, 0.34527587890625, 0.3663330078125, 0.38739013671875, 0.408447265625, 0.42950439453125, 0.4505615234375, 0.47161865234375, 0.49267578125, 0.51373291015625, 0.5347900390625, 0.55584716796875, 0.576904296875, 0.59796142578125, 0.6190185546875, 0.64007568359375, 0.6611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 19.0, 12.0, 30.0, 41.0, 60.0, 96.0, 170.0, 167.0, 156.0, 87.0, 61.0, 35.0, 23.0, 16.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011008977890014648, -0.00010776985436677933, -0.00010544992983341217, -0.00010313000530004501, -0.00010081008076667786, -9.84901562333107e-05, -9.617023169994354e-05, -9.385030716657639e-05, -9.153038263320923e-05, -8.921045809984207e-05, -8.689053356647491e-05, -8.457060903310776e-05, -8.22506844997406e-05, -7.993075996637344e-05, -7.761083543300629e-05, -7.529091089963913e-05, -7.297098636627197e-05, -7.065106183290482e-05, -6.833113729953766e-05, -6.60112127661705e-05, -6.369128823280334e-05, -6.137136369943619e-05, -5.905143916606903e-05, -5.6731514632701874e-05, -5.441159009933472e-05, -5.209166556596756e-05, -4.97717410326004e-05, -4.7451816499233246e-05, -4.513189196586609e-05, -4.281196743249893e-05, -4.0492042899131775e-05, -3.817211836576462e-05, -3.585219383239746e-05, -3.3532269299030304e-05, -3.121234476566315e-05, -2.889242023229599e-05, -2.6572495698928833e-05, -2.4252571165561676e-05, -2.193264663219452e-05, -1.9612722098827362e-05, -1.7292797565460205e-05, -1.4972873032093048e-05, -1.2652948498725891e-05, -1.0333023965358734e-05, -8.013099431991577e-06, -5.69317489862442e-06, -3.373250365257263e-06, -1.0533258318901062e-06, 1.2665987014770508e-06, 3.5865232348442078e-06, 5.906447768211365e-06, 8.226372301578522e-06, 1.0546296834945679e-05, 1.2866221368312836e-05, 1.5186145901679993e-05, 1.750607043504715e-05, 1.9825994968414307e-05, 2.2145919501781464e-05, 2.446584403514862e-05, 2.6785768568515778e-05, 2.9105693101882935e-05, 3.142561763525009e-05, 3.374554216861725e-05, 3.6065466701984406e-05, 3.838539123535156e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 18.0, 17.0, 41.0, 59.0, 175.0, 406.0, 1774.0, 11633.0, 874560.0, 153671.0, 4651.0, 942.0, 332.0, 123.0, 52.0, 26.0, 16.0, 12.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.099609375, -1.0688934326171875, -1.038177490234375, -1.0074615478515625, -0.97674560546875, -0.9460296630859375, -0.915313720703125, -0.8845977783203125, -0.8538818359375, -0.8231658935546875, -0.792449951171875, -0.7617340087890625, -0.73101806640625, -0.7003021240234375, -0.669586181640625, -0.6388702392578125, -0.608154296875, -0.5774383544921875, -0.546722412109375, -0.5160064697265625, -0.48529052734375, -0.4545745849609375, -0.423858642578125, -0.3931427001953125, -0.3624267578125, -0.3317108154296875, -0.300994873046875, -0.2702789306640625, -0.23956298828125, -0.2088470458984375, -0.178131103515625, -0.1474151611328125, -0.11669921875, -0.0859832763671875, -0.055267333984375, -0.0245513916015625, 0.00616455078125, 0.0368804931640625, 0.067596435546875, 0.0983123779296875, 0.1290283203125, 0.1597442626953125, 0.190460205078125, 0.2211761474609375, 0.25189208984375, 0.2826080322265625, 0.313323974609375, 0.3440399169921875, 0.374755859375, 0.4054718017578125, 0.436187744140625, 0.4669036865234375, 0.49761962890625, 0.5283355712890625, 0.559051513671875, 0.5897674560546875, 0.6204833984375, 0.6511993408203125, 0.681915283203125, 0.7126312255859375, 0.74334716796875, 0.7740631103515625, 0.804779052734375, 0.8354949951171875, 0.8662109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 18.0, 17.0, 31.0, 52.0, 69.0, 91.0, 135.0, 170.0, 128.0, 93.0, 61.0, 42.0, 26.0, 10.0, 21.0, 14.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1864013671875, -0.1796245574951172, -0.17284774780273438, -0.16607093811035156, -0.15929412841796875, -0.15251731872558594, -0.14574050903320312, -0.1389636993408203, -0.1321868896484375, -0.1254100799560547, -0.11863327026367188, -0.11185646057128906, -0.10507965087890625, -0.09830284118652344, -0.09152603149414062, -0.08474922180175781, -0.077972412109375, -0.07119560241699219, -0.06441879272460938, -0.05764198303222656, -0.05086517333984375, -0.04408836364746094, -0.037311553955078125, -0.030534744262695312, -0.0237579345703125, -0.016981124877929688, -0.010204315185546875, -0.0034275054931640625, 0.00334930419921875, 0.010126113891601562, 0.016902923583984375, 0.023679733276367188, 0.03045654296875, 0.03723335266113281, 0.044010162353515625, 0.05078697204589844, 0.05756378173828125, 0.06434059143066406, 0.07111740112304688, 0.07789421081542969, 0.0846710205078125, 0.09144783020019531, 0.09822463989257812, 0.10500144958496094, 0.11177825927734375, 0.11855506896972656, 0.12533187866210938, 0.1321086883544922, 0.138885498046875, 0.1456623077392578, 0.15243911743164062, 0.15921592712402344, 0.16599273681640625, 0.17276954650878906, 0.17954635620117188, 0.1863231658935547, 0.1930999755859375, 0.1998767852783203, 0.20665359497070312, 0.21343040466308594, 0.22020721435546875, 0.22698402404785156, 0.23376083374023438, 0.2405376434326172, 0.247314453125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 25.0, 40.0, 102.0, 220.0, 247.0, 177.0, 99.0, 54.0, 17.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.928035259246826, -7.749937057495117, -7.57183837890625, -7.393740177154541, -7.215641975402832, -7.037543773651123, -6.859445095062256, -6.681346893310547, -6.503248691558838, -6.325150489807129, -6.147051811218262, -5.968953609466553, -5.790855407714844, -5.612757205963135, -5.434658527374268, -5.256560325622559, -5.078461647033691, -4.900363445281982, -4.722264766693115, -4.544166564941406, -4.366068363189697, -4.187970161437988, -4.009871482849121, -3.831773281097412, -3.653675079345703, -3.475576639175415, -3.297478437423706, -3.119379997253418, -2.941281795501709, -2.763183355331421, -2.585084915161133, -2.406986713409424, -2.2288882732391357, -2.0507898330688477, -1.8726916313171387, -1.6945931911468506, -1.5164949893951416, -1.3383965492248535, -1.160298228263855, -0.9821999073028564, -0.8041015863418579, -0.6260032653808594, -0.44790491461753845, -0.26980656385421753, -0.091708242893219, 0.08639007806777954, 0.26448845863342285, 0.4425867795944214, 0.6206851005554199, 0.7987834215164185, 0.976881742477417, 1.154980182647705, 1.333078384399414, 1.5111768245697021, 1.6892751455307007, 1.8673734664916992, 2.045471668243408, 2.2235701084136963, 2.4016683101654053, 2.5797667503356934, 2.7578649520874023, 2.9359633922576904, 3.1140618324279785, 3.2921600341796875, 3.4702584743499756]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 7.0, 4.0, 2.0, 7.0, 8.0, 13.0, 8.0, 13.0, 15.0, 22.0, 19.0, 22.0, 25.0, 24.0, 28.0, 33.0, 39.0, 51.0, 35.0, 64.0, 50.0, 52.0, 47.0, 53.0, 40.0, 33.0, 40.0, 28.0, 35.0, 39.0, 18.0, 28.0, 16.0, 14.0, 14.0, 8.0, 8.0, 10.0, 11.0, 7.0, 1.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5424437522888184, -2.4560534954071045, -2.3696634769439697, -2.283273220062256, -2.196883201599121, -2.1104929447174072, -2.0241029262542725, -1.9377126693725586, -1.8513226509094238, -1.7649325132369995, -1.6785423755645752, -1.5921522378921509, -1.5057621002197266, -1.4193719625473022, -1.332981824874878, -1.246591567993164, -1.1602014303207397, -1.0738112926483154, -0.9874211549758911, -0.9010310173034668, -0.8146408796310425, -0.7282507419586182, -0.6418605446815491, -0.5554704070091248, -0.46908026933670044, -0.3826901316642761, -0.2962999939918518, -0.2099098265171051, -0.12351968884468079, -0.03712955117225647, 0.049260616302490234, 0.13565075397491455, 0.22204089164733887, 0.3084310293197632, 0.3948211669921875, 0.4812113344669342, 0.5676014423370361, 0.6539915800094604, 0.7403817772865295, 0.8267719149589539, 0.9131620526313782, 0.9995521903038025, 1.0859423875808716, 1.172332525253296, 1.2587226629257202, 1.3451128005981445, 1.4315029382705688, 1.5178930759429932, 1.6042832136154175, 1.6906733512878418, 1.7770634889602661, 1.8634536266326904, 1.9498437643051147, 2.036233901977539, 2.122624158859253, 2.2090141773223877, 2.2954044342041016, 2.3817946910858154, 2.46818470954895, 2.554574966430664, 2.640964984893799, 2.7273552417755127, 2.8137452602386475, 2.9001355171203613, 2.986525535583496]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 11.0, 17.0, 34.0, 47.0, 88.0, 142.0, 255.0, 484.0, 1035.0, 2384.0, 6349.0, 23359.0, 125216.0, 945327.0, 2424779.0, 563429.0, 76914.0, 15835.0, 4869.0, 1871.0, 843.0, 397.0, 208.0, 136.0, 81.0, 53.0, 41.0, 19.0, 14.0, 8.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.5118865966796875, -1.465179443359375, -1.4184722900390625, -1.37176513671875, -1.3250579833984375, -1.278350830078125, -1.2316436767578125, -1.1849365234375, -1.1382293701171875, -1.091522216796875, -1.0448150634765625, -0.99810791015625, -0.9514007568359375, -0.904693603515625, -0.8579864501953125, -0.811279296875, -0.7645721435546875, -0.717864990234375, -0.6711578369140625, -0.62445068359375, -0.5777435302734375, -0.531036376953125, -0.4843292236328125, -0.4376220703125, -0.3909149169921875, -0.344207763671875, -0.2975006103515625, -0.25079345703125, -0.2040863037109375, -0.157379150390625, -0.1106719970703125, -0.06396484375, -0.0172576904296875, 0.029449462890625, 0.0761566162109375, 0.12286376953125, 0.1695709228515625, 0.216278076171875, 0.2629852294921875, 0.3096923828125, 0.3563995361328125, 0.403106689453125, 0.4498138427734375, 0.49652099609375, 0.5432281494140625, 0.589935302734375, 0.6366424560546875, 0.683349609375, 0.7300567626953125, 0.776763916015625, 0.8234710693359375, 0.87017822265625, 0.9168853759765625, 0.963592529296875, 1.0102996826171875, 1.0570068359375, 1.1037139892578125, 1.150421142578125, 1.1971282958984375, 1.24383544921875, 1.2905426025390625, 1.337249755859375, 1.3839569091796875, 1.4306640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 7.0, 8.0, 11.0, 21.0, 19.0, 33.0, 36.0, 38.0, 40.0, 41.0, 57.0, 47.0, 60.0, 59.0, 67.0, 49.0, 70.0, 62.0, 37.0, 36.0, 37.0, 29.0, 22.0, 18.0, 17.0, 12.0, 10.0, 8.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1025390625, -1.065948486328125, -1.02935791015625, -0.992767333984375, -0.9561767578125, -0.919586181640625, -0.88299560546875, -0.846405029296875, -0.809814453125, -0.773223876953125, -0.73663330078125, -0.700042724609375, -0.6634521484375, -0.626861572265625, -0.59027099609375, -0.553680419921875, -0.51708984375, -0.480499267578125, -0.44390869140625, -0.407318115234375, -0.3707275390625, -0.334136962890625, -0.29754638671875, -0.260955810546875, -0.224365234375, -0.187774658203125, -0.15118408203125, -0.114593505859375, -0.0780029296875, -0.041412353515625, -0.00482177734375, 0.031768798828125, 0.068359375, 0.104949951171875, 0.14154052734375, 0.178131103515625, 0.2147216796875, 0.251312255859375, 0.28790283203125, 0.324493408203125, 0.361083984375, 0.397674560546875, 0.43426513671875, 0.470855712890625, 0.5074462890625, 0.544036865234375, 0.58062744140625, 0.617218017578125, 0.65380859375, 0.690399169921875, 0.72698974609375, 0.763580322265625, 0.8001708984375, 0.836761474609375, 0.87335205078125, 0.909942626953125, 0.946533203125, 0.983123779296875, 1.01971435546875, 1.056304931640625, 1.0928955078125, 1.129486083984375, 1.16607666015625, 1.202667236328125, 1.2392578125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 6.0, 8.0, 23.0, 27.0, 56.0, 120.0, 185.0, 450.0, 1051.0, 4097.0, 44968.0, 3811728.0, 318932.0, 9568.0, 1853.0, 611.0, 272.0, 140.0, 76.0, 44.0, 17.0, 13.0, 12.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.478240966796875, -3.36859130859375, -3.258941650390625, -3.1492919921875, -3.039642333984375, -2.92999267578125, -2.820343017578125, -2.710693359375, -2.601043701171875, -2.49139404296875, -2.381744384765625, -2.2720947265625, -2.162445068359375, -2.05279541015625, -1.943145751953125, -1.83349609375, -1.723846435546875, -1.61419677734375, -1.504547119140625, -1.3948974609375, -1.285247802734375, -1.17559814453125, -1.065948486328125, -0.956298828125, -0.846649169921875, -0.73699951171875, -0.627349853515625, -0.5177001953125, -0.408050537109375, -0.29840087890625, -0.188751220703125, -0.0791015625, 0.030548095703125, 0.14019775390625, 0.249847412109375, 0.3594970703125, 0.469146728515625, 0.57879638671875, 0.688446044921875, 0.798095703125, 0.907745361328125, 1.01739501953125, 1.127044677734375, 1.2366943359375, 1.346343994140625, 1.45599365234375, 1.565643310546875, 1.67529296875, 1.784942626953125, 1.89459228515625, 2.004241943359375, 2.1138916015625, 2.223541259765625, 2.33319091796875, 2.442840576171875, 2.552490234375, 2.662139892578125, 2.77178955078125, 2.881439208984375, 2.9910888671875, 3.100738525390625, 3.21038818359375, 3.320037841796875, 3.4296875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 7.0, 8.0, 15.0, 14.0, 35.0, 46.0, 102.0, 200.0, 365.0, 650.0, 903.0, 733.0, 471.0, 224.0, 127.0, 75.0, 41.0, 33.0, 13.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.41089630126953125, -0.3877105712890625, -0.36452484130859375, -0.341339111328125, -0.31815338134765625, -0.2949676513671875, -0.27178192138671875, -0.24859619140625, -0.22541046142578125, -0.2022247314453125, -0.17903900146484375, -0.155853271484375, -0.13266754150390625, -0.1094818115234375, -0.08629608154296875, -0.0631103515625, -0.03992462158203125, -0.0167388916015625, 0.00644683837890625, 0.029632568359375, 0.05281829833984375, 0.0760040283203125, 0.09918975830078125, 0.12237548828125, 0.14556121826171875, 0.1687469482421875, 0.19193267822265625, 0.215118408203125, 0.23830413818359375, 0.2614898681640625, 0.28467559814453125, 0.307861328125, 0.33104705810546875, 0.3542327880859375, 0.37741851806640625, 0.400604248046875, 0.42378997802734375, 0.4469757080078125, 0.47016143798828125, 0.49334716796875, 0.5165328979492188, 0.5397186279296875, 0.5629043579101562, 0.586090087890625, 0.6092758178710938, 0.6324615478515625, 0.6556472778320312, 0.6788330078125, 0.7020187377929688, 0.7252044677734375, 0.7483901977539062, 0.771575927734375, 0.7947616577148438, 0.8179473876953125, 0.8411331176757812, 0.86431884765625, 0.8875045776367188, 0.9106903076171875, 0.9338760375976562, 0.957061767578125, 0.9802474975585938, 1.0034332275390625, 1.0266189575195312, 1.0498046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 11.0, 24.0, 35.0, 34.0, 59.0, 99.0, 101.0, 128.0, 110.0, 74.0, 85.0, 75.0, 60.0, 27.0, 27.0, 13.0, 5.0, 5.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2227377891540527, -2.1516666412353516, -2.0805954933166504, -2.009524345397949, -1.9384530782699585, -1.8673819303512573, -1.7963106632232666, -1.7252395153045654, -1.6541683673858643, -1.583097219467163, -1.512026071548462, -1.4409548044204712, -1.36988365650177, -1.2988125085830688, -1.2277412414550781, -1.156670093536377, -1.0855989456176758, -1.0145277976989746, -0.9434565901756287, -0.8723853826522827, -0.8013142347335815, -0.7302430868148804, -0.6591718792915344, -0.5881006717681885, -0.5170295238494873, -0.44595834612846375, -0.3748871684074402, -0.3038159906864166, -0.23274481296539307, -0.1616736352443695, -0.09060245752334595, -0.019531279802322388, 0.05154013633728027, 0.12261131405830383, 0.1936824917793274, 0.26475366950035095, 0.3358248472213745, 0.40689602494239807, 0.47796720266342163, 0.5490384101867676, 0.6201095581054688, 0.6911807060241699, 0.7622519135475159, 0.8333231210708618, 0.904394268989563, 0.9754654169082642, 1.0465366840362549, 1.117607831954956, 1.1886789798736572, 1.2597501277923584, 1.3308212757110596, 1.4018925428390503, 1.4729636907577515, 1.5440348386764526, 1.6151061058044434, 1.6861772537231445, 1.7572484016418457, 1.8283195495605469, 1.899390697479248, 1.9704619646072388, 2.0415329933166504, 2.1126043796539307, 2.183675527572632, 2.254746675491333, 2.325817823410034]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 5.0, 4.0, 4.0, 14.0, 11.0, 20.0, 30.0, 15.0, 34.0, 28.0, 27.0, 41.0, 28.0, 31.0, 41.0, 38.0, 57.0, 43.0, 48.0, 52.0, 51.0, 45.0, 38.0, 37.0, 35.0, 31.0, 28.0, 27.0, 10.0, 28.0, 16.0, 15.0, 12.0, 12.0, 12.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1532191038131714, -1.1176023483276367, -1.0819854736328125, -1.0463687181472778, -1.0107519626617432, -0.9751352071762085, -0.939518392086029, -0.9039015769958496, -0.8682848215103149, -0.8326680660247803, -0.7970512509346008, -0.7614344358444214, -0.7258176803588867, -0.690200924873352, -0.6545841097831726, -0.6189672946929932, -0.5833505392074585, -0.5477337837219238, -0.5121169686317444, -0.47650018334388733, -0.4408833980560303, -0.4052666127681732, -0.36964982748031616, -0.3340330421924591, -0.29841625690460205, -0.262799471616745, -0.22718268632888794, -0.19156590104103088, -0.15594911575317383, -0.12033233046531677, -0.08471554517745972, -0.04909875988960266, -0.013481855392456055, 0.022134929895401, 0.05775171518325806, 0.09336850047111511, 0.12898528575897217, 0.16460207104682922, 0.20021885633468628, 0.23583564162254333, 0.2714524269104004, 0.30706921219825745, 0.3426859974861145, 0.37830278277397156, 0.4139195680618286, 0.44953635334968567, 0.4851531386375427, 0.5207699537277222, 0.5563867092132568, 0.5920034646987915, 0.627620279788971, 0.6632370948791504, 0.6988538503646851, 0.7344706058502197, 0.7700874209403992, 0.8057042360305786, 0.8413209915161133, 0.876937747001648, 0.9125545620918274, 0.9481713771820068, 0.9837881326675415, 1.0194048881530762, 1.0550217628479004, 1.090638518333435, 1.1262552738189697]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 8.0, 11.0, 22.0, 34.0, 59.0, 77.0, 141.0, 264.0, 422.0, 1003.0, 2364.0, 6556.0, 21185.0, 76918.0, 315318.0, 444586.0, 130164.0, 33150.0, 10014.0, 3458.0, 1428.0, 591.0, 286.0, 185.0, 112.0, 70.0, 37.0, 20.0, 16.0, 9.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3152313232421875, -0.304046630859375, -0.2928619384765625, -0.28167724609375, -0.2704925537109375, -0.259307861328125, -0.2481231689453125, -0.2369384765625, -0.2257537841796875, -0.214569091796875, -0.2033843994140625, -0.19219970703125, -0.1810150146484375, -0.169830322265625, -0.1586456298828125, -0.1474609375, -0.1362762451171875, -0.125091552734375, -0.1139068603515625, -0.10272216796875, -0.0915374755859375, -0.080352783203125, -0.0691680908203125, -0.0579833984375, -0.0467987060546875, -0.035614013671875, -0.0244293212890625, -0.01324462890625, -0.0020599365234375, 0.009124755859375, 0.0203094482421875, 0.031494140625, 0.0426788330078125, 0.053863525390625, 0.0650482177734375, 0.07623291015625, 0.0874176025390625, 0.098602294921875, 0.1097869873046875, 0.1209716796875, 0.1321563720703125, 0.143341064453125, 0.1545257568359375, 0.16571044921875, 0.1768951416015625, 0.188079833984375, 0.1992645263671875, 0.21044921875, 0.2216339111328125, 0.232818603515625, 0.2440032958984375, 0.25518798828125, 0.2663726806640625, 0.277557373046875, 0.2887420654296875, 0.2999267578125, 0.3111114501953125, 0.322296142578125, 0.3334808349609375, 0.34466552734375, 0.3558502197265625, 0.367034912109375, 0.3782196044921875, 0.389404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 9.0, 4.0, 11.0, 18.0, 15.0, 32.0, 22.0, 21.0, 23.0, 38.0, 38.0, 40.0, 44.0, 41.0, 50.0, 52.0, 40.0, 58.0, 58.0, 45.0, 38.0, 37.0, 38.0, 43.0, 32.0, 12.0, 18.0, 23.0, 20.0, 10.0, 13.0, 8.0, 8.0, 5.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74365234375, -0.718353271484375, -0.69305419921875, -0.667755126953125, -0.6424560546875, -0.617156982421875, -0.59185791015625, -0.566558837890625, -0.541259765625, -0.515960693359375, -0.49066162109375, -0.465362548828125, -0.4400634765625, -0.414764404296875, -0.38946533203125, -0.364166259765625, -0.3388671875, -0.313568115234375, -0.28826904296875, -0.262969970703125, -0.2376708984375, -0.212371826171875, -0.18707275390625, -0.161773681640625, -0.136474609375, -0.111175537109375, -0.08587646484375, -0.060577392578125, -0.0352783203125, -0.009979248046875, 0.01531982421875, 0.040618896484375, 0.06591796875, 0.091217041015625, 0.11651611328125, 0.141815185546875, 0.1671142578125, 0.192413330078125, 0.21771240234375, 0.243011474609375, 0.268310546875, 0.293609619140625, 0.31890869140625, 0.344207763671875, 0.3695068359375, 0.394805908203125, 0.42010498046875, 0.445404052734375, 0.470703125, 0.496002197265625, 0.52130126953125, 0.546600341796875, 0.5718994140625, 0.597198486328125, 0.62249755859375, 0.647796630859375, 0.673095703125, 0.698394775390625, 0.72369384765625, 0.748992919921875, 0.7742919921875, 0.799591064453125, 0.82489013671875, 0.850189208984375, 0.87548828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 16.0, 14.0, 10.0, 29.0, 41.0, 66.0, 83.0, 174.0, 248.0, 426.0, 882.0, 1892.0, 4396.0, 11325.0, 31146.0, 100432.0, 315923.0, 377670.0, 137714.0, 41411.0, 14369.0, 5578.0, 2387.0, 1057.0, 506.0, 271.0, 172.0, 97.0, 61.0, 42.0, 31.0, 21.0, 15.0, 9.0, 11.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.25444793701171875, -0.2457122802734375, -0.23697662353515625, -0.228240966796875, -0.21950531005859375, -0.2107696533203125, -0.20203399658203125, -0.19329833984375, -0.18456268310546875, -0.1758270263671875, -0.16709136962890625, -0.158355712890625, -0.14962005615234375, -0.1408843994140625, -0.13214874267578125, -0.1234130859375, -0.11467742919921875, -0.1059417724609375, -0.09720611572265625, -0.088470458984375, -0.07973480224609375, -0.0709991455078125, -0.06226348876953125, -0.05352783203125, -0.04479217529296875, -0.0360565185546875, -0.02732086181640625, -0.018585205078125, -0.00984954833984375, -0.0011138916015625, 0.00762176513671875, 0.016357421875, 0.02509307861328125, 0.0338287353515625, 0.04256439208984375, 0.051300048828125, 0.06003570556640625, 0.0687713623046875, 0.07750701904296875, 0.08624267578125, 0.09497833251953125, 0.1037139892578125, 0.11244964599609375, 0.121185302734375, 0.12992095947265625, 0.1386566162109375, 0.14739227294921875, 0.1561279296875, 0.16486358642578125, 0.1735992431640625, 0.18233489990234375, 0.191070556640625, 0.19980621337890625, 0.2085418701171875, 0.21727752685546875, 0.22601318359375, 0.23474884033203125, 0.2434844970703125, 0.25222015380859375, 0.260955810546875, 0.26969146728515625, 0.2784271240234375, 0.28716278076171875, 0.2958984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 2.0, 6.0, 8.0, 12.0, 11.0, 12.0, 20.0, 13.0, 26.0, 29.0, 19.0, 29.0, 30.0, 33.0, 39.0, 49.0, 40.0, 53.0, 51.0, 55.0, 66.0, 47.0, 48.0, 30.0, 32.0, 48.0, 33.0, 22.0, 31.0, 19.0, 14.0, 17.0, 22.0, 9.0, 5.0, 2.0, 4.0, 7.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7822265625, -1.731658935546875, -1.68109130859375, -1.630523681640625, -1.5799560546875, -1.529388427734375, -1.47882080078125, -1.428253173828125, -1.377685546875, -1.327117919921875, -1.27655029296875, -1.225982666015625, -1.1754150390625, -1.124847412109375, -1.07427978515625, -1.023712158203125, -0.97314453125, -0.922576904296875, -0.87200927734375, -0.821441650390625, -0.7708740234375, -0.720306396484375, -0.66973876953125, -0.619171142578125, -0.568603515625, -0.518035888671875, -0.46746826171875, -0.416900634765625, -0.3663330078125, -0.315765380859375, -0.26519775390625, -0.214630126953125, -0.1640625, -0.113494873046875, -0.06292724609375, -0.012359619140625, 0.0382080078125, 0.088775634765625, 0.13934326171875, 0.189910888671875, 0.240478515625, 0.291046142578125, 0.34161376953125, 0.392181396484375, 0.4427490234375, 0.493316650390625, 0.54388427734375, 0.594451904296875, 0.64501953125, 0.695587158203125, 0.74615478515625, 0.796722412109375, 0.8472900390625, 0.897857666015625, 0.94842529296875, 0.998992919921875, 1.049560546875, 1.100128173828125, 1.15069580078125, 1.201263427734375, 1.2518310546875, 1.302398681640625, 1.35296630859375, 1.403533935546875, 1.4541015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 20.0, 20.0, 40.0, 53.0, 118.0, 170.0, 314.0, 564.0, 1177.0, 2457.0, 6320.0, 21170.0, 82764.0, 331288.0, 431903.0, 124672.0, 30357.0, 8860.0, 3196.0, 1445.0, 644.0, 386.0, 234.0, 143.0, 72.0, 49.0, 16.0, 29.0, 13.0, 13.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11304855346679688, -0.10903167724609375, -0.10501480102539062, -0.1009979248046875, -0.09698104858398438, -0.09296417236328125, -0.08894729614257812, -0.084930419921875, -0.08091354370117188, -0.07689666748046875, -0.07287979125976562, -0.0688629150390625, -0.06484603881835938, -0.06082916259765625, -0.056812286376953125, -0.05279541015625, -0.048778533935546875, -0.04476165771484375, -0.040744781494140625, -0.0367279052734375, -0.032711029052734375, -0.02869415283203125, -0.024677276611328125, -0.020660400390625, -0.016643524169921875, -0.01262664794921875, -0.008609771728515625, -0.0045928955078125, -0.000576019287109375, 0.00344085693359375, 0.007457733154296875, 0.011474609375, 0.015491485595703125, 0.01950836181640625, 0.023525238037109375, 0.0275421142578125, 0.031558990478515625, 0.03557586669921875, 0.039592742919921875, 0.043609619140625, 0.047626495361328125, 0.05164337158203125, 0.055660247802734375, 0.0596771240234375, 0.06369400024414062, 0.06771087646484375, 0.07172775268554688, 0.07574462890625, 0.07976150512695312, 0.08377838134765625, 0.08779525756835938, 0.0918121337890625, 0.09582901000976562, 0.09984588623046875, 0.10386276245117188, 0.107879638671875, 0.11189651489257812, 0.11591339111328125, 0.11993026733398438, 0.1239471435546875, 0.12796401977539062, 0.13198089599609375, 0.13599777221679688, 0.1400146484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 14.0, 22.0, 33.0, 27.0, 68.0, 68.0, 85.0, 91.0, 103.0, 99.0, 94.0, 74.0, 58.0, 36.0, 24.0, 20.0, 14.0, 14.0, 8.0, 10.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.681680679321289e-05, -6.51627779006958e-05, -6.350874900817871e-05, -6.185472011566162e-05, -6.020069122314453e-05, -5.854666233062744e-05, -5.689263343811035e-05, -5.523860454559326e-05, -5.358457565307617e-05, -5.193054676055908e-05, -5.027651786804199e-05, -4.86224889755249e-05, -4.696846008300781e-05, -4.531443119049072e-05, -4.366040229797363e-05, -4.200637340545654e-05, -4.035234451293945e-05, -3.869831562042236e-05, -3.7044286727905273e-05, -3.5390257835388184e-05, -3.3736228942871094e-05, -3.2082200050354004e-05, -3.0428171157836914e-05, -2.8774142265319824e-05, -2.7120113372802734e-05, -2.5466084480285645e-05, -2.3812055587768555e-05, -2.2158026695251465e-05, -2.0503997802734375e-05, -1.8849968910217285e-05, -1.7195940017700195e-05, -1.5541911125183105e-05, -1.3887882232666016e-05, -1.2233853340148926e-05, -1.0579824447631836e-05, -8.925795555114746e-06, -7.271766662597656e-06, -5.617737770080566e-06, -3.9637088775634766e-06, -2.3096799850463867e-06, -6.556510925292969e-07, 9.98377799987793e-07, 2.652406692504883e-06, 4.306435585021973e-06, 5.9604644775390625e-06, 7.614493370056152e-06, 9.268522262573242e-06, 1.0922551155090332e-05, 1.2576580047607422e-05, 1.4230608940124512e-05, 1.58846378326416e-05, 1.753866672515869e-05, 1.919269561767578e-05, 2.084672451019287e-05, 2.250075340270996e-05, 2.415478229522705e-05, 2.580881118774414e-05, 2.746284008026123e-05, 2.911686897277832e-05, 3.077089786529541e-05, 3.24249267578125e-05, 3.407895565032959e-05, 3.573298454284668e-05, 3.738701343536377e-05, 3.904104232788086e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 13.0, 6.0, 15.0, 10.0, 35.0, 47.0, 60.0, 82.0, 154.0, 266.0, 622.0, 1593.0, 5491.0, 26081.0, 177334.0, 634711.0, 169101.0, 24775.0, 5345.0, 1508.0, 626.0, 285.0, 147.0, 79.0, 42.0, 27.0, 29.0, 21.0, 12.0, 9.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2091064453125, -0.20286178588867188, -0.19661712646484375, -0.19037246704101562, -0.1841278076171875, -0.17788314819335938, -0.17163848876953125, -0.16539382934570312, -0.159149169921875, -0.15290451049804688, -0.14665985107421875, -0.14041519165039062, -0.1341705322265625, -0.12792587280273438, -0.12168121337890625, -0.11543655395507812, -0.10919189453125, -0.10294723510742188, -0.09670257568359375, -0.09045791625976562, -0.0842132568359375, -0.07796859741210938, -0.07172393798828125, -0.06547927856445312, -0.059234619140625, -0.052989959716796875, -0.04674530029296875, -0.040500640869140625, -0.0342559814453125, -0.028011322021484375, -0.02176666259765625, -0.015522003173828125, -0.00927734375, -0.003032684326171875, 0.00321197509765625, 0.009456634521484375, 0.0157012939453125, 0.021945953369140625, 0.02819061279296875, 0.034435272216796875, 0.040679931640625, 0.046924591064453125, 0.05316925048828125, 0.059413909912109375, 0.0656585693359375, 0.07190322875976562, 0.07814788818359375, 0.08439254760742188, 0.09063720703125, 0.09688186645507812, 0.10312652587890625, 0.10937118530273438, 0.1156158447265625, 0.12186050415039062, 0.12810516357421875, 0.13434982299804688, 0.140594482421875, 0.14683914184570312, 0.15308380126953125, 0.15932846069335938, 0.1655731201171875, 0.17181777954101562, 0.17806243896484375, 0.18430709838867188, 0.1905517578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 16.0, 25.0, 26.0, 34.0, 42.0, 46.0, 68.0, 106.0, 84.0, 93.0, 85.0, 68.0, 63.0, 49.0, 44.0, 28.0, 18.0, 16.0, 19.0, 12.0, 8.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03863525390625, -0.037210941314697266, -0.03578662872314453, -0.0343623161315918, -0.03293800354003906, -0.03151369094848633, -0.030089378356933594, -0.02866506576538086, -0.027240753173828125, -0.02581644058227539, -0.024392127990722656, -0.022967815399169922, -0.021543502807617188, -0.020119190216064453, -0.01869487762451172, -0.017270565032958984, -0.01584625244140625, -0.014421939849853516, -0.012997627258300781, -0.011573314666748047, -0.010149002075195312, -0.008724689483642578, -0.007300376892089844, -0.005876064300537109, -0.004451751708984375, -0.0030274391174316406, -0.0016031265258789062, -0.00017881393432617188, 0.0012454986572265625, 0.002669811248779297, 0.004094123840332031, 0.005518436431884766, 0.0069427490234375, 0.008367061614990234, 0.009791374206542969, 0.011215686798095703, 0.012639999389648438, 0.014064311981201172, 0.015488624572753906, 0.01691293716430664, 0.018337249755859375, 0.01976156234741211, 0.021185874938964844, 0.022610187530517578, 0.024034500122070312, 0.025458812713623047, 0.02688312530517578, 0.028307437896728516, 0.02973175048828125, 0.031156063079833984, 0.03258037567138672, 0.03400468826293945, 0.03542900085449219, 0.03685331344604492, 0.038277626037597656, 0.03970193862915039, 0.041126251220703125, 0.04255056381225586, 0.043974876403808594, 0.04539918899536133, 0.04682350158691406, 0.0482478141784668, 0.04967212677001953, 0.051096439361572266, 0.052520751953125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 16.0, 19.0, 46.0, 44.0, 80.0, 125.0, 140.0, 155.0, 127.0, 93.0, 57.0, 31.0, 27.0, 15.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.9136167764663696, -1.8592132329940796, -1.8048096895217896, -1.750406265258789, -1.696002721786499, -1.641599178314209, -1.587195634841919, -1.532792091369629, -1.4783885478973389, -1.4239850044250488, -1.3695814609527588, -1.3151779174804688, -1.2607744932174683, -1.2063709497451782, -1.1519674062728882, -1.0975638628005981, -1.0431604385375977, -0.9887568950653076, -0.9343534111976624, -0.8799498677253723, -0.825546383857727, -0.771142840385437, -0.716739296913147, -0.6623357534408569, -0.6079322695732117, -0.5535287261009216, -0.49912524223327637, -0.44472169876098633, -0.3903181850910187, -0.335914671421051, -0.281511127948761, -0.22710761427879333, -0.17270398139953613, -0.11830046027898788, -0.06389693915843964, -0.009493410587310791, 0.04491010308265686, 0.09931361675262451, 0.15371716022491455, 0.2081206738948822, 0.26252418756484985, 0.3169277012348175, 0.37133121490478516, 0.4257347583770752, 0.48013827204704285, 0.5345417857170105, 0.5889453291893005, 0.6433488130569458, 0.6977523565292358, 0.7521559000015259, 0.8065593838691711, 0.8609629273414612, 0.9153664112091064, 0.9697699546813965, 1.0241734981536865, 1.0785770416259766, 1.1329805850982666, 1.1873841285705566, 1.2417876720428467, 1.2961912155151367, 1.3505946397781372, 1.4049981832504272, 1.4594017267227173, 1.5138052701950073, 1.5682086944580078]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 3.0, 6.0, 5.0, 4.0, 8.0, 6.0, 24.0, 19.0, 26.0, 28.0, 26.0, 24.0, 42.0, 36.0, 27.0, 38.0, 42.0, 44.0, 48.0, 45.0, 51.0, 46.0, 49.0, 40.0, 35.0, 39.0, 43.0, 28.0, 24.0, 26.0, 16.0, 14.0, 21.0, 12.0, 11.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6900408267974854, -0.6668879389762878, -0.6437351107597351, -0.6205822229385376, -0.5974293947219849, -0.5742765069007874, -0.5511236190795898, -0.5279707908630371, -0.5048179626464844, -0.48166510462760925, -0.45851224660873413, -0.4353593587875366, -0.4122065305709839, -0.3890536427497864, -0.36590078473091125, -0.34274792671203613, -0.3195950388908386, -0.2964421808719635, -0.2732893228530884, -0.25013643503189087, -0.22698359191417694, -0.20383073389530182, -0.1806778609752655, -0.15752500295639038, -0.13437214493751526, -0.11121928691864014, -0.08806642144918442, -0.0649135559797287, -0.04176069796085358, -0.018607839941978455, 0.004545032978057861, 0.027697890996932983, 0.05085068941116333, 0.07400354743003845, 0.09715641289949417, 0.12030927836894989, 0.143462136387825, 0.16661499440670013, 0.18976786732673645, 0.21292072534561157, 0.2360735833644867, 0.2592264413833618, 0.28237929940223694, 0.30553215742111206, 0.32868504524230957, 0.3518378734588623, 0.3749907612800598, 0.39814361929893494, 0.42129647731781006, 0.4444493353366852, 0.4676021933555603, 0.4907550811767578, 0.5139079093933105, 0.5370607972145081, 0.5602136850357056, 0.5833665132522583, 0.606519341468811, 0.6296722292900085, 0.6528250575065613, 0.6759779453277588, 0.6991307735443115, 0.722283661365509, 0.7454365491867065, 0.7685893774032593, 0.7917422652244568]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 22.0, 11.0, 14.0, 37.0, 58.0, 69.0, 113.0, 190.0, 250.0, 401.0, 650.0, 1077.0, 1981.0, 3666.0, 7669.0, 16575.0, 37859.0, 96839.0, 273034.0, 373937.0, 138502.0, 52737.0, 22162.0, 9997.0, 4762.0, 2435.0, 1358.0, 806.0, 450.0, 290.0, 181.0, 130.0, 86.0, 60.0, 30.0, 29.0, 17.0, 17.0, 12.0, 9.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5104827880859375, -0.494110107421875, -0.4777374267578125, -0.46136474609375, -0.4449920654296875, -0.428619384765625, -0.4122467041015625, -0.3958740234375, -0.3795013427734375, -0.363128662109375, -0.3467559814453125, -0.33038330078125, -0.3140106201171875, -0.297637939453125, -0.2812652587890625, -0.264892578125, -0.2485198974609375, -0.232147216796875, -0.2157745361328125, -0.19940185546875, -0.1830291748046875, -0.166656494140625, -0.1502838134765625, -0.1339111328125, -0.1175384521484375, -0.101165771484375, -0.0847930908203125, -0.06842041015625, -0.0520477294921875, -0.035675048828125, -0.0193023681640625, -0.0029296875, 0.0134429931640625, 0.029815673828125, 0.0461883544921875, 0.06256103515625, 0.0789337158203125, 0.095306396484375, 0.1116790771484375, 0.1280517578125, 0.1444244384765625, 0.160797119140625, 0.1771697998046875, 0.19354248046875, 0.2099151611328125, 0.226287841796875, 0.2426605224609375, 0.259033203125, 0.2754058837890625, 0.291778564453125, 0.3081512451171875, 0.32452392578125, 0.3408966064453125, 0.357269287109375, 0.3736419677734375, 0.3900146484375, 0.4063873291015625, 0.422760009765625, 0.4391326904296875, 0.45550537109375, 0.4718780517578125, 0.488250732421875, 0.5046234130859375, 0.52099609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 4.0, 5.0, 6.0, 12.0, 9.0, 11.0, 11.0, 26.0, 22.0, 31.0, 33.0, 19.0, 31.0, 46.0, 35.0, 40.0, 43.0, 50.0, 57.0, 46.0, 53.0, 54.0, 43.0, 37.0, 41.0, 42.0, 29.0, 32.0, 18.0, 19.0, 11.0, 20.0, 14.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.369140625, -1.3199920654296875, -1.270843505859375, -1.2216949462890625, -1.17254638671875, -1.1233978271484375, -1.074249267578125, -1.0251007080078125, -0.9759521484375, -0.9268035888671875, -0.877655029296875, -0.8285064697265625, -0.77935791015625, -0.7302093505859375, -0.681060791015625, -0.6319122314453125, -0.582763671875, -0.5336151123046875, -0.484466552734375, -0.4353179931640625, -0.38616943359375, -0.3370208740234375, -0.287872314453125, -0.2387237548828125, -0.1895751953125, -0.1404266357421875, -0.091278076171875, -0.0421295166015625, 0.00701904296875, 0.0561676025390625, 0.105316162109375, 0.1544647216796875, 0.20361328125, 0.2527618408203125, 0.301910400390625, 0.3510589599609375, 0.40020751953125, 0.4493560791015625, 0.498504638671875, 0.5476531982421875, 0.5968017578125, 0.6459503173828125, 0.695098876953125, 0.7442474365234375, 0.79339599609375, 0.8425445556640625, 0.891693115234375, 0.9408416748046875, 0.989990234375, 1.0391387939453125, 1.088287353515625, 1.1374359130859375, 1.18658447265625, 1.2357330322265625, 1.284881591796875, 1.3340301513671875, 1.3831787109375, 1.4323272705078125, 1.481475830078125, 1.5306243896484375, 1.57977294921875, 1.6289215087890625, 1.678070068359375, 1.7272186279296875, 1.7763671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 9.0, 3.0, 10.0, 12.0, 10.0, 24.0, 22.0, 37.0, 40.0, 71.0, 107.0, 127.0, 216.0, 375.0, 839.0, 3478.0, 41929.0, 795689.0, 193562.0, 9163.0, 1478.0, 545.0, 273.0, 166.0, 103.0, 80.0, 57.0, 32.0, 26.0, 21.0, 8.0, 13.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9312896728515625, -1.877227783203125, -1.8231658935546875, -1.76910400390625, -1.7150421142578125, -1.660980224609375, -1.6069183349609375, -1.5528564453125, -1.4987945556640625, -1.444732666015625, -1.3906707763671875, -1.33660888671875, -1.2825469970703125, -1.228485107421875, -1.1744232177734375, -1.120361328125, -1.0662994384765625, -1.012237548828125, -0.9581756591796875, -0.90411376953125, -0.8500518798828125, -0.795989990234375, -0.7419281005859375, -0.6878662109375, -0.6338043212890625, -0.579742431640625, -0.5256805419921875, -0.47161865234375, -0.4175567626953125, -0.363494873046875, -0.3094329833984375, -0.25537109375, -0.2013092041015625, -0.147247314453125, -0.0931854248046875, -0.03912353515625, 0.0149383544921875, 0.069000244140625, 0.1230621337890625, 0.1771240234375, 0.2311859130859375, 0.285247802734375, 0.3393096923828125, 0.39337158203125, 0.4474334716796875, 0.501495361328125, 0.5555572509765625, 0.609619140625, 0.6636810302734375, 0.717742919921875, 0.7718048095703125, 0.82586669921875, 0.8799285888671875, 0.933990478515625, 0.9880523681640625, 1.0421142578125, 1.0961761474609375, 1.150238037109375, 1.2042999267578125, 1.25836181640625, 1.3124237060546875, 1.366485595703125, 1.4205474853515625, 1.474609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 10.0, 9.0, 7.0, 13.0, 12.0, 12.0, 15.0, 21.0, 23.0, 20.0, 29.0, 42.0, 35.0, 37.0, 43.0, 43.0, 34.0, 37.0, 30.0, 50.0, 44.0, 39.0, 36.0, 35.0, 33.0, 21.0, 27.0, 33.0, 37.0, 19.0, 17.0, 12.0, 17.0, 5.0, 19.0, 6.0, 13.0, 8.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.701171875, -1.6514739990234375, -1.601776123046875, -1.5520782470703125, -1.50238037109375, -1.4526824951171875, -1.402984619140625, -1.3532867431640625, -1.3035888671875, -1.2538909912109375, -1.204193115234375, -1.1544952392578125, -1.10479736328125, -1.0550994873046875, -1.005401611328125, -0.9557037353515625, -0.906005859375, -0.8563079833984375, -0.806610107421875, -0.7569122314453125, -0.70721435546875, -0.6575164794921875, -0.607818603515625, -0.5581207275390625, -0.5084228515625, -0.4587249755859375, -0.409027099609375, -0.3593292236328125, -0.30963134765625, -0.2599334716796875, -0.210235595703125, -0.1605377197265625, -0.11083984375, -0.0611419677734375, -0.011444091796875, 0.0382537841796875, 0.08795166015625, 0.1376495361328125, 0.187347412109375, 0.2370452880859375, 0.2867431640625, 0.3364410400390625, 0.386138916015625, 0.4358367919921875, 0.48553466796875, 0.5352325439453125, 0.584930419921875, 0.6346282958984375, 0.684326171875, 0.7340240478515625, 0.783721923828125, 0.8334197998046875, 0.88311767578125, 0.9328155517578125, 0.982513427734375, 1.0322113037109375, 1.0819091796875, 1.1316070556640625, 1.181304931640625, 1.2310028076171875, 1.28070068359375, 1.3303985595703125, 1.380096435546875, 1.4297943115234375, 1.4794921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 22.0, 44.0, 84.0, 209.0, 1260.0, 119956.0, 923073.0, 3244.0, 401.0, 122.0, 53.0, 26.0, 13.0, 8.0, 6.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2867584228515625, -1.237579345703125, -1.1884002685546875, -1.13922119140625, -1.0900421142578125, -1.040863037109375, -0.9916839599609375, -0.9425048828125, -0.8933258056640625, -0.844146728515625, -0.7949676513671875, -0.74578857421875, -0.6966094970703125, -0.647430419921875, -0.5982513427734375, -0.549072265625, -0.4998931884765625, -0.450714111328125, -0.4015350341796875, -0.35235595703125, -0.3031768798828125, -0.253997802734375, -0.2048187255859375, -0.1556396484375, -0.1064605712890625, -0.057281494140625, -0.0081024169921875, 0.04107666015625, 0.0902557373046875, 0.139434814453125, 0.1886138916015625, 0.23779296875, 0.2869720458984375, 0.336151123046875, 0.3853302001953125, 0.43450927734375, 0.4836883544921875, 0.532867431640625, 0.5820465087890625, 0.6312255859375, 0.6804046630859375, 0.729583740234375, 0.7787628173828125, 0.82794189453125, 0.8771209716796875, 0.926300048828125, 0.9754791259765625, 1.024658203125, 1.0738372802734375, 1.123016357421875, 1.1721954345703125, 1.22137451171875, 1.2705535888671875, 1.319732666015625, 1.3689117431640625, 1.4180908203125, 1.4672698974609375, 1.516448974609375, 1.5656280517578125, 1.61480712890625, 1.6639862060546875, 1.713165283203125, 1.7623443603515625, 1.8115234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 7.0, 5.0, 10.0, 14.0, 20.0, 39.0, 58.0, 107.0, 143.0, 166.0, 141.0, 110.0, 61.0, 45.0, 19.0, 20.0, 13.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010859966278076172, -0.0001061074435710907, -0.00010361522436141968, -0.00010112300515174866, -9.863078594207764e-05, -9.613856673240662e-05, -9.36463475227356e-05, -9.115412831306458e-05, -8.866190910339355e-05, -8.616968989372253e-05, -8.367747068405151e-05, -8.118525147438049e-05, -7.869303226470947e-05, -7.620081305503845e-05, -7.370859384536743e-05, -7.121637463569641e-05, -6.872415542602539e-05, -6.623193621635437e-05, -6.373971700668335e-05, -6.124749779701233e-05, -5.875527858734131e-05, -5.626305937767029e-05, -5.377084016799927e-05, -5.127862095832825e-05, -4.8786401748657227e-05, -4.6294182538986206e-05, -4.3801963329315186e-05, -4.1309744119644165e-05, -3.8817524909973145e-05, -3.6325305700302124e-05, -3.3833086490631104e-05, -3.134086728096008e-05, -2.8848648071289062e-05, -2.6356428861618042e-05, -2.386420965194702e-05, -2.1371990442276e-05, -1.887977123260498e-05, -1.638755202293396e-05, -1.389533281326294e-05, -1.1403113603591919e-05, -8.910894393920898e-06, -6.418675184249878e-06, -3.926455974578857e-06, -1.434236764907837e-06, 1.0579824447631836e-06, 3.550201654434204e-06, 6.042420864105225e-06, 8.534640073776245e-06, 1.1026859283447266e-05, 1.3519078493118286e-05, 1.6011297702789307e-05, 1.8503516912460327e-05, 2.0995736122131348e-05, 2.3487955331802368e-05, 2.598017454147339e-05, 2.847239375114441e-05, 3.096461296081543e-05, 3.345683217048645e-05, 3.594905138015747e-05, 3.844127058982849e-05, 4.093348979949951e-05, 4.342570900917053e-05, 4.591792821884155e-05, 4.841014742851257e-05, 5.0902366638183594e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 8.0, 9.0, 12.0, 19.0, 24.0, 56.0, 88.0, 219.0, 772.0, 4735.0, 702743.0, 335381.0, 3555.0, 583.0, 168.0, 74.0, 32.0, 22.0, 20.0, 12.0, 10.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.8418731689453125, -1.798980712890625, -1.7560882568359375, -1.71319580078125, -1.6703033447265625, -1.627410888671875, -1.5845184326171875, -1.5416259765625, -1.4987335205078125, -1.455841064453125, -1.4129486083984375, -1.37005615234375, -1.3271636962890625, -1.284271240234375, -1.2413787841796875, -1.198486328125, -1.1555938720703125, -1.112701416015625, -1.0698089599609375, -1.02691650390625, -0.9840240478515625, -0.941131591796875, -0.8982391357421875, -0.8553466796875, -0.8124542236328125, -0.769561767578125, -0.7266693115234375, -0.68377685546875, -0.6408843994140625, -0.597991943359375, -0.5550994873046875, -0.51220703125, -0.4693145751953125, -0.426422119140625, -0.3835296630859375, -0.34063720703125, -0.2977447509765625, -0.254852294921875, -0.2119598388671875, -0.1690673828125, -0.1261749267578125, -0.083282470703125, -0.0403900146484375, 0.00250244140625, 0.0453948974609375, 0.088287353515625, 0.1311798095703125, 0.174072265625, 0.2169647216796875, 0.259857177734375, 0.3027496337890625, 0.34564208984375, 0.3885345458984375, 0.431427001953125, 0.4743194580078125, 0.5172119140625, 0.5601043701171875, 0.602996826171875, 0.6458892822265625, 0.68878173828125, 0.7316741943359375, 0.774566650390625, 0.8174591064453125, 0.8603515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 6.0, 15.0, 20.0, 54.0, 69.0, 124.0, 163.0, 187.0, 127.0, 76.0, 53.0, 36.0, 20.0, 10.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25634765625, -0.24568557739257812, -0.23502349853515625, -0.22436141967773438, -0.2136993408203125, -0.20303726196289062, -0.19237518310546875, -0.18171310424804688, -0.171051025390625, -0.16038894653320312, -0.14972686767578125, -0.13906478881835938, -0.1284027099609375, -0.11774063110351562, -0.10707855224609375, -0.09641647338867188, -0.08575439453125, -0.07509231567382812, -0.06443023681640625, -0.053768157958984375, -0.0431060791015625, -0.032444000244140625, -0.02178192138671875, -0.011119842529296875, -0.000457763671875, 0.010204315185546875, 0.02086639404296875, 0.031528472900390625, 0.0421905517578125, 0.052852630615234375, 0.06351470947265625, 0.07417678833007812, 0.0848388671875, 0.09550094604492188, 0.10616302490234375, 0.11682510375976562, 0.1274871826171875, 0.13814926147460938, 0.14881134033203125, 0.15947341918945312, 0.170135498046875, 0.18079757690429688, 0.19145965576171875, 0.20212173461914062, 0.2127838134765625, 0.22344589233398438, 0.23410797119140625, 0.24477005004882812, 0.25543212890625, 0.2660942077636719, 0.27675628662109375, 0.2874183654785156, 0.2980804443359375, 0.3087425231933594, 0.31940460205078125, 0.3300666809082031, 0.340728759765625, 0.3513908386230469, 0.36205291748046875, 0.3727149963378906, 0.3833770751953125, 0.3940391540527344, 0.40470123291015625, 0.4153633117675781, 0.426025390625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 40.0, 60.0, 105.0, 170.0, 201.0, 169.0, 100.0, 68.0, 34.0, 16.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.5707292556762695, -6.426671028137207, -6.2826128005981445, -6.13855504989624, -5.994496822357178, -5.850438594818115, -5.706380367279053, -5.56232213973999, -5.418264389038086, -5.274206161499023, -5.130147933959961, -4.986090183258057, -4.842031955718994, -4.697973728179932, -4.553915500640869, -4.409857273101807, -4.265799045562744, -4.121740818023682, -3.9776828289031982, -3.8336246013641357, -3.6895666122436523, -3.54550838470459, -3.4014501571655273, -3.257391929626465, -3.1133339405059814, -2.969275712966919, -2.8252177238464355, -2.681159496307373, -2.5371012687683105, -2.393043279647827, -2.2489850521087646, -2.1049270629882812, -1.9608688354492188, -1.8168107271194458, -1.6727526187896729, -1.5286943912506104, -1.3846362829208374, -1.2405781745910645, -1.096519947052002, -0.952461838722229, -0.808403730392456, -0.6643456220626831, -0.5202874541282654, -0.37622931599617004, -0.2321711778640747, -0.08811306953430176, 0.05594509840011597, 0.2000032663345337, 0.34406137466430664, 0.488119512796402, 0.6321776509284973, 0.776235818862915, 0.920293927192688, 1.064352035522461, 1.2084102630615234, 1.3524683713912964, 1.4965264797210693, 1.6405845880508423, 1.7846426963806152, 1.9287009239196777, 2.0727591514587402, 2.2168171405792236, 2.360875368118286, 2.5049333572387695, 2.648991584777832]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 0.0, 5.0, 6.0, 6.0, 12.0, 10.0, 11.0, 18.0, 24.0, 16.0, 26.0, 22.0, 19.0, 21.0, 40.0, 40.0, 34.0, 49.0, 35.0, 36.0, 28.0, 42.0, 40.0, 20.0, 45.0, 34.0, 51.0, 41.0, 34.0, 28.0, 28.0, 27.0, 32.0, 23.0, 12.0, 12.0, 16.0, 17.0, 8.0, 2.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7254226207733154, -2.6395819187164307, -2.553741216659546, -2.467900514602661, -2.3820598125457764, -2.2962191104888916, -2.210378646850586, -2.124537944793701, -2.0386972427368164, -1.9528565406799316, -1.8670158386230469, -1.781175136566162, -1.6953344345092773, -1.6094937324523926, -1.5236531496047974, -1.4378124475479126, -1.3519716262817383, -1.2661309242248535, -1.1802902221679688, -1.094449520111084, -1.0086088180541992, -0.9227681756019592, -0.8369275331497192, -0.7510868310928345, -0.6652461290359497, -0.5794054269790649, -0.49356475472450256, -0.4077240824699402, -0.3218833804130554, -0.23604267835617065, -0.15020203590393066, -0.0643613338470459, 0.021479368209838867, 0.10732005536556244, 0.193160742521286, 0.2790014147758484, 0.36484211683273315, 0.4506828188896179, 0.5365234613418579, 0.6223641633987427, 0.7082048654556274, 0.7940455675125122, 0.879886269569397, 0.965726912021637, 1.051567554473877, 1.1374082565307617, 1.2232489585876465, 1.3090896606445312, 1.394930362701416, 1.4807710647583008, 1.5666117668151855, 1.6524524688720703, 1.738293170928955, 1.8241338729858398, 1.909974455833435, 1.9958151578903198, 2.081655979156494, 2.167496681213379, 2.2533373832702637, 2.3391780853271484, 2.425018787384033, 2.510859489440918, 2.5967001914978027, 2.6825408935546875, 2.768381357192993]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 17.0, 8.0, 8.0, 19.0, 26.0, 29.0, 27.0, 56.0, 65.0, 104.0, 166.0, 252.0, 403.0, 743.0, 1316.0, 2641.0, 5989.0, 16103.0, 56159.0, 270214.0, 1298996.0, 1871141.0, 525483.0, 102917.0, 25506.0, 8461.0, 3402.0, 1620.0, 889.0, 515.0, 325.0, 213.0, 118.0, 110.0, 71.0, 45.0, 36.0, 24.0, 17.0, 8.0, 15.0, 0.0, 7.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.201171875, -1.1649932861328125, -1.128814697265625, -1.0926361083984375, -1.05645751953125, -1.0202789306640625, -0.984100341796875, -0.9479217529296875, -0.9117431640625, -0.8755645751953125, -0.839385986328125, -0.8032073974609375, -0.76702880859375, -0.7308502197265625, -0.694671630859375, -0.6584930419921875, -0.622314453125, -0.5861358642578125, -0.549957275390625, -0.5137786865234375, -0.47760009765625, -0.4414215087890625, -0.405242919921875, -0.3690643310546875, -0.3328857421875, -0.2967071533203125, -0.260528564453125, -0.2243499755859375, -0.18817138671875, -0.1519927978515625, -0.115814208984375, -0.0796356201171875, -0.04345703125, -0.0072784423828125, 0.028900146484375, 0.0650787353515625, 0.10125732421875, 0.1374359130859375, 0.173614501953125, 0.2097930908203125, 0.2459716796875, 0.2821502685546875, 0.318328857421875, 0.3545074462890625, 0.39068603515625, 0.4268646240234375, 0.463043212890625, 0.4992218017578125, 0.535400390625, 0.5715789794921875, 0.607757568359375, 0.6439361572265625, 0.68011474609375, 0.7162933349609375, 0.752471923828125, 0.7886505126953125, 0.8248291015625, 0.8610076904296875, 0.897186279296875, 0.9333648681640625, 0.96954345703125, 1.0057220458984375, 1.041900634765625, 1.0780792236328125, 1.1142578125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 12.0, 8.0, 17.0, 25.0, 21.0, 22.0, 25.0, 43.0, 46.0, 48.0, 60.0, 45.0, 60.0, 54.0, 54.0, 61.0, 56.0, 44.0, 50.0, 45.0, 40.0, 39.0, 32.0, 11.0, 13.0, 19.0, 10.0, 6.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8827056884765625, -0.845489501953125, -0.8082733154296875, -0.77105712890625, -0.7338409423828125, -0.696624755859375, -0.6594085693359375, -0.6221923828125, -0.5849761962890625, -0.547760009765625, -0.5105438232421875, -0.47332763671875, -0.4361114501953125, -0.398895263671875, -0.3616790771484375, -0.324462890625, -0.2872467041015625, -0.250030517578125, -0.2128143310546875, -0.17559814453125, -0.1383819580078125, -0.101165771484375, -0.0639495849609375, -0.0267333984375, 0.0104827880859375, 0.047698974609375, 0.0849151611328125, 0.12213134765625, 0.1593475341796875, 0.196563720703125, 0.2337799072265625, 0.27099609375, 0.3082122802734375, 0.345428466796875, 0.3826446533203125, 0.41986083984375, 0.4570770263671875, 0.494293212890625, 0.5315093994140625, 0.5687255859375, 0.6059417724609375, 0.643157958984375, 0.6803741455078125, 0.71759033203125, 0.7548065185546875, 0.792022705078125, 0.8292388916015625, 0.866455078125, 0.9036712646484375, 0.940887451171875, 0.9781036376953125, 1.01531982421875, 1.0525360107421875, 1.089752197265625, 1.1269683837890625, 1.1641845703125, 1.2014007568359375, 1.238616943359375, 1.2758331298828125, 1.31304931640625, 1.3502655029296875, 1.387481689453125, 1.4246978759765625, 1.4619140625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 15.0, 27.0, 32.0, 50.0, 108.0, 171.0, 340.0, 713.0, 1875.0, 7454.0, 82703.0, 3764510.0, 316663.0, 14816.0, 2857.0, 937.0, 441.0, 195.0, 128.0, 85.0, 45.0, 22.0, 21.0, 9.0, 13.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.753570556640625, -2.65753173828125, -2.561492919921875, -2.4654541015625, -2.369415283203125, -2.27337646484375, -2.177337646484375, -2.081298828125, -1.985260009765625, -1.88922119140625, -1.793182373046875, -1.6971435546875, -1.601104736328125, -1.50506591796875, -1.409027099609375, -1.31298828125, -1.216949462890625, -1.12091064453125, -1.024871826171875, -0.9288330078125, -0.832794189453125, -0.73675537109375, -0.640716552734375, -0.544677734375, -0.448638916015625, -0.35260009765625, -0.256561279296875, -0.1605224609375, -0.064483642578125, 0.03155517578125, 0.127593994140625, 0.2236328125, 0.319671630859375, 0.41571044921875, 0.511749267578125, 0.6077880859375, 0.703826904296875, 0.79986572265625, 0.895904541015625, 0.991943359375, 1.087982177734375, 1.18402099609375, 1.280059814453125, 1.3760986328125, 1.472137451171875, 1.56817626953125, 1.664215087890625, 1.76025390625, 1.856292724609375, 1.95233154296875, 2.048370361328125, 2.1444091796875, 2.240447998046875, 2.33648681640625, 2.432525634765625, 2.528564453125, 2.624603271484375, 2.72064208984375, 2.816680908203125, 2.9127197265625, 3.008758544921875, 3.10479736328125, 3.200836181640625, 3.296875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 9.0, 6.0, 14.0, 21.0, 24.0, 41.0, 64.0, 104.0, 164.0, 300.0, 550.0, 782.0, 770.0, 509.0, 304.0, 168.0, 97.0, 37.0, 37.0, 25.0, 17.0, 6.0, 7.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5859603881835938, -0.5649871826171875, -0.5440139770507812, -0.523040771484375, -0.5020675659179688, -0.4810943603515625, -0.46012115478515625, -0.43914794921875, -0.41817474365234375, -0.3972015380859375, -0.37622833251953125, -0.355255126953125, -0.33428192138671875, -0.3133087158203125, -0.29233551025390625, -0.2713623046875, -0.25038909912109375, -0.2294158935546875, -0.20844268798828125, -0.187469482421875, -0.16649627685546875, -0.1455230712890625, -0.12454986572265625, -0.10357666015625, -0.08260345458984375, -0.0616302490234375, -0.04065704345703125, -0.019683837890625, 0.00128936767578125, 0.0222625732421875, 0.04323577880859375, 0.064208984375, 0.08518218994140625, 0.1061553955078125, 0.12712860107421875, 0.148101806640625, 0.16907501220703125, 0.1900482177734375, 0.21102142333984375, 0.23199462890625, 0.25296783447265625, 0.2739410400390625, 0.29491424560546875, 0.315887451171875, 0.33686065673828125, 0.3578338623046875, 0.37880706787109375, 0.3997802734375, 0.42075347900390625, 0.4417266845703125, 0.46269989013671875, 0.483673095703125, 0.5046463012695312, 0.5256195068359375, 0.5465927124023438, 0.56756591796875, 0.5885391235351562, 0.6095123291015625, 0.6304855346679688, 0.651458740234375, 0.6724319458007812, 0.6934051513671875, 0.7143783569335938, 0.7353515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 7.0, 29.0, 36.0, 62.0, 84.0, 101.0, 138.0, 134.0, 123.0, 100.0, 74.0, 41.0, 25.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4242005348205566, -2.33559513092041, -2.2469897270202637, -2.158384323120117, -2.0697786808013916, -1.9811732769012451, -1.8925678730010986, -1.8039624691009521, -1.7153569459915161, -1.6267515420913696, -1.5381460189819336, -1.449540615081787, -1.3609352111816406, -1.2723296880722046, -1.183724284172058, -1.095118761062622, -1.0065133571624756, -0.9179078936576843, -0.8293024301528931, -0.7406970262527466, -0.6520915627479553, -0.5634860992431641, -0.4748806953430176, -0.3862752318382263, -0.29766976833343506, -0.209064319729805, -0.12045887112617493, -0.031853437423706055, 0.056752026081085205, 0.14535748958587646, 0.23396289348602295, 0.3225683569908142, 0.41117382049560547, 0.49977928400039673, 0.588384747505188, 0.6769901514053345, 0.7655956149101257, 0.854201078414917, 0.9428064823150635, 1.03141188621521, 1.120017409324646, 1.2086228132247925, 1.2972283363342285, 1.385833740234375, 1.4744391441345215, 1.5630446672439575, 1.651650071144104, 1.74025559425354, 1.8288609981536865, 1.917466402053833, 2.0060718059539795, 2.094677448272705, 2.1832828521728516, 2.271888256072998, 2.3604936599731445, 2.449099063873291, 2.5377044677734375, 2.626309871673584, 2.7149152755737305, 2.803520679473877, 2.8921263217926025, 2.980731725692749, 3.0693371295928955, 3.157942533493042, 3.2465481758117676]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 11.0, 13.0, 20.0, 16.0, 27.0, 27.0, 18.0, 20.0, 34.0, 39.0, 42.0, 31.0, 35.0, 40.0, 46.0, 31.0, 39.0, 39.0, 35.0, 35.0, 50.0, 34.0, 48.0, 41.0, 36.0, 23.0, 24.0, 23.0, 29.0, 13.0, 15.0, 13.0, 4.0, 8.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0734831094741821, -1.0392005443572998, -1.0049179792404175, -0.9706354737281799, -0.9363529086112976, -0.9020703434944153, -0.8677878379821777, -0.8335052728652954, -0.7992227077484131, -0.7649401426315308, -0.7306575775146484, -0.6963750720024109, -0.6620925068855286, -0.6278099417686462, -0.5935274362564087, -0.5592448711395264, -0.524962306022644, -0.4906797409057617, -0.4563972055912018, -0.42211467027664185, -0.3878321051597595, -0.3535495400428772, -0.31926700472831726, -0.2849844694137573, -0.250701904296875, -0.21641935408115387, -0.18213680386543274, -0.1478542536497116, -0.11357170343399048, -0.07928915321826935, -0.04500660300254822, -0.010724052786827087, 0.023558378219604492, 0.05784092843532562, 0.09212347865104675, 0.12640602886676788, 0.160688579082489, 0.19497112929821014, 0.22925367951393127, 0.2635362148284912, 0.29781877994537354, 0.33210134506225586, 0.3663838803768158, 0.40066641569137573, 0.43494898080825806, 0.4692315459251404, 0.5035140514373779, 0.5377966165542603, 0.5720791816711426, 0.6063617467880249, 0.6406443119049072, 0.6749268174171448, 0.7092093825340271, 0.7434919476509094, 0.777774453163147, 0.8120570182800293, 0.8463395833969116, 0.880622148513794, 0.9149047136306763, 0.9491872191429138, 0.9834697842597961, 1.0177522897720337, 1.052034854888916, 1.0863174200057983, 1.1205999851226807]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 11.0, 14.0, 17.0, 29.0, 66.0, 101.0, 165.0, 235.0, 463.0, 841.0, 1497.0, 3073.0, 6903.0, 17291.0, 61097.0, 286285.0, 487876.0, 131387.0, 31189.0, 10664.0, 4571.0, 2180.0, 1121.0, 598.0, 319.0, 218.0, 115.0, 86.0, 49.0, 26.0, 18.0, 8.0, 13.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51513671875, -0.5013084411621094, -0.48748016357421875, -0.4736518859863281, -0.4598236083984375, -0.4459953308105469, -0.43216705322265625, -0.4183387756347656, -0.404510498046875, -0.3906822204589844, -0.37685394287109375, -0.3630256652832031, -0.3491973876953125, -0.3353691101074219, -0.32154083251953125, -0.3077125549316406, -0.29388427734375, -0.2800559997558594, -0.26622772216796875, -0.2523994445800781, -0.2385711669921875, -0.22474288940429688, -0.21091461181640625, -0.19708633422851562, -0.183258056640625, -0.16942977905273438, -0.15560150146484375, -0.14177322387695312, -0.1279449462890625, -0.11411666870117188, -0.10028839111328125, -0.08646011352539062, -0.0726318359375, -0.058803558349609375, -0.04497528076171875, -0.031147003173828125, -0.0173187255859375, -0.003490447998046875, 0.01033782958984375, 0.024166107177734375, 0.037994384765625, 0.051822662353515625, 0.06565093994140625, 0.07947921752929688, 0.0933074951171875, 0.10713577270507812, 0.12096405029296875, 0.13479232788085938, 0.14862060546875, 0.16244888305664062, 0.17627716064453125, 0.19010543823242188, 0.2039337158203125, 0.21776199340820312, 0.23159027099609375, 0.24541854858398438, 0.259246826171875, 0.2730751037597656, 0.28690338134765625, 0.3007316589355469, 0.3145599365234375, 0.3283882141113281, 0.34221649169921875, 0.3560447692871094, 0.369873046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 12.0, 9.0, 7.0, 11.0, 23.0, 28.0, 25.0, 33.0, 38.0, 47.0, 36.0, 44.0, 60.0, 51.0, 43.0, 44.0, 40.0, 54.0, 51.0, 59.0, 55.0, 48.0, 39.0, 30.0, 26.0, 26.0, 14.0, 13.0, 10.0, 10.0, 3.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.78265380859375, -0.7552490234375, -0.72784423828125, -0.700439453125, -0.67303466796875, -0.6456298828125, -0.61822509765625, -0.5908203125, -0.56341552734375, -0.5360107421875, -0.50860595703125, -0.481201171875, -0.45379638671875, -0.4263916015625, -0.39898681640625, -0.37158203125, -0.34417724609375, -0.3167724609375, -0.28936767578125, -0.261962890625, -0.23455810546875, -0.2071533203125, -0.17974853515625, -0.15234375, -0.12493896484375, -0.0975341796875, -0.07012939453125, -0.042724609375, -0.01531982421875, 0.0120849609375, 0.03948974609375, 0.06689453125, 0.09429931640625, 0.1217041015625, 0.14910888671875, 0.176513671875, 0.20391845703125, 0.2313232421875, 0.25872802734375, 0.2861328125, 0.31353759765625, 0.3409423828125, 0.36834716796875, 0.395751953125, 0.42315673828125, 0.4505615234375, 0.47796630859375, 0.50537109375, 0.53277587890625, 0.5601806640625, 0.58758544921875, 0.614990234375, 0.64239501953125, 0.6697998046875, 0.69720458984375, 0.724609375, 0.75201416015625, 0.7794189453125, 0.80682373046875, 0.834228515625, 0.86163330078125, 0.8890380859375, 0.91644287109375, 0.94384765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 11.0, 16.0, 24.0, 38.0, 54.0, 92.0, 119.0, 171.0, 250.0, 406.0, 658.0, 1112.0, 2173.0, 4531.0, 12902.0, 72985.0, 587100.0, 316645.0, 33425.0, 8131.0, 3408.0, 1691.0, 900.0, 604.0, 351.0, 246.0, 154.0, 95.0, 78.0, 37.0, 37.0, 23.0, 15.0, 15.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.53125, -0.513427734375, -0.49560546875, -0.477783203125, -0.4599609375, -0.442138671875, -0.42431640625, -0.406494140625, -0.388671875, -0.370849609375, -0.35302734375, -0.335205078125, -0.3173828125, -0.299560546875, -0.28173828125, -0.263916015625, -0.24609375, -0.228271484375, -0.21044921875, -0.192626953125, -0.1748046875, -0.156982421875, -0.13916015625, -0.121337890625, -0.103515625, -0.085693359375, -0.06787109375, -0.050048828125, -0.0322265625, -0.014404296875, 0.00341796875, 0.021240234375, 0.0390625, 0.056884765625, 0.07470703125, 0.092529296875, 0.1103515625, 0.128173828125, 0.14599609375, 0.163818359375, 0.181640625, 0.199462890625, 0.21728515625, 0.235107421875, 0.2529296875, 0.270751953125, 0.28857421875, 0.306396484375, 0.32421875, 0.342041015625, 0.35986328125, 0.377685546875, 0.3955078125, 0.413330078125, 0.43115234375, 0.448974609375, 0.466796875, 0.484619140625, 0.50244140625, 0.520263671875, 0.5380859375, 0.555908203125, 0.57373046875, 0.591552734375, 0.609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 2.0, 7.0, 11.0, 14.0, 25.0, 20.0, 27.0, 21.0, 34.0, 31.0, 38.0, 41.0, 55.0, 60.0, 44.0, 47.0, 61.0, 52.0, 47.0, 48.0, 49.0, 30.0, 29.0, 54.0, 28.0, 27.0, 18.0, 16.0, 9.0, 8.0, 6.0, 10.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5363922119140625, -1.482940673828125, -1.4294891357421875, -1.37603759765625, -1.3225860595703125, -1.269134521484375, -1.2156829833984375, -1.1622314453125, -1.1087799072265625, -1.055328369140625, -1.0018768310546875, -0.94842529296875, -0.8949737548828125, -0.841522216796875, -0.7880706787109375, -0.734619140625, -0.6811676025390625, -0.627716064453125, -0.5742645263671875, -0.52081298828125, -0.4673614501953125, -0.413909912109375, -0.3604583740234375, -0.3070068359375, -0.2535552978515625, -0.200103759765625, -0.1466522216796875, -0.09320068359375, -0.0397491455078125, 0.013702392578125, 0.0671539306640625, 0.12060546875, 0.1740570068359375, 0.227508544921875, 0.2809600830078125, 0.33441162109375, 0.3878631591796875, 0.441314697265625, 0.4947662353515625, 0.5482177734375, 0.6016693115234375, 0.655120849609375, 0.7085723876953125, 0.76202392578125, 0.8154754638671875, 0.868927001953125, 0.9223785400390625, 0.975830078125, 1.0292816162109375, 1.082733154296875, 1.1361846923828125, 1.18963623046875, 1.2430877685546875, 1.296539306640625, 1.3499908447265625, 1.4034423828125, 1.4568939208984375, 1.510345458984375, 1.5637969970703125, 1.61724853515625, 1.6707000732421875, 1.724151611328125, 1.7776031494140625, 1.8310546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 10.0, 17.0, 18.0, 18.0, 36.0, 64.0, 84.0, 138.0, 229.0, 416.0, 705.0, 1348.0, 2461.0, 5103.0, 10859.0, 26338.0, 88487.0, 437763.0, 360720.0, 71263.0, 22954.0, 9793.0, 4600.0, 2270.0, 1205.0, 697.0, 353.0, 242.0, 130.0, 84.0, 54.0, 27.0, 19.0, 16.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14468765258789062, -0.13910675048828125, -0.13352584838867188, -0.1279449462890625, -0.12236404418945312, -0.11678314208984375, -0.11120223999023438, -0.105621337890625, -0.10004043579101562, -0.09445953369140625, -0.08887863159179688, -0.0832977294921875, -0.07771682739257812, -0.07213592529296875, -0.06655502319335938, -0.06097412109375, -0.055393218994140625, -0.04981231689453125, -0.044231414794921875, -0.0386505126953125, -0.033069610595703125, -0.02748870849609375, -0.021907806396484375, -0.016326904296875, -0.010746002197265625, -0.00516510009765625, 0.000415802001953125, 0.0059967041015625, 0.011577606201171875, 0.01715850830078125, 0.022739410400390625, 0.0283203125, 0.033901214599609375, 0.03948211669921875, 0.045063018798828125, 0.0506439208984375, 0.056224822998046875, 0.06180572509765625, 0.06738662719726562, 0.072967529296875, 0.07854843139648438, 0.08412933349609375, 0.08971023559570312, 0.0952911376953125, 0.10087203979492188, 0.10645294189453125, 0.11203384399414062, 0.11761474609375, 0.12319564819335938, 0.12877655029296875, 0.13435745239257812, 0.1399383544921875, 0.14551925659179688, 0.15110015869140625, 0.15668106079101562, 0.162261962890625, 0.16784286499023438, 0.17342376708984375, 0.17900466918945312, 0.1845855712890625, 0.19016647338867188, 0.19574737548828125, 0.20132827758789062, 0.2069091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 13.0, 41.0, 99.0, 183.0, 315.0, 171.0, 83.0, 26.0, 19.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001766681671142578, -0.00017168372869491577, -0.00016669929027557373, -0.0001617148518562317, -0.00015673041343688965, -0.0001517459750175476, -0.00014676153659820557, -0.00014177709817886353, -0.00013679265975952148, -0.00013180822134017944, -0.0001268237829208374, -0.00012183934450149536, -0.00011685490608215332, -0.00011187046766281128, -0.00010688602924346924, -0.0001019015908241272, -9.691715240478516e-05, -9.193271398544312e-05, -8.694827556610107e-05, -8.196383714675903e-05, -7.697939872741699e-05, -7.199496030807495e-05, -6.701052188873291e-05, -6.202608346939087e-05, -5.704164505004883e-05, -5.205720663070679e-05, -4.7072768211364746e-05, -4.2088329792022705e-05, -3.7103891372680664e-05, -3.211945295333862e-05, -2.7135014533996582e-05, -2.215057611465454e-05, -1.71661376953125e-05, -1.2181699275970459e-05, -7.197260856628418e-06, -2.212822437286377e-06, 2.771615982055664e-06, 7.756054401397705e-06, 1.2740492820739746e-05, 1.7724931240081787e-05, 2.2709369659423828e-05, 2.769380807876587e-05, 3.267824649810791e-05, 3.766268491744995e-05, 4.264712333679199e-05, 4.763156175613403e-05, 5.2616000175476074e-05, 5.7600438594818115e-05, 6.258487701416016e-05, 6.75693154335022e-05, 7.255375385284424e-05, 7.753819227218628e-05, 8.252263069152832e-05, 8.750706911087036e-05, 9.24915075302124e-05, 9.747594594955444e-05, 0.00010246038436889648, 0.00010744482278823853, 0.00011242926120758057, 0.00011741369962692261, 0.00012239813804626465, 0.0001273825764656067, 0.00013236701488494873, 0.00013735145330429077, 0.0001423358917236328]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 7.0, 8.0, 11.0, 16.0, 28.0, 39.0, 47.0, 81.0, 140.0, 177.0, 290.0, 506.0, 967.0, 1819.0, 3557.0, 7683.0, 18442.0, 52822.0, 236453.0, 530000.0, 133896.0, 35902.0, 13515.0, 5903.0, 2792.0, 1449.0, 773.0, 459.0, 271.0, 144.0, 94.0, 78.0, 51.0, 24.0, 23.0, 19.0, 17.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1939697265625, -0.18777847290039062, -0.18158721923828125, -0.17539596557617188, -0.1692047119140625, -0.16301345825195312, -0.15682220458984375, -0.15063095092773438, -0.144439697265625, -0.13824844360351562, -0.13205718994140625, -0.12586593627929688, -0.1196746826171875, -0.11348342895507812, -0.10729217529296875, -0.10110092163085938, -0.09490966796875, -0.08871841430664062, -0.08252716064453125, -0.07633590698242188, -0.0701446533203125, -0.06395339965820312, -0.05776214599609375, -0.051570892333984375, -0.045379638671875, -0.039188385009765625, -0.03299713134765625, -0.026805877685546875, -0.0206146240234375, -0.014423370361328125, -0.00823211669921875, -0.002040863037109375, 0.004150390625, 0.010341644287109375, 0.01653289794921875, 0.022724151611328125, 0.0289154052734375, 0.035106658935546875, 0.04129791259765625, 0.047489166259765625, 0.053680419921875, 0.059871673583984375, 0.06606292724609375, 0.07225418090820312, 0.0784454345703125, 0.08463668823242188, 0.09082794189453125, 0.09701919555664062, 0.10321044921875, 0.10940170288085938, 0.11559295654296875, 0.12178421020507812, 0.1279754638671875, 0.13416671752929688, 0.14035797119140625, 0.14654922485351562, 0.152740478515625, 0.15893173217773438, 0.16512298583984375, 0.17131423950195312, 0.1775054931640625, 0.18369674682617188, 0.18988800048828125, 0.19607925415039062, 0.2022705078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 10.0, 7.0, 9.0, 9.0, 22.0, 18.0, 26.0, 39.0, 43.0, 63.0, 116.0, 109.0, 124.0, 94.0, 77.0, 51.0, 34.0, 29.0, 14.0, 20.0, 9.0, 8.0, 6.0, 10.0, 8.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059051513671875, -0.057233333587646484, -0.05541515350341797, -0.05359697341918945, -0.05177879333496094, -0.04996061325073242, -0.048142433166503906, -0.04632425308227539, -0.044506072998046875, -0.04268789291381836, -0.040869712829589844, -0.03905153274536133, -0.03723335266113281, -0.0354151725769043, -0.03359699249267578, -0.031778812408447266, -0.02996063232421875, -0.028142452239990234, -0.02632427215576172, -0.024506092071533203, -0.022687911987304688, -0.020869731903076172, -0.019051551818847656, -0.01723337173461914, -0.015415191650390625, -0.01359701156616211, -0.011778831481933594, -0.009960651397705078, -0.008142471313476562, -0.006324291229248047, -0.004506111145019531, -0.0026879310607910156, -0.0008697509765625, 0.0009484291076660156, 0.0027666091918945312, 0.004584789276123047, 0.0064029693603515625, 0.008221149444580078, 0.010039329528808594, 0.01185750961303711, 0.013675689697265625, 0.01549386978149414, 0.017312049865722656, 0.019130229949951172, 0.020948410034179688, 0.022766590118408203, 0.02458477020263672, 0.026402950286865234, 0.02822113037109375, 0.030039310455322266, 0.03185749053955078, 0.0336756706237793, 0.03549385070800781, 0.03731203079223633, 0.039130210876464844, 0.04094839096069336, 0.042766571044921875, 0.04458475112915039, 0.046402931213378906, 0.04822111129760742, 0.05003929138183594, 0.05185747146606445, 0.05367565155029297, 0.055493831634521484, 0.05731201171875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 15.0, 19.0, 51.0, 81.0, 115.0, 145.0, 179.0, 145.0, 111.0, 56.0, 31.0, 21.0, 9.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.060208320617676, -1.9967817068099976, -1.9333550930023193, -1.8699283599853516, -1.8065017461776733, -1.7430751323699951, -1.679648518562317, -1.6162219047546387, -1.552795171737671, -1.4893685579299927, -1.4259419441223145, -1.3625152111053467, -1.2990885972976685, -1.2356619834899902, -1.172235369682312, -1.1088087558746338, -1.0453821420669556, -0.9819555282592773, -0.9185288548469543, -0.8551022410392761, -0.7916755676269531, -0.7282489538192749, -0.6648223400115967, -0.6013957262039185, -0.5379690527915955, -0.47454240918159485, -0.41111576557159424, -0.347689151763916, -0.2842625081539154, -0.2208358645439148, -0.15740925073623657, -0.09398260712623596, -0.0305558443069458, 0.03287079185247421, 0.09629742801189423, 0.15972405672073364, 0.22315070033073425, 0.28657734394073486, 0.3500039577484131, 0.4134306013584137, 0.4768572449684143, 0.5402838587760925, 0.6037105321884155, 0.6671371459960938, 0.730563759803772, 0.793990433216095, 0.8574170470237732, 0.9208437204360962, 0.9842703342437744, 1.0476969480514526, 1.1111235618591309, 1.1745502948760986, 1.2379769086837769, 1.301403522491455, 1.3648301362991333, 1.4282567501068115, 1.4916834831237793, 1.5551100969314575, 1.6185367107391357, 1.6819634437561035, 1.7453900575637817, 1.80881667137146, 1.8722432851791382, 1.9356698989868164, 1.9990965127944946]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 15.0, 8.0, 14.0, 21.0, 25.0, 22.0, 30.0, 29.0, 29.0, 43.0, 49.0, 38.0, 47.0, 39.0, 59.0, 52.0, 35.0, 48.0, 46.0, 51.0, 54.0, 36.0, 34.0, 36.0, 36.0, 27.0, 21.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8579243421554565, -0.8328648209571838, -0.8078052997589111, -0.7827457785606384, -0.7576862573623657, -0.732626736164093, -0.7075672149658203, -0.6825076937675476, -0.6574481725692749, -0.6323886513710022, -0.6073291301727295, -0.5822696089744568, -0.5572100877761841, -0.5321505665779114, -0.5070910453796387, -0.48203152418136597, -0.45697200298309326, -0.43191248178482056, -0.40685296058654785, -0.38179343938827515, -0.35673391819000244, -0.33167439699172974, -0.30661487579345703, -0.2815553545951843, -0.2564958333969116, -0.23143631219863892, -0.2063767910003662, -0.1813172698020935, -0.1562577486038208, -0.1311982274055481, -0.10613870620727539, -0.08107918500900269, -0.05601966381072998, -0.030960142612457275, -0.00590062141418457, 0.019158899784088135, 0.04421842098236084, 0.06927794218063354, 0.09433746337890625, 0.11939698457717896, 0.14445650577545166, 0.16951602697372437, 0.19457554817199707, 0.21963506937026978, 0.24469459056854248, 0.2697541117668152, 0.2948136329650879, 0.3198731541633606, 0.3449326753616333, 0.369992196559906, 0.3950517177581787, 0.4201112389564514, 0.4451707601547241, 0.4702302813529968, 0.49528980255126953, 0.5203493237495422, 0.5454088449478149, 0.5704683661460876, 0.5955278873443604, 0.6205874085426331, 0.6456469297409058, 0.6707064509391785, 0.6957659721374512, 0.7208254933357239, 0.7458850145339966]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 16.0, 24.0, 50.0, 68.0, 149.0, 290.0, 546.0, 1500.0, 4508.0, 15311.0, 73450.0, 716081.0, 197768.0, 27460.0, 7387.0, 2261.0, 873.0, 381.0, 198.0, 85.0, 67.0, 33.0, 20.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.0656890869140625, -1.029815673828125, -0.9939422607421875, -0.95806884765625, -0.9221954345703125, -0.886322021484375, -0.8504486083984375, -0.8145751953125, -0.7787017822265625, -0.742828369140625, -0.7069549560546875, -0.67108154296875, -0.6352081298828125, -0.599334716796875, -0.5634613037109375, -0.527587890625, -0.4917144775390625, -0.455841064453125, -0.4199676513671875, -0.38409423828125, -0.3482208251953125, -0.312347412109375, -0.2764739990234375, -0.2406005859375, -0.2047271728515625, -0.168853759765625, -0.1329803466796875, -0.09710693359375, -0.0612335205078125, -0.025360107421875, 0.0105133056640625, 0.04638671875, 0.0822601318359375, 0.118133544921875, 0.1540069580078125, 0.18988037109375, 0.2257537841796875, 0.261627197265625, 0.2975006103515625, 0.3333740234375, 0.3692474365234375, 0.405120849609375, 0.4409942626953125, 0.47686767578125, 0.5127410888671875, 0.548614501953125, 0.5844879150390625, 0.620361328125, 0.6562347412109375, 0.692108154296875, 0.7279815673828125, 0.76385498046875, 0.7997283935546875, 0.835601806640625, 0.8714752197265625, 0.9073486328125, 0.9432220458984375, 0.979095458984375, 1.0149688720703125, 1.05084228515625, 1.0867156982421875, 1.122589111328125, 1.1584625244140625, 1.1943359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 18.0, 20.0, 17.0, 28.0, 44.0, 49.0, 40.0, 65.0, 68.0, 67.0, 82.0, 63.0, 65.0, 83.0, 63.0, 60.0, 41.0, 38.0, 28.0, 15.0, 15.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.7590789794921875, -2.686126708984375, -2.6131744384765625, -2.54022216796875, -2.4672698974609375, -2.394317626953125, -2.3213653564453125, -2.2484130859375, -2.1754608154296875, -2.102508544921875, -2.0295562744140625, -1.95660400390625, -1.8836517333984375, -1.810699462890625, -1.7377471923828125, -1.664794921875, -1.5918426513671875, -1.518890380859375, -1.4459381103515625, -1.37298583984375, -1.3000335693359375, -1.227081298828125, -1.1541290283203125, -1.0811767578125, -1.0082244873046875, -0.935272216796875, -0.8623199462890625, -0.78936767578125, -0.7164154052734375, -0.643463134765625, -0.5705108642578125, -0.49755859375, -0.4246063232421875, -0.351654052734375, -0.2787017822265625, -0.20574951171875, -0.1327972412109375, -0.059844970703125, 0.0131072998046875, 0.0860595703125, 0.1590118408203125, 0.231964111328125, 0.3049163818359375, 0.37786865234375, 0.4508209228515625, 0.523773193359375, 0.5967254638671875, 0.669677734375, 0.7426300048828125, 0.815582275390625, 0.8885345458984375, 0.96148681640625, 1.0344390869140625, 1.107391357421875, 1.1803436279296875, 1.2532958984375, 1.3262481689453125, 1.399200439453125, 1.4721527099609375, 1.54510498046875, 1.6180572509765625, 1.691009521484375, 1.7639617919921875, 1.8369140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 7.0, 7.0, 9.0, 8.0, 13.0, 20.0, 24.0, 24.0, 25.0, 42.0, 53.0, 97.0, 120.0, 212.0, 483.0, 1507.0, 21615.0, 970441.0, 50223.0, 2307.0, 564.0, 233.0, 154.0, 94.0, 58.0, 45.0, 31.0, 26.0, 21.0, 15.0, 14.0, 8.0, 7.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.06640625, -2.972381591796875, -2.87835693359375, -2.784332275390625, -2.6903076171875, -2.596282958984375, -2.50225830078125, -2.408233642578125, -2.314208984375, -2.220184326171875, -2.12615966796875, -2.032135009765625, -1.9381103515625, -1.844085693359375, -1.75006103515625, -1.656036376953125, -1.56201171875, -1.467987060546875, -1.37396240234375, -1.279937744140625, -1.1859130859375, -1.091888427734375, -0.99786376953125, -0.903839111328125, -0.809814453125, -0.715789794921875, -0.62176513671875, -0.527740478515625, -0.4337158203125, -0.339691162109375, -0.24566650390625, -0.151641845703125, -0.0576171875, 0.036407470703125, 0.13043212890625, 0.224456787109375, 0.3184814453125, 0.412506103515625, 0.50653076171875, 0.600555419921875, 0.694580078125, 0.788604736328125, 0.88262939453125, 0.976654052734375, 1.0706787109375, 1.164703369140625, 1.25872802734375, 1.352752685546875, 1.44677734375, 1.540802001953125, 1.63482666015625, 1.728851318359375, 1.8228759765625, 1.916900634765625, 2.01092529296875, 2.104949951171875, 2.198974609375, 2.292999267578125, 2.38702392578125, 2.481048583984375, 2.5750732421875, 2.669097900390625, 2.76312255859375, 2.857147216796875, 2.951171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 4.0, 7.0, 5.0, 15.0, 6.0, 10.0, 11.0, 11.0, 24.0, 14.0, 22.0, 29.0, 35.0, 28.0, 45.0, 34.0, 50.0, 47.0, 59.0, 52.0, 40.0, 61.0, 53.0, 63.0, 35.0, 42.0, 30.0, 21.0, 28.0, 23.0, 16.0, 12.0, 8.0, 13.0, 6.0, 9.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0], "bins": [-2.25390625, -2.1930694580078125, -2.132232666015625, -2.0713958740234375, -2.01055908203125, -1.9497222900390625, -1.888885498046875, -1.8280487060546875, -1.7672119140625, -1.7063751220703125, -1.645538330078125, -1.5847015380859375, -1.52386474609375, -1.4630279541015625, -1.402191162109375, -1.3413543701171875, -1.280517578125, -1.2196807861328125, -1.158843994140625, -1.0980072021484375, -1.03717041015625, -0.9763336181640625, -0.915496826171875, -0.8546600341796875, -0.7938232421875, -0.7329864501953125, -0.672149658203125, -0.6113128662109375, -0.55047607421875, -0.4896392822265625, -0.428802490234375, -0.3679656982421875, -0.30712890625, -0.2462921142578125, -0.185455322265625, -0.1246185302734375, -0.06378173828125, -0.0029449462890625, 0.057891845703125, 0.1187286376953125, 0.1795654296875, 0.2404022216796875, 0.301239013671875, 0.3620758056640625, 0.42291259765625, 0.4837493896484375, 0.544586181640625, 0.6054229736328125, 0.666259765625, 0.7270965576171875, 0.787933349609375, 0.8487701416015625, 0.90960693359375, 0.9704437255859375, 1.031280517578125, 1.0921173095703125, 1.1529541015625, 1.2137908935546875, 1.274627685546875, 1.3354644775390625, 1.39630126953125, 1.4571380615234375, 1.517974853515625, 1.5788116455078125, 1.6396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 9.0, 8.0, 21.0, 29.0, 41.0, 109.0, 170.0, 548.0, 1671.0, 9158.0, 144354.0, 858601.0, 29087.0, 3417.0, 776.0, 306.0, 113.0, 58.0, 21.0, 26.0, 13.0, 9.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.27034759521484375, -0.2526092529296875, -0.23487091064453125, -0.217132568359375, -0.19939422607421875, -0.1816558837890625, -0.16391754150390625, -0.14617919921875, -0.12844085693359375, -0.1107025146484375, -0.09296417236328125, -0.075225830078125, -0.05748748779296875, -0.0397491455078125, -0.02201080322265625, -0.0042724609375, 0.01346588134765625, 0.0312042236328125, 0.04894256591796875, 0.066680908203125, 0.08441925048828125, 0.1021575927734375, 0.11989593505859375, 0.13763427734375, 0.15537261962890625, 0.1731109619140625, 0.19084930419921875, 0.208587646484375, 0.22632598876953125, 0.2440643310546875, 0.26180267333984375, 0.279541015625, 0.29727935791015625, 0.3150177001953125, 0.33275604248046875, 0.350494384765625, 0.36823272705078125, 0.3859710693359375, 0.40370941162109375, 0.42144775390625, 0.43918609619140625, 0.4569244384765625, 0.47466278076171875, 0.492401123046875, 0.5101394653320312, 0.5278778076171875, 0.5456161499023438, 0.5633544921875, 0.5810928344726562, 0.5988311767578125, 0.6165695190429688, 0.634307861328125, 0.6520462036132812, 0.6697845458984375, 0.6875228881835938, 0.70526123046875, 0.7229995727539062, 0.7407379150390625, 0.7584762573242188, 0.776214599609375, 0.7939529418945312, 0.8116912841796875, 0.8294296264648438, 0.84716796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 21.0, 28.0, 62.0, 102.0, 169.0, 234.0, 118.0, 89.0, 63.0, 36.0, 17.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4717063903808594e-05, -5.285162478685379e-05, -5.098618566989899e-05, -4.912074655294418e-05, -4.725530743598938e-05, -4.5389868319034576e-05, -4.352442920207977e-05, -4.165899008512497e-05, -3.9793550968170166e-05, -3.792811185121536e-05, -3.606267273426056e-05, -3.4197233617305756e-05, -3.233179450035095e-05, -3.046635538339615e-05, -2.8600916266441345e-05, -2.6735477149486542e-05, -2.4870038032531738e-05, -2.3004598915576935e-05, -2.113915979862213e-05, -1.9273720681667328e-05, -1.7408281564712524e-05, -1.554284244775772e-05, -1.3677403330802917e-05, -1.1811964213848114e-05, -9.94652509689331e-06, -8.081085979938507e-06, -6.215646862983704e-06, -4.3502077460289e-06, -2.4847686290740967e-06, -6.193295121192932e-07, 1.2461096048355103e-06, 3.1115487217903137e-06, 4.976987838745117e-06, 6.842426955699921e-06, 8.707866072654724e-06, 1.0573305189609528e-05, 1.2438744306564331e-05, 1.4304183423519135e-05, 1.6169622540473938e-05, 1.803506165742874e-05, 1.9900500774383545e-05, 2.176593989133835e-05, 2.3631379008293152e-05, 2.5496818125247955e-05, 2.736225724220276e-05, 2.9227696359157562e-05, 3.1093135476112366e-05, 3.295857459306717e-05, 3.482401371002197e-05, 3.6689452826976776e-05, 3.855489194393158e-05, 4.042033106088638e-05, 4.2285770177841187e-05, 4.415120929479599e-05, 4.6016648411750793e-05, 4.78820875287056e-05, 4.97475266456604e-05, 5.1612965762615204e-05, 5.347840487957001e-05, 5.534384399652481e-05, 5.7209283113479614e-05, 5.907472223043442e-05, 6.094016134738922e-05, 6.280560046434402e-05, 6.467103958129883e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 11.0, 8.0, 10.0, 16.0, 30.0, 42.0, 108.0, 145.0, 280.0, 615.0, 1598.0, 5696.0, 40779.0, 858710.0, 124939.0, 11351.0, 2448.0, 883.0, 402.0, 208.0, 101.0, 78.0, 38.0, 19.0, 14.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74365234375, -0.7253799438476562, -0.7071075439453125, -0.6888351440429688, -0.670562744140625, -0.6522903442382812, -0.6340179443359375, -0.6157455444335938, -0.59747314453125, -0.5792007446289062, -0.5609283447265625, -0.5426559448242188, -0.524383544921875, -0.5061111450195312, -0.4878387451171875, -0.46956634521484375, -0.4512939453125, -0.43302154541015625, -0.4147491455078125, -0.39647674560546875, -0.378204345703125, -0.35993194580078125, -0.3416595458984375, -0.32338714599609375, -0.30511474609375, -0.28684234619140625, -0.2685699462890625, -0.25029754638671875, -0.232025146484375, -0.21375274658203125, -0.1954803466796875, -0.17720794677734375, -0.158935546875, -0.14066314697265625, -0.1223907470703125, -0.10411834716796875, -0.085845947265625, -0.06757354736328125, -0.0493011474609375, -0.03102874755859375, -0.01275634765625, 0.00551605224609375, 0.0237884521484375, 0.04206085205078125, 0.060333251953125, 0.07860565185546875, 0.0968780517578125, 0.11515045166015625, 0.1334228515625, 0.15169525146484375, 0.1699676513671875, 0.18824005126953125, 0.206512451171875, 0.22478485107421875, 0.2430572509765625, 0.26132965087890625, 0.27960205078125, 0.29787445068359375, 0.3161468505859375, 0.33441925048828125, 0.352691650390625, 0.37096405029296875, 0.3892364501953125, 0.40750885009765625, 0.42578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 20.0, 21.0, 27.0, 38.0, 50.0, 133.0, 146.0, 199.0, 113.0, 59.0, 47.0, 28.0, 23.0, 10.0, 12.0, 10.0, 9.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12276458740234375, -0.1172332763671875, -0.11170196533203125, -0.106170654296875, -0.10063934326171875, -0.0951080322265625, -0.08957672119140625, -0.08404541015625, -0.07851409912109375, -0.0729827880859375, -0.06745147705078125, -0.061920166015625, -0.05638885498046875, -0.0508575439453125, -0.04532623291015625, -0.039794921875, -0.03426361083984375, -0.0287322998046875, -0.02320098876953125, -0.017669677734375, -0.01213836669921875, -0.0066070556640625, -0.00107574462890625, 0.00445556640625, 0.00998687744140625, 0.0155181884765625, 0.02104949951171875, 0.026580810546875, 0.03211212158203125, 0.0376434326171875, 0.04317474365234375, 0.0487060546875, 0.05423736572265625, 0.0597686767578125, 0.06529998779296875, 0.070831298828125, 0.07636260986328125, 0.0818939208984375, 0.08742523193359375, 0.09295654296875, 0.09848785400390625, 0.1040191650390625, 0.10955047607421875, 0.115081787109375, 0.12061309814453125, 0.1261444091796875, 0.13167572021484375, 0.13720703125, 0.14273834228515625, 0.1482696533203125, 0.15380096435546875, 0.159332275390625, 0.16486358642578125, 0.1703948974609375, 0.17592620849609375, 0.18145751953125, 0.18698883056640625, 0.1925201416015625, 0.19805145263671875, 0.203582763671875, 0.20911407470703125, 0.2146453857421875, 0.22017669677734375, 0.2257080078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 29.0, 44.0, 112.0, 162.0, 215.0, 199.0, 133.0, 51.0, 20.0, 16.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.017664909362793, -5.844317436218262, -5.670969486236572, -5.497621536254883, -5.324274063110352, -5.15092658996582, -4.977578639984131, -4.804230690002441, -4.63088321685791, -4.457535743713379, -4.2841877937316895, -4.11083984375, -3.9374923706054688, -3.7641446590423584, -3.590796947479248, -3.4174492359161377, -3.2441015243530273, -3.070753812789917, -2.8974061012268066, -2.7240583896636963, -2.550710678100586, -2.3773629665374756, -2.2040152549743652, -2.030667543411255, -1.8573198318481445, -1.6839721202850342, -1.5106244087219238, -1.3372766971588135, -1.1639289855957031, -0.9905812740325928, -0.8172335624694824, -0.6438858509063721, -0.4705386161804199, -0.29719090461730957, -0.12384319305419922, 0.04950451850891113, 0.22285223007202148, 0.39619994163513184, 0.5695476531982422, 0.7428953647613525, 0.9162430763244629, 1.0895907878875732, 1.2629384994506836, 1.436286211013794, 1.6096339225769043, 1.7829816341400146, 1.956329345703125, 2.1296770572662354, 2.3030247688293457, 2.476372480392456, 2.6497201919555664, 2.8230679035186768, 2.996415615081787, 3.1697633266448975, 3.343111038208008, 3.516458749771118, 3.6898064613342285, 3.863154172897339, 4.036501884460449, 4.2098493576049805, 4.38319730758667, 4.556545257568359, 4.729892730712891, 4.903240203857422, 5.076588153839111]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 12.0, 8.0, 8.0, 16.0, 14.0, 23.0, 8.0, 25.0, 37.0, 28.0, 31.0, 34.0, 58.0, 41.0, 49.0, 44.0, 51.0, 47.0, 65.0, 37.0, 39.0, 49.0, 42.0, 43.0, 35.0, 26.0, 22.0, 37.0, 16.0, 15.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.8116557598114014, -3.7090628147125244, -3.6064701080322266, -3.5038771629333496, -3.4012842178344727, -3.298691511154175, -3.196098566055298, -3.093505859375, -2.990912914276123, -2.888319969177246, -2.7857272624969482, -2.6831343173980713, -2.5805416107177734, -2.4779486656188965, -2.3753557205200195, -2.2727627754211426, -2.1701700687408447, -2.0675771236419678, -1.96498441696167, -1.862391471862793, -1.7597986459732056, -1.6572058200836182, -1.5546128749847412, -1.4520200490951538, -1.3494272232055664, -1.246834397315979, -1.1442415714263916, -1.0416486263275146, -0.9390558004379272, -0.8364629745483398, -0.7338700890541077, -0.6312772035598755, -0.5286843776702881, -0.4260915219783783, -0.3234986662864685, -0.22090581059455872, -0.11831295490264893, -0.015720129013061523, 0.08687275648117065, 0.18946564197540283, 0.29205846786499023, 0.3946513235569, 0.4972441792488098, 0.599837064743042, 0.7024298906326294, 0.8050227165222168, 0.907615602016449, 1.0102084875106812, 1.1128013134002686, 1.215394139289856, 1.3179869651794434, 1.4205799102783203, 1.5231727361679077, 1.6257655620574951, 1.728358507156372, 1.8309513330459595, 1.9335441589355469, 2.036137104034424, 2.1387298107147217, 2.2413227558135986, 2.3439154624938965, 2.4465084075927734, 2.5491013526916504, 2.6516942977905273, 2.754287004470825]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 7.0, 5.0, 12.0, 11.0, 13.0, 16.0, 21.0, 31.0, 43.0, 46.0, 63.0, 101.0, 163.0, 442.0, 1369.0, 7793.0, 144285.0, 3647339.0, 377858.0, 11628.0, 1874.0, 539.0, 205.0, 118.0, 90.0, 45.0, 42.0, 33.0, 21.0, 17.0, 18.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.51171875, -3.410247802734375, -3.30877685546875, -3.207305908203125, -3.1058349609375, -3.004364013671875, -2.90289306640625, -2.801422119140625, -2.699951171875, -2.598480224609375, -2.49700927734375, -2.395538330078125, -2.2940673828125, -2.192596435546875, -2.09112548828125, -1.989654541015625, -1.88818359375, -1.786712646484375, -1.68524169921875, -1.583770751953125, -1.4822998046875, -1.380828857421875, -1.27935791015625, -1.177886962890625, -1.076416015625, -0.974945068359375, -0.87347412109375, -0.772003173828125, -0.6705322265625, -0.569061279296875, -0.46759033203125, -0.366119384765625, -0.2646484375, -0.163177490234375, -0.06170654296875, 0.039764404296875, 0.1412353515625, 0.242706298828125, 0.34417724609375, 0.445648193359375, 0.547119140625, 0.648590087890625, 0.75006103515625, 0.851531982421875, 0.9530029296875, 1.054473876953125, 1.15594482421875, 1.257415771484375, 1.35888671875, 1.460357666015625, 1.56182861328125, 1.663299560546875, 1.7647705078125, 1.866241455078125, 1.96771240234375, 2.069183349609375, 2.170654296875, 2.272125244140625, 2.37359619140625, 2.475067138671875, 2.5765380859375, 2.678009033203125, 2.77947998046875, 2.880950927734375, 2.982421875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 7.0, 6.0, 15.0, 11.0, 19.0, 17.0, 22.0, 23.0, 36.0, 33.0, 42.0, 48.0, 38.0, 46.0, 48.0, 41.0, 51.0, 36.0, 39.0, 50.0, 49.0, 43.0, 35.0, 41.0, 49.0, 24.0, 28.0, 21.0, 12.0, 13.0, 8.0, 11.0, 9.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8232345581054688, -0.7924652099609375, -0.7616958618164062, -0.730926513671875, -0.7001571655273438, -0.6693878173828125, -0.6386184692382812, -0.60784912109375, -0.5770797729492188, -0.5463104248046875, -0.5155410766601562, -0.484771728515625, -0.45400238037109375, -0.4232330322265625, -0.39246368408203125, -0.3616943359375, -0.33092498779296875, -0.3001556396484375, -0.26938629150390625, -0.238616943359375, -0.20784759521484375, -0.1770782470703125, -0.14630889892578125, -0.11553955078125, -0.08477020263671875, -0.0540008544921875, -0.02323150634765625, 0.007537841796875, 0.03830718994140625, 0.0690765380859375, 0.09984588623046875, 0.130615234375, 0.16138458251953125, 0.1921539306640625, 0.22292327880859375, 0.253692626953125, 0.28446197509765625, 0.3152313232421875, 0.34600067138671875, 0.37677001953125, 0.40753936767578125, 0.4383087158203125, 0.46907806396484375, 0.499847412109375, 0.5306167602539062, 0.5613861083984375, 0.5921554565429688, 0.6229248046875, 0.6536941528320312, 0.6844635009765625, 0.7152328491210938, 0.746002197265625, 0.7767715454101562, 0.8075408935546875, 0.8383102416992188, 0.86907958984375, 0.8998489379882812, 0.9306182861328125, 0.9613876342773438, 0.992156982421875, 1.0229263305664062, 1.0536956787109375, 1.0844650268554688, 1.115234375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 23.0, 44.0, 82.0, 167.0, 427.0, 1489.0, 8546.0, 465643.0, 3692374.0, 21799.0, 2536.0, 663.0, 227.0, 102.0, 45.0, 36.0, 21.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9205322265625, -3.770751953125, -3.6209716796875, -3.47119140625, -3.3214111328125, -3.171630859375, -3.0218505859375, -2.8720703125, -2.7222900390625, -2.572509765625, -2.4227294921875, -2.27294921875, -2.1231689453125, -1.973388671875, -1.8236083984375, -1.673828125, -1.5240478515625, -1.374267578125, -1.2244873046875, -1.07470703125, -0.9249267578125, -0.775146484375, -0.6253662109375, -0.4755859375, -0.3258056640625, -0.176025390625, -0.0262451171875, 0.12353515625, 0.2733154296875, 0.423095703125, 0.5728759765625, 0.72265625, 0.8724365234375, 1.022216796875, 1.1719970703125, 1.32177734375, 1.4715576171875, 1.621337890625, 1.7711181640625, 1.9208984375, 2.0706787109375, 2.220458984375, 2.3702392578125, 2.52001953125, 2.6697998046875, 2.819580078125, 2.9693603515625, 3.119140625, 3.2689208984375, 3.418701171875, 3.5684814453125, 3.71826171875, 3.8680419921875, 4.017822265625, 4.1676025390625, 4.3173828125, 4.4671630859375, 4.616943359375, 4.7667236328125, 4.91650390625, 5.0662841796875, 5.216064453125, 5.3658447265625, 5.515625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 12.0, 20.0, 48.0, 73.0, 115.0, 236.0, 485.0, 900.0, 954.0, 588.0, 279.0, 146.0, 81.0, 51.0, 31.0, 19.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.958984375, -0.9308853149414062, -0.9027862548828125, -0.8746871948242188, -0.846588134765625, -0.8184890747070312, -0.7903900146484375, -0.7622909545898438, -0.73419189453125, -0.7060928344726562, -0.6779937744140625, -0.6498947143554688, -0.621795654296875, -0.5936965942382812, -0.5655975341796875, -0.5374984741210938, -0.5093994140625, -0.48130035400390625, -0.4532012939453125, -0.42510223388671875, -0.397003173828125, -0.36890411376953125, -0.3408050537109375, -0.31270599365234375, -0.28460693359375, -0.25650787353515625, -0.2284088134765625, -0.20030975341796875, -0.172210693359375, -0.14411163330078125, -0.1160125732421875, -0.08791351318359375, -0.059814453125, -0.03171539306640625, -0.0036163330078125, 0.02448272705078125, 0.052581787109375, 0.08068084716796875, 0.1087799072265625, 0.13687896728515625, 0.16497802734375, 0.19307708740234375, 0.2211761474609375, 0.24927520751953125, 0.277374267578125, 0.30547332763671875, 0.3335723876953125, 0.36167144775390625, 0.3897705078125, 0.41786956787109375, 0.4459686279296875, 0.47406768798828125, 0.502166748046875, 0.5302658081054688, 0.5583648681640625, 0.5864639282226562, 0.61456298828125, 0.6426620483398438, 0.6707611083984375, 0.6988601684570312, 0.726959228515625, 0.7550582885742188, 0.7831573486328125, 0.8112564086914062, 0.83935546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 9.0, 14.0, 21.0, 22.0, 32.0, 47.0, 46.0, 75.0, 76.0, 95.0, 94.0, 105.0, 91.0, 71.0, 55.0, 45.0, 27.0, 28.0, 14.0, 13.0, 12.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474672555923462, -2.410276174545288, -2.3458797931671143, -2.2814831733703613, -2.2170867919921875, -2.1526904106140137, -2.08829402923584, -2.023897647857666, -1.9595011472702026, -1.8951047658920288, -1.8307082653045654, -1.7663118839263916, -1.7019155025482178, -1.6375190019607544, -1.5731226205825806, -1.5087261199951172, -1.4443297386169434, -1.3799333572387695, -1.3155368566513062, -1.2511404752731323, -1.186743974685669, -1.1223475933074951, -1.0579512119293213, -0.9935547709465027, -0.9291583299636841, -0.8647618889808655, -0.8003654479980469, -0.735969066619873, -0.6715726256370544, -0.6071761846542358, -0.542779803276062, -0.4783833622932434, -0.4139869213104248, -0.3495904803276062, -0.28519406914711, -0.22079764306545258, -0.15640121698379517, -0.09200477600097656, -0.027608364820480347, 0.03678804636001587, 0.10118448734283447, 0.16558091342449188, 0.2299773395061493, 0.2943737506866455, 0.3587701916694641, 0.4231666326522827, 0.48756304383277893, 0.5519594550132751, 0.6163558959960938, 0.6807523369789124, 0.745148777961731, 0.8095451593399048, 0.8739416003227234, 0.938338041305542, 1.0027344226837158, 1.0671308040618896, 1.131527304649353, 1.1959236860275269, 1.2603201866149902, 1.324716567993164, 1.389112949371338, 1.4535094499588013, 1.517905831336975, 1.5823023319244385, 1.6466987133026123]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 3.0, 14.0, 7.0, 18.0, 14.0, 13.0, 20.0, 18.0, 25.0, 31.0, 34.0, 40.0, 47.0, 41.0, 50.0, 46.0, 53.0, 41.0, 43.0, 42.0, 42.0, 44.0, 45.0, 28.0, 39.0, 31.0, 22.0, 26.0, 25.0, 22.0, 16.0, 13.0, 7.0, 6.0, 12.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.220424771308899, -1.1819335222244263, -1.1434423923492432, -1.1049511432647705, -1.0664600133895874, -1.0279687643051147, -0.9894775748252869, -0.950986385345459, -0.9124951958656311, -0.8740040063858032, -0.8355128169059753, -0.7970216274261475, -0.7585303783416748, -0.7200392484664917, -0.681547999382019, -0.6430568099021912, -0.6045656204223633, -0.5660744309425354, -0.5275832414627075, -0.48909202218055725, -0.45060083270072937, -0.4121096432209015, -0.3736184239387512, -0.33512723445892334, -0.29663604497909546, -0.2581448554992676, -0.2196536511182785, -0.18116244673728943, -0.14267125725746155, -0.10418006777763367, -0.06568886339664459, -0.027197659015655518, 0.011293649673461914, 0.04978484660387039, 0.08827604353427887, 0.12676724791526794, 0.16525843739509583, 0.2037496268749237, 0.24224083125591278, 0.28073203563690186, 0.31922322511672974, 0.3577144145965576, 0.3962056040763855, 0.43469682335853577, 0.47318801283836365, 0.5116791725158691, 0.5501704216003418, 0.5886616110801697, 0.6271528005599976, 0.6656439900398254, 0.7041351795196533, 0.7426263689994812, 0.7811175584793091, 0.8196088075637817, 0.8580999970436096, 0.8965911865234375, 0.9350823760032654, 0.9735735654830933, 1.012064814567566, 1.050555944442749, 1.0890471935272217, 1.1275383234024048, 1.1660295724868774, 1.2045207023620605, 1.2430119514465332]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 3.0, 8.0, 10.0, 20.0, 33.0, 49.0, 67.0, 134.0, 278.0, 494.0, 933.0, 1847.0, 3912.0, 10614.0, 59890.0, 639871.0, 291750.0, 25923.0, 6828.0, 2910.0, 1328.0, 738.0, 386.0, 224.0, 130.0, 72.0, 37.0, 26.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.853515625, -0.8266754150390625, -0.799835205078125, -0.7729949951171875, -0.74615478515625, -0.7193145751953125, -0.692474365234375, -0.6656341552734375, -0.6387939453125, -0.6119537353515625, -0.585113525390625, -0.5582733154296875, -0.53143310546875, -0.5045928955078125, -0.477752685546875, -0.4509124755859375, -0.424072265625, -0.3972320556640625, -0.370391845703125, -0.3435516357421875, -0.31671142578125, -0.2898712158203125, -0.263031005859375, -0.2361907958984375, -0.2093505859375, -0.1825103759765625, -0.155670166015625, -0.1288299560546875, -0.10198974609375, -0.0751495361328125, -0.048309326171875, -0.0214691162109375, 0.00537109375, 0.0322113037109375, 0.059051513671875, 0.0858917236328125, 0.11273193359375, 0.1395721435546875, 0.166412353515625, 0.1932525634765625, 0.2200927734375, 0.2469329833984375, 0.273773193359375, 0.3006134033203125, 0.32745361328125, 0.3542938232421875, 0.381134033203125, 0.4079742431640625, 0.434814453125, 0.4616546630859375, 0.488494873046875, 0.5153350830078125, 0.54217529296875, 0.5690155029296875, 0.595855712890625, 0.6226959228515625, 0.6495361328125, 0.6763763427734375, 0.703216552734375, 0.7300567626953125, 0.75689697265625, 0.7837371826171875, 0.810577392578125, 0.8374176025390625, 0.8642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 9.0, 8.0, 10.0, 11.0, 16.0, 15.0, 20.0, 23.0, 27.0, 46.0, 43.0, 40.0, 60.0, 63.0, 44.0, 47.0, 44.0, 50.0, 31.0, 49.0, 39.0, 33.0, 30.0, 33.0, 37.0, 26.0, 28.0, 22.0, 20.0, 15.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.931640625, -0.904449462890625, -0.87725830078125, -0.850067138671875, -0.8228759765625, -0.795684814453125, -0.76849365234375, -0.741302490234375, -0.714111328125, -0.686920166015625, -0.65972900390625, -0.632537841796875, -0.6053466796875, -0.578155517578125, -0.55096435546875, -0.523773193359375, -0.49658203125, -0.469390869140625, -0.44219970703125, -0.415008544921875, -0.3878173828125, -0.360626220703125, -0.33343505859375, -0.306243896484375, -0.279052734375, -0.251861572265625, -0.22467041015625, -0.197479248046875, -0.1702880859375, -0.143096923828125, -0.11590576171875, -0.088714599609375, -0.0615234375, -0.034332275390625, -0.00714111328125, 0.020050048828125, 0.0472412109375, 0.074432373046875, 0.10162353515625, 0.128814697265625, 0.156005859375, 0.183197021484375, 0.21038818359375, 0.237579345703125, 0.2647705078125, 0.291961669921875, 0.31915283203125, 0.346343994140625, 0.37353515625, 0.400726318359375, 0.42791748046875, 0.455108642578125, 0.4822998046875, 0.509490966796875, 0.53668212890625, 0.563873291015625, 0.591064453125, 0.618255615234375, 0.64544677734375, 0.672637939453125, 0.6998291015625, 0.727020263671875, 0.75421142578125, 0.781402587890625, 0.80859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 10.0, 13.0, 18.0, 19.0, 36.0, 56.0, 67.0, 115.0, 172.0, 254.0, 389.0, 599.0, 1092.0, 2212.0, 4774.0, 13473.0, 237743.0, 736886.0, 36829.0, 6940.0, 3121.0, 1462.0, 831.0, 471.0, 321.0, 212.0, 141.0, 78.0, 61.0, 44.0, 33.0, 22.0, 12.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8466796875, -0.815582275390625, -0.78448486328125, -0.753387451171875, -0.7222900390625, -0.691192626953125, -0.66009521484375, -0.628997802734375, -0.597900390625, -0.566802978515625, -0.53570556640625, -0.504608154296875, -0.4735107421875, -0.442413330078125, -0.41131591796875, -0.380218505859375, -0.34912109375, -0.318023681640625, -0.28692626953125, -0.255828857421875, -0.2247314453125, -0.193634033203125, -0.16253662109375, -0.131439208984375, -0.100341796875, -0.069244384765625, -0.03814697265625, -0.007049560546875, 0.0240478515625, 0.055145263671875, 0.08624267578125, 0.117340087890625, 0.1484375, 0.179534912109375, 0.21063232421875, 0.241729736328125, 0.2728271484375, 0.303924560546875, 0.33502197265625, 0.366119384765625, 0.397216796875, 0.428314208984375, 0.45941162109375, 0.490509033203125, 0.5216064453125, 0.552703857421875, 0.58380126953125, 0.614898681640625, 0.64599609375, 0.677093505859375, 0.70819091796875, 0.739288330078125, 0.7703857421875, 0.801483154296875, 0.83258056640625, 0.863677978515625, 0.894775390625, 0.925872802734375, 0.95697021484375, 0.988067626953125, 1.0191650390625, 1.050262451171875, 1.08135986328125, 1.112457275390625, 1.1435546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 12.0, 9.0, 16.0, 24.0, 16.0, 26.0, 30.0, 24.0, 43.0, 39.0, 38.0, 49.0, 56.0, 53.0, 50.0, 53.0, 48.0, 51.0, 48.0, 37.0, 45.0, 32.0, 33.0, 26.0, 21.0, 25.0, 9.0, 19.0, 8.0, 12.0, 10.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.0845947265625, -2.024658203125, -1.9647216796875, -1.90478515625, -1.8448486328125, -1.784912109375, -1.7249755859375, -1.6650390625, -1.6051025390625, -1.545166015625, -1.4852294921875, -1.42529296875, -1.3653564453125, -1.305419921875, -1.2454833984375, -1.185546875, -1.1256103515625, -1.065673828125, -1.0057373046875, -0.94580078125, -0.8858642578125, -0.825927734375, -0.7659912109375, -0.7060546875, -0.6461181640625, -0.586181640625, -0.5262451171875, -0.46630859375, -0.4063720703125, -0.346435546875, -0.2864990234375, -0.2265625, -0.1666259765625, -0.106689453125, -0.0467529296875, 0.01318359375, 0.0731201171875, 0.133056640625, 0.1929931640625, 0.2529296875, 0.3128662109375, 0.372802734375, 0.4327392578125, 0.49267578125, 0.5526123046875, 0.612548828125, 0.6724853515625, 0.732421875, 0.7923583984375, 0.852294921875, 0.9122314453125, 0.97216796875, 1.0321044921875, 1.092041015625, 1.1519775390625, 1.2119140625, 1.2718505859375, 1.331787109375, 1.3917236328125, 1.45166015625, 1.5115966796875, 1.571533203125, 1.6314697265625, 1.69140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 6.0, 10.0, 12.0, 27.0, 31.0, 47.0, 77.0, 88.0, 143.0, 270.0, 487.0, 825.0, 1511.0, 3226.0, 7423.0, 20270.0, 70811.0, 331725.0, 459063.0, 106544.0, 27820.0, 9849.0, 4017.0, 1872.0, 941.0, 583.0, 329.0, 186.0, 128.0, 79.0, 54.0, 20.0, 24.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1778564453125, -0.17248916625976562, -0.16712188720703125, -0.16175460815429688, -0.1563873291015625, -0.15102005004882812, -0.14565277099609375, -0.14028549194335938, -0.134918212890625, -0.12955093383789062, -0.12418365478515625, -0.11881637573242188, -0.1134490966796875, -0.10808181762695312, -0.10271453857421875, -0.09734725952148438, -0.09197998046875, -0.08661270141601562, -0.08124542236328125, -0.07587814331054688, -0.0705108642578125, -0.06514358520507812, -0.05977630615234375, -0.054409027099609375, -0.049041748046875, -0.043674468994140625, -0.03830718994140625, -0.032939910888671875, -0.0275726318359375, -0.022205352783203125, -0.01683807373046875, -0.011470794677734375, -0.006103515625, -0.000736236572265625, 0.00463104248046875, 0.009998321533203125, 0.0153656005859375, 0.020732879638671875, 0.02610015869140625, 0.031467437744140625, 0.036834716796875, 0.042201995849609375, 0.04756927490234375, 0.052936553955078125, 0.0583038330078125, 0.06367111206054688, 0.06903839111328125, 0.07440567016601562, 0.07977294921875, 0.08514022827148438, 0.09050750732421875, 0.09587478637695312, 0.1012420654296875, 0.10660934448242188, 0.11197662353515625, 0.11734390258789062, 0.122711181640625, 0.12807846069335938, 0.13344573974609375, 0.13881301879882812, 0.1441802978515625, 0.14954757690429688, 0.15491485595703125, 0.16028213500976562, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 8.0, 9.0, 17.0, 24.0, 39.0, 62.0, 91.0, 109.0, 149.0, 146.0, 103.0, 72.0, 35.0, 37.0, 24.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.749961853027344e-05, -8.497387170791626e-05, -8.244812488555908e-05, -7.99223780632019e-05, -7.739663124084473e-05, -7.487088441848755e-05, -7.234513759613037e-05, -6.98193907737732e-05, -6.729364395141602e-05, -6.476789712905884e-05, -6.224215030670166e-05, -5.971640348434448e-05, -5.7190656661987305e-05, -5.466490983963013e-05, -5.213916301727295e-05, -4.961341619491577e-05, -4.7087669372558594e-05, -4.4561922550201416e-05, -4.203617572784424e-05, -3.951042890548706e-05, -3.698468208312988e-05, -3.4458935260772705e-05, -3.193318843841553e-05, -2.940744161605835e-05, -2.6881694793701172e-05, -2.4355947971343994e-05, -2.1830201148986816e-05, -1.930445432662964e-05, -1.677870750427246e-05, -1.4252960681915283e-05, -1.1727213859558105e-05, -9.201467037200928e-06, -6.67572021484375e-06, -4.149973392486572e-06, -1.6242265701293945e-06, 9.015202522277832e-07, 3.427267074584961e-06, 5.953013896942139e-06, 8.478760719299316e-06, 1.1004507541656494e-05, 1.3530254364013672e-05, 1.605600118637085e-05, 1.8581748008728027e-05, 2.1107494831085205e-05, 2.3633241653442383e-05, 2.615898847579956e-05, 2.8684735298156738e-05, 3.1210482120513916e-05, 3.3736228942871094e-05, 3.626197576522827e-05, 3.878772258758545e-05, 4.131346940994263e-05, 4.3839216232299805e-05, 4.636496305465698e-05, 4.889070987701416e-05, 5.141645669937134e-05, 5.3942203521728516e-05, 5.646795034408569e-05, 5.899369716644287e-05, 6.151944398880005e-05, 6.404519081115723e-05, 6.65709376335144e-05, 6.909668445587158e-05, 7.162243127822876e-05, 7.414817810058594e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 15.0, 21.0, 25.0, 47.0, 84.0, 123.0, 244.0, 574.0, 1387.0, 4112.0, 14092.0, 62056.0, 436201.0, 445198.0, 62993.0, 14229.0, 4465.0, 1477.0, 580.0, 237.0, 133.0, 74.0, 52.0, 22.0, 34.0, 13.0, 12.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29977989196777344, -0.2914543151855469, -0.2831287384033203, -0.27480316162109375, -0.2664775848388672, -0.2581520080566406, -0.24982643127441406, -0.2415008544921875, -0.23317527770996094, -0.22484970092773438, -0.2165241241455078, -0.20819854736328125, -0.1998729705810547, -0.19154739379882812, -0.18322181701660156, -0.174896240234375, -0.16657066345214844, -0.15824508666992188, -0.1499195098876953, -0.14159393310546875, -0.1332683563232422, -0.12494277954101562, -0.11661720275878906, -0.1082916259765625, -0.09996604919433594, -0.09164047241210938, -0.08331489562988281, -0.07498931884765625, -0.06666374206542969, -0.058338165283203125, -0.05001258850097656, -0.04168701171875, -0.03336143493652344, -0.025035858154296875, -0.016710281372070312, -0.00838470458984375, -5.91278076171875e-05, 0.008266448974609375, 0.016592025756835938, 0.0249176025390625, 0.03324317932128906, 0.041568756103515625, 0.04989433288574219, 0.05821990966796875, 0.06654548645019531, 0.07487106323242188, 0.08319664001464844, 0.091522216796875, 0.09984779357910156, 0.10817337036132812, 0.11649894714355469, 0.12482452392578125, 0.1331501007080078, 0.14147567749023438, 0.14980125427246094, 0.1581268310546875, 0.16645240783691406, 0.17477798461914062, 0.1831035614013672, 0.19142913818359375, 0.1997547149658203, 0.20808029174804688, 0.21640586853027344, 0.2247314453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 12.0, 5.0, 17.0, 14.0, 24.0, 24.0, 31.0, 43.0, 46.0, 45.0, 76.0, 52.0, 86.0, 71.0, 78.0, 82.0, 55.0, 46.0, 33.0, 23.0, 23.0, 24.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.04524421691894531, -0.043704986572265625, -0.04216575622558594, -0.04062652587890625, -0.03908729553222656, -0.037548065185546875, -0.03600883483886719, -0.0344696044921875, -0.03293037414550781, -0.031391143798828125, -0.029851913452148438, -0.02831268310546875, -0.026773452758789062, -0.025234222412109375, -0.023694992065429688, -0.02215576171875, -0.020616531372070312, -0.019077301025390625, -0.017538070678710938, -0.01599884033203125, -0.014459609985351562, -0.012920379638671875, -0.011381149291992188, -0.0098419189453125, -0.008302688598632812, -0.006763458251953125, -0.0052242279052734375, -0.00368499755859375, -0.0021457672119140625, -0.000606536865234375, 0.0009326934814453125, 0.002471923828125, 0.0040111541748046875, 0.005550384521484375, 0.0070896148681640625, 0.00862884521484375, 0.010168075561523438, 0.011707305908203125, 0.013246536254882812, 0.0147857666015625, 0.016324996948242188, 0.017864227294921875, 0.019403457641601562, 0.02094268798828125, 0.022481918334960938, 0.024021148681640625, 0.025560379028320312, 0.027099609375, 0.028638839721679688, 0.030178070068359375, 0.03171730041503906, 0.03325653076171875, 0.03479576110839844, 0.036334991455078125, 0.03787422180175781, 0.0394134521484375, 0.04095268249511719, 0.042491912841796875, 0.04403114318847656, 0.04557037353515625, 0.04710960388183594, 0.048648834228515625, 0.05018806457519531, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 13.0, 17.0, 32.0, 41.0, 53.0, 58.0, 108.0, 118.0, 142.0, 106.0, 94.0, 62.0, 50.0, 32.0, 25.0, 22.0, 7.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9193627834320068, -1.8680018186569214, -1.8166407346725464, -1.765279769897461, -1.7139188051223755, -1.66255784034729, -1.611196756362915, -1.5598357915878296, -1.5084748268127441, -1.4571138620376587, -1.4057527780532837, -1.3543918132781982, -1.3030308485031128, -1.2516698837280273, -1.2003087997436523, -1.148947834968567, -1.097586750984192, -1.0462257862091064, -0.9948647618293762, -0.943503737449646, -0.8921427726745605, -0.8407817482948303, -0.7894207239151001, -0.7380597591400146, -0.6866987347602844, -0.6353377103805542, -0.5839767456054688, -0.5326157212257385, -0.4812547266483307, -0.42989373207092285, -0.3785327076911926, -0.3271717131137848, -0.27581071853637695, -0.22444972395896912, -0.17308871448040009, -0.12172770500183105, -0.07036671042442322, -0.01900571584701538, 0.032355308532714844, 0.08371630311012268, 0.13507729768753052, 0.18643829226493835, 0.23779930174350739, 0.2891603112220764, 0.34052130579948425, 0.3918823003768921, 0.4432433247566223, 0.49460431933403015, 0.545965313911438, 0.5973263382911682, 0.6486873030662537, 0.7000483274459839, 0.7514092922210693, 0.8027703166007996, 0.8541313409805298, 0.9054923057556152, 0.9568533301353455, 1.0082143545150757, 1.0595753192901611, 1.1109364032745361, 1.1622973680496216, 1.213658332824707, 1.265019416809082, 1.3163803815841675, 1.367741346359253]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 4.0, 10.0, 9.0, 8.0, 19.0, 17.0, 13.0, 23.0, 17.0, 26.0, 44.0, 34.0, 42.0, 48.0, 46.0, 47.0, 46.0, 45.0, 46.0, 45.0, 41.0, 47.0, 40.0, 37.0, 32.0, 30.0, 36.0, 32.0, 17.0, 23.0, 17.0, 10.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8063705563545227, -0.7802299857139587, -0.75408935546875, -0.727948784828186, -0.7018081545829773, -0.6756675839424133, -0.6495269536972046, -0.6233863830566406, -0.5972458124160767, -0.5711052417755127, -0.544964611530304, -0.51882404088974, -0.49268341064453125, -0.4665428400039673, -0.44040223956108093, -0.4142616391181946, -0.38812100887298584, -0.3619804084300995, -0.33583980798721313, -0.30969923734664917, -0.28355860710144043, -0.25741803646087646, -0.2312774360179901, -0.20513683557510376, -0.1789962351322174, -0.15285563468933105, -0.1267150342464447, -0.10057444870471954, -0.07443384826183319, -0.04829324781894684, -0.02215266227722168, 0.003987938165664673, 0.03012847900390625, 0.056269075721502304, 0.08240967243909836, 0.10855026543140411, 0.13469086587429047, 0.16083146631717682, 0.18697205185890198, 0.21311265230178833, 0.23925325274467468, 0.26539385318756104, 0.2915344536304474, 0.31767505407333374, 0.3438156247138977, 0.36995625495910645, 0.3960968255996704, 0.42223742604255676, 0.4483780264854431, 0.47451862692832947, 0.5006592273712158, 0.5267997980117798, 0.5529404282569885, 0.5790809988975525, 0.6052216291427612, 0.6313621997833252, 0.6575027704238892, 0.6836433410644531, 0.7097839713096619, 0.7359245419502258, 0.7620651721954346, 0.7882057428359985, 0.8143463134765625, 0.8404869437217712, 0.86662757396698]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 11.0, 5.0, 15.0, 9.0, 21.0, 20.0, 23.0, 35.0, 52.0, 84.0, 92.0, 169.0, 237.0, 360.0, 611.0, 1092.0, 2245.0, 4899.0, 11218.0, 29642.0, 87474.0, 385766.0, 386464.0, 87394.0, 29306.0, 11454.0, 4805.0, 2203.0, 1085.0, 625.0, 375.0, 221.0, 167.0, 103.0, 81.0, 37.0, 35.0, 25.0, 28.0, 16.0, 10.0, 10.0, 10.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6930694580078125, -0.666412353515625, -0.6397552490234375, -0.61309814453125, -0.5864410400390625, -0.559783935546875, -0.5331268310546875, -0.5064697265625, -0.4798126220703125, -0.453155517578125, -0.4264984130859375, -0.39984130859375, -0.3731842041015625, -0.346527099609375, -0.3198699951171875, -0.293212890625, -0.2665557861328125, -0.239898681640625, -0.2132415771484375, -0.18658447265625, -0.1599273681640625, -0.133270263671875, -0.1066131591796875, -0.0799560546875, -0.0532989501953125, -0.026641845703125, 1.52587890625e-05, 0.02667236328125, 0.0533294677734375, 0.079986572265625, 0.1066436767578125, 0.13330078125, 0.1599578857421875, 0.186614990234375, 0.2132720947265625, 0.23992919921875, 0.2665863037109375, 0.293243408203125, 0.3199005126953125, 0.3465576171875, 0.3732147216796875, 0.399871826171875, 0.4265289306640625, 0.45318603515625, 0.4798431396484375, 0.506500244140625, 0.5331573486328125, 0.559814453125, 0.5864715576171875, 0.613128662109375, 0.6397857666015625, 0.66644287109375, 0.6930999755859375, 0.719757080078125, 0.7464141845703125, 0.7730712890625, 0.7997283935546875, 0.826385498046875, 0.8530426025390625, 0.87969970703125, 0.9063568115234375, 0.933013916015625, 0.9596710205078125, 0.986328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 10.0, 12.0, 16.0, 17.0, 25.0, 17.0, 30.0, 14.0, 34.0, 38.0, 47.0, 55.0, 49.0, 49.0, 42.0, 52.0, 39.0, 46.0, 42.0, 42.0, 32.0, 39.0, 38.0, 41.0, 30.0, 21.0, 21.0, 19.0, 10.0, 14.0, 6.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.538177490234375, -1.48944091796875, -1.440704345703125, -1.3919677734375, -1.343231201171875, -1.29449462890625, -1.245758056640625, -1.197021484375, -1.148284912109375, -1.09954833984375, -1.050811767578125, -1.0020751953125, -0.953338623046875, -0.90460205078125, -0.855865478515625, -0.80712890625, -0.758392333984375, -0.70965576171875, -0.660919189453125, -0.6121826171875, -0.563446044921875, -0.51470947265625, -0.465972900390625, -0.417236328125, -0.368499755859375, -0.31976318359375, -0.271026611328125, -0.2222900390625, -0.173553466796875, -0.12481689453125, -0.076080322265625, -0.02734375, 0.021392822265625, 0.07012939453125, 0.118865966796875, 0.1676025390625, 0.216339111328125, 0.26507568359375, 0.313812255859375, 0.362548828125, 0.411285400390625, 0.46002197265625, 0.508758544921875, 0.5574951171875, 0.606231689453125, 0.65496826171875, 0.703704833984375, 0.75244140625, 0.801177978515625, 0.84991455078125, 0.898651123046875, 0.9473876953125, 0.996124267578125, 1.04486083984375, 1.093597412109375, 1.142333984375, 1.191070556640625, 1.23980712890625, 1.288543701171875, 1.3372802734375, 1.386016845703125, 1.43475341796875, 1.483489990234375, 1.5322265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 3.0, 7.0, 11.0, 19.0, 16.0, 26.0, 27.0, 45.0, 57.0, 100.0, 163.0, 373.0, 885.0, 8394.0, 731791.0, 300175.0, 4954.0, 702.0, 311.0, 147.0, 87.0, 59.0, 42.0, 33.0, 31.0, 25.0, 9.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.96484375, -3.854461669921875, -3.74407958984375, -3.633697509765625, -3.5233154296875, -3.412933349609375, -3.30255126953125, -3.192169189453125, -3.081787109375, -2.971405029296875, -2.86102294921875, -2.750640869140625, -2.6402587890625, -2.529876708984375, -2.41949462890625, -2.309112548828125, -2.19873046875, -2.088348388671875, -1.97796630859375, -1.867584228515625, -1.7572021484375, -1.646820068359375, -1.53643798828125, -1.426055908203125, -1.315673828125, -1.205291748046875, -1.09490966796875, -0.984527587890625, -0.8741455078125, -0.763763427734375, -0.65338134765625, -0.542999267578125, -0.4326171875, -0.322235107421875, -0.21185302734375, -0.101470947265625, 0.0089111328125, 0.119293212890625, 0.22967529296875, 0.340057373046875, 0.450439453125, 0.560821533203125, 0.67120361328125, 0.781585693359375, 0.8919677734375, 1.002349853515625, 1.11273193359375, 1.223114013671875, 1.33349609375, 1.443878173828125, 1.55426025390625, 1.664642333984375, 1.7750244140625, 1.885406494140625, 1.99578857421875, 2.106170654296875, 2.216552734375, 2.326934814453125, 2.43731689453125, 2.547698974609375, 2.6580810546875, 2.768463134765625, 2.87884521484375, 2.989227294921875, 3.099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 10.0, 11.0, 12.0, 7.0, 9.0, 11.0, 16.0, 30.0, 35.0, 34.0, 39.0, 42.0, 36.0, 40.0, 56.0, 51.0, 66.0, 47.0, 46.0, 48.0, 38.0, 49.0, 47.0, 31.0, 34.0, 18.0, 13.0, 23.0, 19.0, 15.0, 10.0, 9.0, 8.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.0183258056640625, -1.956573486328125, -1.8948211669921875, -1.83306884765625, -1.7713165283203125, -1.709564208984375, -1.6478118896484375, -1.5860595703125, -1.5243072509765625, -1.462554931640625, -1.4008026123046875, -1.33905029296875, -1.2772979736328125, -1.215545654296875, -1.1537933349609375, -1.092041015625, -1.0302886962890625, -0.968536376953125, -0.9067840576171875, -0.84503173828125, -0.7832794189453125, -0.721527099609375, -0.6597747802734375, -0.5980224609375, -0.5362701416015625, -0.474517822265625, -0.4127655029296875, -0.35101318359375, -0.2892608642578125, -0.227508544921875, -0.1657562255859375, -0.10400390625, -0.0422515869140625, 0.019500732421875, 0.0812530517578125, 0.14300537109375, 0.2047576904296875, 0.266510009765625, 0.3282623291015625, 0.3900146484375, 0.4517669677734375, 0.513519287109375, 0.5752716064453125, 0.63702392578125, 0.6987762451171875, 0.760528564453125, 0.8222808837890625, 0.884033203125, 0.9457855224609375, 1.007537841796875, 1.0692901611328125, 1.13104248046875, 1.1927947998046875, 1.254547119140625, 1.3162994384765625, 1.3780517578125, 1.4398040771484375, 1.501556396484375, 1.5633087158203125, 1.62506103515625, 1.6868133544921875, 1.748565673828125, 1.8103179931640625, 1.8720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 6.0, 0.0, 5.0, 7.0, 9.0, 18.0, 14.0, 18.0, 29.0, 40.0, 63.0, 74.0, 158.0, 266.0, 486.0, 1154.0, 3570.0, 15344.0, 101234.0, 701830.0, 191129.0, 24916.0, 5225.0, 1532.0, 601.0, 293.0, 134.0, 95.0, 75.0, 49.0, 32.0, 35.0, 34.0, 17.0, 14.0, 9.0, 11.0, 2.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31446075439453125, -0.3034820556640625, -0.29250335693359375, -0.281524658203125, -0.27054595947265625, -0.2595672607421875, -0.24858856201171875, -0.23760986328125, -0.22663116455078125, -0.2156524658203125, -0.20467376708984375, -0.193695068359375, -0.18271636962890625, -0.1717376708984375, -0.16075897216796875, -0.1497802734375, -0.13880157470703125, -0.1278228759765625, -0.11684417724609375, -0.105865478515625, -0.09488677978515625, -0.0839080810546875, -0.07292938232421875, -0.06195068359375, -0.05097198486328125, -0.0399932861328125, -0.02901458740234375, -0.018035888671875, -0.00705718994140625, 0.0039215087890625, 0.01490020751953125, 0.02587890625, 0.03685760498046875, 0.0478363037109375, 0.05881500244140625, 0.069793701171875, 0.08077239990234375, 0.0917510986328125, 0.10272979736328125, 0.11370849609375, 0.12468719482421875, 0.1356658935546875, 0.14664459228515625, 0.157623291015625, 0.16860198974609375, 0.1795806884765625, 0.19055938720703125, 0.2015380859375, 0.21251678466796875, 0.2234954833984375, 0.23447418212890625, 0.245452880859375, 0.25643157958984375, 0.2674102783203125, 0.27838897705078125, 0.28936767578125, 0.30034637451171875, 0.3113250732421875, 0.32230377197265625, 0.333282470703125, 0.34426116943359375, 0.3552398681640625, 0.36621856689453125, 0.377197265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 10.0, 16.0, 15.0, 25.0, 43.0, 49.0, 56.0, 80.0, 106.0, 95.0, 84.0, 67.0, 56.0, 38.0, 40.0, 24.0, 42.0, 29.0, 17.0, 10.0, 16.0, 4.0, 16.0, 8.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0650367736816406e-05, -3.9548613131046295e-05, -3.8446858525276184e-05, -3.734510391950607e-05, -3.624334931373596e-05, -3.514159470796585e-05, -3.403984010219574e-05, -3.293808549642563e-05, -3.183633089065552e-05, -3.0734576284885406e-05, -2.9632821679115295e-05, -2.8531067073345184e-05, -2.7429312467575073e-05, -2.6327557861804962e-05, -2.522580325603485e-05, -2.412404865026474e-05, -2.302229404449463e-05, -2.1920539438724518e-05, -2.0818784832954407e-05, -1.9717030227184296e-05, -1.8615275621414185e-05, -1.7513521015644073e-05, -1.6411766409873962e-05, -1.531001180410385e-05, -1.420825719833374e-05, -1.3106502592563629e-05, -1.2004747986793518e-05, -1.0902993381023407e-05, -9.801238775253296e-06, -8.699484169483185e-06, -7.597729563713074e-06, -6.495974957942963e-06, -5.3942203521728516e-06, -4.2924657464027405e-06, -3.1907111406326294e-06, -2.0889565348625183e-06, -9.872019290924072e-07, 1.1455267667770386e-07, 1.216307282447815e-06, 2.318061888217926e-06, 3.419816493988037e-06, 4.521571099758148e-06, 5.623325705528259e-06, 6.72508031129837e-06, 7.826834917068481e-06, 8.928589522838593e-06, 1.0030344128608704e-05, 1.1132098734378815e-05, 1.2233853340148926e-05, 1.3335607945919037e-05, 1.4437362551689148e-05, 1.553911715745926e-05, 1.664087176322937e-05, 1.774262636899948e-05, 1.8844380974769592e-05, 1.9946135580539703e-05, 2.1047890186309814e-05, 2.2149644792079926e-05, 2.3251399397850037e-05, 2.4353154003620148e-05, 2.545490860939026e-05, 2.655666321516037e-05, 2.765841782093048e-05, 2.8760172426700592e-05, 2.9861927032470703e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 9.0, 10.0, 21.0, 36.0, 61.0, 103.0, 224.0, 648.0, 2417.0, 28924.0, 915568.0, 94508.0, 4550.0, 846.0, 308.0, 144.0, 72.0, 37.0, 22.0, 8.0, 8.0, 5.0, 3.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8984375, -0.8717422485351562, -0.8450469970703125, -0.8183517456054688, -0.791656494140625, -0.7649612426757812, -0.7382659912109375, -0.7115707397460938, -0.68487548828125, -0.6581802368164062, -0.6314849853515625, -0.6047897338867188, -0.578094482421875, -0.5513992309570312, -0.5247039794921875, -0.49800872802734375, -0.4713134765625, -0.44461822509765625, -0.4179229736328125, -0.39122772216796875, -0.364532470703125, -0.33783721923828125, -0.3111419677734375, -0.28444671630859375, -0.25775146484375, -0.23105621337890625, -0.2043609619140625, -0.17766571044921875, -0.150970458984375, -0.12427520751953125, -0.0975799560546875, -0.07088470458984375, -0.044189453125, -0.01749420166015625, 0.0092010498046875, 0.03589630126953125, 0.062591552734375, 0.08928680419921875, 0.1159820556640625, 0.14267730712890625, 0.16937255859375, 0.19606781005859375, 0.2227630615234375, 0.24945831298828125, 0.276153564453125, 0.30284881591796875, 0.3295440673828125, 0.35623931884765625, 0.3829345703125, 0.40962982177734375, 0.4363250732421875, 0.46302032470703125, 0.489715576171875, 0.5164108276367188, 0.5431060791015625, 0.5698013305664062, 0.59649658203125, 0.6231918334960938, 0.6498870849609375, 0.6765823364257812, 0.703277587890625, 0.7299728393554688, 0.7566680908203125, 0.7833633422851562, 0.81005859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 7.0, 18.0, 17.0, 35.0, 65.0, 99.0, 180.0, 274.0, 119.0, 69.0, 40.0, 19.0, 17.0, 12.0, 12.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35791015625, -0.34827423095703125, -0.3386383056640625, -0.32900238037109375, -0.319366455078125, -0.30973052978515625, -0.3000946044921875, -0.29045867919921875, -0.28082275390625, -0.27118682861328125, -0.2615509033203125, -0.25191497802734375, -0.242279052734375, -0.23264312744140625, -0.2230072021484375, -0.21337127685546875, -0.2037353515625, -0.19409942626953125, -0.1844635009765625, -0.17482757568359375, -0.165191650390625, -0.15555572509765625, -0.1459197998046875, -0.13628387451171875, -0.12664794921875, -0.11701202392578125, -0.1073760986328125, -0.09774017333984375, -0.088104248046875, -0.07846832275390625, -0.0688323974609375, -0.05919647216796875, -0.049560546875, -0.03992462158203125, -0.0302886962890625, -0.02065277099609375, -0.011016845703125, -0.00138092041015625, 0.0082550048828125, 0.01789093017578125, 0.02752685546875, 0.03716278076171875, 0.0467987060546875, 0.05643463134765625, 0.066070556640625, 0.07570648193359375, 0.0853424072265625, 0.09497833251953125, 0.1046142578125, 0.11425018310546875, 0.1238861083984375, 0.13352203369140625, 0.143157958984375, 0.15279388427734375, 0.1624298095703125, 0.17206573486328125, 0.18170166015625, 0.19133758544921875, 0.2009735107421875, 0.21060943603515625, 0.220245361328125, 0.22988128662109375, 0.2395172119140625, 0.24915313720703125, 0.2587890625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 18.0, 55.0, 120.0, 208.0, 268.0, 188.0, 102.0, 34.0, 16.0, 5.0], "bins": [-13.263665199279785, -13.036294937133789, -12.808924674987793, -12.581554412841797, -12.3541841506958, -12.126813888549805, -11.899443626403809, -11.672073364257812, -11.444703102111816, -11.21733283996582, -10.989962577819824, -10.762592315673828, -10.535222053527832, -10.307851791381836, -10.08048152923584, -9.853111267089844, -9.625741004943848, -9.398370742797852, -9.171000480651855, -8.94363021850586, -8.716259956359863, -8.488889694213867, -8.261519432067871, -8.034149169921875, -7.806778907775879, -7.579408645629883, -7.352038383483887, -7.124668121337891, -6.8972978591918945, -6.669927597045898, -6.442557334899902, -6.215187072753906, -5.987817287445068, -5.760447025299072, -5.533076763153076, -5.30570650100708, -5.078336238861084, -4.850965976715088, -4.623595714569092, -4.396225452423096, -4.1688551902771, -3.9414849281311035, -3.7141146659851074, -3.4867444038391113, -3.2593741416931152, -3.032003879547119, -2.804633617401123, -2.577263355255127, -2.349893093109131, -2.1225228309631348, -1.8951525688171387, -1.6677823066711426, -1.4404120445251465, -1.2130417823791504, -0.9856715202331543, -0.7583012580871582, -0.5309308767318726, -0.30356061458587646, -0.07619035243988037, 0.15117990970611572, 0.3785501718521118, 0.6059204339981079, 0.833290696144104, 1.0606609582901, 1.2880312204360962]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 9.0, 11.0, 12.0, 13.0, 8.0, 28.0, 27.0, 26.0, 29.0, 42.0, 28.0, 33.0, 29.0, 42.0, 42.0, 45.0, 44.0, 30.0, 41.0, 44.0, 32.0, 50.0, 35.0, 31.0, 41.0, 34.0, 19.0, 24.0, 26.0, 22.0, 16.0, 11.0, 15.0, 11.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.86728572845459, -2.7767083644866943, -2.686131000518799, -2.5955538749694824, -2.504976511001587, -2.4143991470336914, -2.323822021484375, -2.2332446575164795, -2.142667293548584, -2.0520899295806885, -1.9615126848220825, -1.8709354400634766, -1.780358076095581, -1.6897807121276855, -1.5992034673690796, -1.5086262226104736, -1.4180488586425781, -1.3274714946746826, -1.2368942499160767, -1.1463170051574707, -1.0557396411895752, -0.9651623368263245, -0.8745850324630737, -0.784007728099823, -0.6934304237365723, -0.6028531193733215, -0.5122758150100708, -0.42169851064682007, -0.33112120628356934, -0.2405439019203186, -0.14996659755706787, -0.05938929319381714, 0.031188011169433594, 0.12176531553268433, 0.21234261989593506, 0.3029199242591858, 0.3934972286224365, 0.48407453298568726, 0.574651837348938, 0.6652291417121887, 0.7558064460754395, 0.8463837504386902, 0.9369610548019409, 1.0275382995605469, 1.1181156635284424, 1.208693027496338, 1.2992702722549438, 1.3898475170135498, 1.4804248809814453, 1.5710022449493408, 1.6615794897079468, 1.7521567344665527, 1.8427340984344482, 1.9333114624023438, 2.02388858795166, 2.1144659519195557, 2.205043315887451, 2.2956206798553467, 2.386198043823242, 2.4767751693725586, 2.567352533340454, 2.6579298973083496, 2.748507022857666, 2.8390843868255615, 2.929661750793457]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 10.0, 8.0, 12.0, 12.0, 16.0, 13.0, 30.0, 32.0, 48.0, 48.0, 83.0, 103.0, 132.0, 201.0, 300.0, 540.0, 902.0, 2011.0, 4915.0, 15344.0, 71477.0, 659501.0, 2591482.0, 740040.0, 81336.0, 16097.0, 4970.0, 2032.0, 984.0, 508.0, 315.0, 206.0, 151.0, 107.0, 75.0, 49.0, 49.0, 35.0, 14.0, 24.0, 15.0, 7.0, 9.0, 7.0, 13.0, 2.0, 6.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.5595703125, -1.510101318359375, -1.46063232421875, -1.411163330078125, -1.3616943359375, -1.312225341796875, -1.26275634765625, -1.213287353515625, -1.163818359375, -1.114349365234375, -1.06488037109375, -1.015411376953125, -0.9659423828125, -0.916473388671875, -0.86700439453125, -0.817535400390625, -0.76806640625, -0.718597412109375, -0.66912841796875, -0.619659423828125, -0.5701904296875, -0.520721435546875, -0.47125244140625, -0.421783447265625, -0.372314453125, -0.322845458984375, -0.27337646484375, -0.223907470703125, -0.1744384765625, -0.124969482421875, -0.07550048828125, -0.026031494140625, 0.0234375, 0.072906494140625, 0.12237548828125, 0.171844482421875, 0.2213134765625, 0.270782470703125, 0.32025146484375, 0.369720458984375, 0.419189453125, 0.468658447265625, 0.51812744140625, 0.567596435546875, 0.6170654296875, 0.666534423828125, 0.71600341796875, 0.765472412109375, 0.81494140625, 0.864410400390625, 0.91387939453125, 0.963348388671875, 1.0128173828125, 1.062286376953125, 1.11175537109375, 1.161224365234375, 1.210693359375, 1.260162353515625, 1.30963134765625, 1.359100341796875, 1.4085693359375, 1.458038330078125, 1.50750732421875, 1.556976318359375, 1.6064453125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 13.0, 7.0, 7.0, 13.0, 21.0, 25.0, 36.0, 35.0, 33.0, 49.0, 38.0, 57.0, 50.0, 64.0, 53.0, 59.0, 52.0, 51.0, 36.0, 39.0, 45.0, 39.0, 27.0, 24.0, 31.0, 21.0, 19.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0802154541015625, -1.046173095703125, -1.0121307373046875, -0.97808837890625, -0.9440460205078125, -0.910003662109375, -0.8759613037109375, -0.8419189453125, -0.8078765869140625, -0.773834228515625, -0.7397918701171875, -0.70574951171875, -0.6717071533203125, -0.637664794921875, -0.6036224365234375, -0.569580078125, -0.5355377197265625, -0.501495361328125, -0.4674530029296875, -0.43341064453125, -0.3993682861328125, -0.365325927734375, -0.3312835693359375, -0.2972412109375, -0.2631988525390625, -0.229156494140625, -0.1951141357421875, -0.16107177734375, -0.1270294189453125, -0.092987060546875, -0.0589447021484375, -0.02490234375, 0.0091400146484375, 0.043182373046875, 0.0772247314453125, 0.11126708984375, 0.1453094482421875, 0.179351806640625, 0.2133941650390625, 0.2474365234375, 0.2814788818359375, 0.315521240234375, 0.3495635986328125, 0.38360595703125, 0.4176483154296875, 0.451690673828125, 0.4857330322265625, 0.519775390625, 0.5538177490234375, 0.587860107421875, 0.6219024658203125, 0.65594482421875, 0.6899871826171875, 0.724029541015625, 0.7580718994140625, 0.7921142578125, 0.8261566162109375, 0.860198974609375, 0.8942413330078125, 0.92828369140625, 0.9623260498046875, 0.996368408203125, 1.0304107666015625, 1.064453125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 2.0, 9.0, 16.0, 9.0, 28.0, 24.0, 46.0, 82.0, 124.0, 213.0, 443.0, 1183.0, 4600.0, 26871.0, 540900.0, 3507103.0, 98298.0, 10677.0, 2264.0, 694.0, 302.0, 165.0, 73.0, 51.0, 32.0, 25.0, 10.0, 5.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.962890625, -2.871063232421875, -2.77923583984375, -2.687408447265625, -2.5955810546875, -2.503753662109375, -2.41192626953125, -2.320098876953125, -2.228271484375, -2.136444091796875, -2.04461669921875, -1.952789306640625, -1.8609619140625, -1.769134521484375, -1.67730712890625, -1.585479736328125, -1.49365234375, -1.401824951171875, -1.30999755859375, -1.218170166015625, -1.1263427734375, -1.034515380859375, -0.94268798828125, -0.850860595703125, -0.759033203125, -0.667205810546875, -0.57537841796875, -0.483551025390625, -0.3917236328125, -0.299896240234375, -0.20806884765625, -0.116241455078125, -0.0244140625, 0.067413330078125, 0.15924072265625, 0.251068115234375, 0.3428955078125, 0.434722900390625, 0.52655029296875, 0.618377685546875, 0.710205078125, 0.802032470703125, 0.89385986328125, 0.985687255859375, 1.0775146484375, 1.169342041015625, 1.26116943359375, 1.352996826171875, 1.44482421875, 1.536651611328125, 1.62847900390625, 1.720306396484375, 1.8121337890625, 1.903961181640625, 1.99578857421875, 2.087615966796875, 2.179443359375, 2.271270751953125, 2.36309814453125, 2.454925537109375, 2.5467529296875, 2.638580322265625, 2.73040771484375, 2.822235107421875, 2.9140625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 19.0, 22.0, 21.0, 52.0, 64.0, 135.0, 212.0, 433.0, 665.0, 763.0, 634.0, 421.0, 255.0, 142.0, 76.0, 41.0, 27.0, 26.0, 11.0, 7.0, 7.0, 12.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.53814697265625, -0.5142822265625, -0.49041748046875, -0.466552734375, -0.44268798828125, -0.4188232421875, -0.39495849609375, -0.37109375, -0.34722900390625, -0.3233642578125, -0.29949951171875, -0.275634765625, -0.25177001953125, -0.2279052734375, -0.20404052734375, -0.18017578125, -0.15631103515625, -0.1324462890625, -0.10858154296875, -0.084716796875, -0.06085205078125, -0.0369873046875, -0.01312255859375, 0.0107421875, 0.03460693359375, 0.0584716796875, 0.08233642578125, 0.106201171875, 0.13006591796875, 0.1539306640625, 0.17779541015625, 0.20166015625, 0.22552490234375, 0.2493896484375, 0.27325439453125, 0.297119140625, 0.32098388671875, 0.3448486328125, 0.36871337890625, 0.392578125, 0.41644287109375, 0.4403076171875, 0.46417236328125, 0.488037109375, 0.51190185546875, 0.5357666015625, 0.55963134765625, 0.58349609375, 0.60736083984375, 0.6312255859375, 0.65509033203125, 0.678955078125, 0.70281982421875, 0.7266845703125, 0.75054931640625, 0.7744140625, 0.79827880859375, 0.8221435546875, 0.84600830078125, 0.869873046875, 0.89373779296875, 0.9176025390625, 0.94146728515625, 0.96533203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 15.0, 15.0, 24.0, 41.0, 51.0, 66.0, 79.0, 130.0, 108.0, 103.0, 90.0, 82.0, 67.0, 46.0, 29.0, 21.0, 11.0, 9.0, 8.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892338275909424, -2.8175418376922607, -2.7427456378936768, -2.6679491996765137, -2.5931529998779297, -2.5183565616607666, -2.4435603618621826, -2.3687639236450195, -2.2939677238464355, -2.2191712856292725, -2.1443750858306885, -2.0695786476135254, -1.9947824478149414, -1.9199861288070679, -1.8451898097991943, -1.7703933715820312, -1.6955970525741577, -1.6208007335662842, -1.5460044145584106, -1.471208095550537, -1.3964117765426636, -1.32161545753479, -1.246819019317627, -1.172022819519043, -1.0972263813018799, -1.0224300622940063, -0.9476337432861328, -0.8728374242782593, -0.7980411052703857, -0.7232447862625122, -0.6484484076499939, -0.5736520886421204, -0.49885571002960205, -0.4240593910217285, -0.349263072013855, -0.27446672320365906, -0.19967040419578552, -0.12487408518791199, -0.050077736377716064, 0.02471858263015747, 0.099514901638031, 0.17431122064590454, 0.24910755455493927, 0.323903888463974, 0.39870020747184753, 0.47349652647972107, 0.548292875289917, 0.6230891942977905, 0.6978855133056641, 0.7726818323135376, 0.8474781513214111, 0.9222744703292847, 0.9970707893371582, 1.0718671083450317, 1.1466634273529053, 1.2214598655700684, 1.2962560653686523, 1.3710523843765259, 1.4458487033843994, 1.520645022392273, 1.5954413414001465, 1.67023766040802, 1.7450339794158936, 1.8198304176330566, 1.8946267366409302]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 9.0, 11.0, 11.0, 16.0, 12.0, 21.0, 24.0, 18.0, 20.0, 28.0, 42.0, 27.0, 35.0, 34.0, 31.0, 54.0, 37.0, 50.0, 45.0, 41.0, 43.0, 35.0, 45.0, 42.0, 27.0, 21.0, 31.0, 24.0, 14.0, 22.0, 14.0, 10.0, 24.0, 14.0, 8.0, 11.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.1347416639328003, -1.1009100675582886, -1.0670783519744873, -1.0332467555999756, -0.9994151592254639, -0.9655835032463074, -0.9317518472671509, -0.8979202508926392, -0.8640885949134827, -0.8302569389343262, -0.7964253425598145, -0.762593686580658, -0.7287620306015015, -0.6949304342269897, -0.6610987782478333, -0.6272671222686768, -0.593435525894165, -0.5596038699150085, -0.5257722735404968, -0.49194061756134033, -0.4581089913845062, -0.4242773652076721, -0.3904457092285156, -0.3566140830516815, -0.3227824568748474, -0.2889508306980133, -0.2551192045211792, -0.2212875485420227, -0.1874559223651886, -0.1536242961883545, -0.11979265511035919, -0.08596101403236389, -0.052129387855529785, -0.018297754228115082, 0.015533879399299622, 0.049365513026714325, 0.08319714665412903, 0.11702877283096313, 0.15086041390895844, 0.18469205498695374, 0.21852368116378784, 0.25235530734062195, 0.28618693351745605, 0.32001858949661255, 0.35385021567344666, 0.38768184185028076, 0.42151349782943726, 0.45534512400627136, 0.48917675018310547, 0.523008406162262, 0.5568400025367737, 0.5906716585159302, 0.6245032548904419, 0.6583349108695984, 0.6921665668487549, 0.7259981632232666, 0.7598298192024231, 0.7936614751815796, 0.8274930715560913, 0.8613247275352478, 0.8951563835144043, 0.928987979888916, 0.9628196358680725, 0.996651291847229, 1.0304828882217407]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 10.0, 13.0, 14.0, 16.0, 20.0, 42.0, 55.0, 84.0, 111.0, 183.0, 275.0, 419.0, 587.0, 1014.0, 1655.0, 2687.0, 4726.0, 8525.0, 16409.0, 33963.0, 83649.0, 229899.0, 362409.0, 178086.0, 64651.0, 27707.0, 13716.0, 7311.0, 4065.0, 2332.0, 1388.0, 842.0, 588.0, 362.0, 267.0, 149.0, 101.0, 71.0, 34.0, 37.0, 20.0, 22.0, 5.0, 8.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3212890625, -0.3116607666015625, -0.302032470703125, -0.2924041748046875, -0.28277587890625, -0.2731475830078125, -0.263519287109375, -0.2538909912109375, -0.2442626953125, -0.2346343994140625, -0.225006103515625, -0.2153778076171875, -0.20574951171875, -0.1961212158203125, -0.186492919921875, -0.1768646240234375, -0.167236328125, -0.1576080322265625, -0.147979736328125, -0.1383514404296875, -0.12872314453125, -0.1190948486328125, -0.109466552734375, -0.0998382568359375, -0.0902099609375, -0.0805816650390625, -0.070953369140625, -0.0613250732421875, -0.05169677734375, -0.0420684814453125, -0.032440185546875, -0.0228118896484375, -0.01318359375, -0.0035552978515625, 0.006072998046875, 0.0157012939453125, 0.02532958984375, 0.0349578857421875, 0.044586181640625, 0.0542144775390625, 0.0638427734375, 0.0734710693359375, 0.083099365234375, 0.0927276611328125, 0.10235595703125, 0.1119842529296875, 0.121612548828125, 0.1312408447265625, 0.140869140625, 0.1504974365234375, 0.160125732421875, 0.1697540283203125, 0.17938232421875, 0.1890106201171875, 0.198638916015625, 0.2082672119140625, 0.2178955078125, 0.2275238037109375, 0.237152099609375, 0.2467803955078125, 0.25640869140625, 0.2660369873046875, 0.275665283203125, 0.2852935791015625, 0.294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 7.0, 2.0, 6.0, 4.0, 7.0, 14.0, 8.0, 22.0, 23.0, 30.0, 36.0, 27.0, 36.0, 38.0, 28.0, 39.0, 55.0, 52.0, 58.0, 56.0, 48.0, 37.0, 41.0, 42.0, 47.0, 38.0, 26.0, 31.0, 30.0, 17.0, 19.0, 13.0, 12.0, 11.0, 12.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7247772216796875, -0.701507568359375, -0.6782379150390625, -0.65496826171875, -0.6316986083984375, -0.608428955078125, -0.5851593017578125, -0.5618896484375, -0.5386199951171875, -0.515350341796875, -0.4920806884765625, -0.46881103515625, -0.4455413818359375, -0.422271728515625, -0.3990020751953125, -0.375732421875, -0.3524627685546875, -0.329193115234375, -0.3059234619140625, -0.28265380859375, -0.2593841552734375, -0.236114501953125, -0.2128448486328125, -0.1895751953125, -0.1663055419921875, -0.143035888671875, -0.1197662353515625, -0.09649658203125, -0.0732269287109375, -0.049957275390625, -0.0266876220703125, -0.00341796875, 0.0198516845703125, 0.043121337890625, 0.0663909912109375, 0.08966064453125, 0.1129302978515625, 0.136199951171875, 0.1594696044921875, 0.1827392578125, 0.2060089111328125, 0.229278564453125, 0.2525482177734375, 0.27581787109375, 0.2990875244140625, 0.322357177734375, 0.3456268310546875, 0.368896484375, 0.3921661376953125, 0.415435791015625, 0.4387054443359375, 0.46197509765625, 0.4852447509765625, 0.508514404296875, 0.5317840576171875, 0.5550537109375, 0.5783233642578125, 0.601593017578125, 0.6248626708984375, 0.64813232421875, 0.6714019775390625, 0.694671630859375, 0.7179412841796875, 0.7412109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 8.0, 13.0, 16.0, 18.0, 15.0, 24.0, 28.0, 30.0, 55.0, 81.0, 115.0, 190.0, 301.0, 458.0, 830.0, 1516.0, 2913.0, 5629.0, 12816.0, 31555.0, 99860.0, 338205.0, 373093.0, 117224.0, 36215.0, 14118.0, 6308.0, 3043.0, 1670.0, 815.0, 489.0, 270.0, 206.0, 117.0, 80.0, 49.0, 47.0, 38.0, 11.0, 21.0, 15.0, 8.0, 14.0, 8.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.366943359375, -0.356170654296875, -0.34539794921875, -0.334625244140625, -0.3238525390625, -0.313079833984375, -0.30230712890625, -0.291534423828125, -0.28076171875, -0.269989013671875, -0.25921630859375, -0.248443603515625, -0.2376708984375, -0.226898193359375, -0.21612548828125, -0.205352783203125, -0.194580078125, -0.183807373046875, -0.17303466796875, -0.162261962890625, -0.1514892578125, -0.140716552734375, -0.12994384765625, -0.119171142578125, -0.1083984375, -0.097625732421875, -0.08685302734375, -0.076080322265625, -0.0653076171875, -0.054534912109375, -0.04376220703125, -0.032989501953125, -0.022216796875, -0.011444091796875, -0.00067138671875, 0.010101318359375, 0.0208740234375, 0.031646728515625, 0.04241943359375, 0.053192138671875, 0.06396484375, 0.074737548828125, 0.08551025390625, 0.096282958984375, 0.1070556640625, 0.117828369140625, 0.12860107421875, 0.139373779296875, 0.150146484375, 0.160919189453125, 0.17169189453125, 0.182464599609375, 0.1932373046875, 0.204010009765625, 0.21478271484375, 0.225555419921875, 0.236328125, 0.247100830078125, 0.25787353515625, 0.268646240234375, 0.2794189453125, 0.290191650390625, 0.30096435546875, 0.311737060546875, 0.322509765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 3.0, 7.0, 8.0, 11.0, 7.0, 18.0, 12.0, 18.0, 22.0, 20.0, 32.0, 33.0, 46.0, 42.0, 39.0, 50.0, 51.0, 45.0, 42.0, 39.0, 44.0, 42.0, 42.0, 38.0, 30.0, 36.0, 33.0, 31.0, 15.0, 28.0, 18.0, 16.0, 10.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 0.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5712890625, -1.5228118896484375, -1.474334716796875, -1.4258575439453125, -1.37738037109375, -1.3289031982421875, -1.280426025390625, -1.2319488525390625, -1.1834716796875, -1.1349945068359375, -1.086517333984375, -1.0380401611328125, -0.98956298828125, -0.9410858154296875, -0.892608642578125, -0.8441314697265625, -0.795654296875, -0.7471771240234375, -0.698699951171875, -0.6502227783203125, -0.60174560546875, -0.5532684326171875, -0.504791259765625, -0.4563140869140625, -0.4078369140625, -0.3593597412109375, -0.310882568359375, -0.2624053955078125, -0.21392822265625, -0.1654510498046875, -0.116973876953125, -0.0684967041015625, -0.02001953125, 0.0284576416015625, 0.076934814453125, 0.1254119873046875, 0.17388916015625, 0.2223663330078125, 0.270843505859375, 0.3193206787109375, 0.3677978515625, 0.4162750244140625, 0.464752197265625, 0.5132293701171875, 0.56170654296875, 0.6101837158203125, 0.658660888671875, 0.7071380615234375, 0.755615234375, 0.8040924072265625, 0.852569580078125, 0.9010467529296875, 0.94952392578125, 0.9980010986328125, 1.046478271484375, 1.0949554443359375, 1.1434326171875, 1.1919097900390625, 1.240386962890625, 1.2888641357421875, 1.33734130859375, 1.3858184814453125, 1.434295654296875, 1.4827728271484375, 1.53125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 18.0, 14.0, 24.0, 32.0, 47.0, 67.0, 102.0, 141.0, 261.0, 341.0, 539.0, 944.0, 1616.0, 2996.0, 5921.0, 13500.0, 35536.0, 179451.0, 649091.0, 107821.0, 27655.0, 11203.0, 5026.0, 2548.0, 1402.0, 762.0, 487.0, 318.0, 212.0, 142.0, 87.0, 52.0, 47.0, 44.0, 25.0, 17.0, 14.0, 7.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.2660179138183594, -0.25664520263671875, -0.24727249145507812, -0.2378997802734375, -0.22852706909179688, -0.21915435791015625, -0.20978164672851562, -0.200408935546875, -0.19103622436523438, -0.18166351318359375, -0.17229080200195312, -0.1629180908203125, -0.15354537963867188, -0.14417266845703125, -0.13479995727539062, -0.12542724609375, -0.11605453491210938, -0.10668182373046875, -0.09730911254882812, -0.0879364013671875, -0.07856369018554688, -0.06919097900390625, -0.059818267822265625, -0.050445556640625, -0.041072845458984375, -0.03170013427734375, -0.022327423095703125, -0.0129547119140625, -0.003582000732421875, 0.00579071044921875, 0.015163421630859375, 0.0245361328125, 0.033908843994140625, 0.04328155517578125, 0.052654266357421875, 0.0620269775390625, 0.07139968872070312, 0.08077239990234375, 0.09014511108398438, 0.099517822265625, 0.10889053344726562, 0.11826324462890625, 0.12763595581054688, 0.1370086669921875, 0.14638137817382812, 0.15575408935546875, 0.16512680053710938, 0.17449951171875, 0.18387222290039062, 0.19324493408203125, 0.20261764526367188, 0.2119903564453125, 0.22136306762695312, 0.23073577880859375, 0.24010848999023438, 0.249481201171875, 0.2588539123535156, 0.26822662353515625, 0.2775993347167969, 0.2869720458984375, 0.2963447570800781, 0.30571746826171875, 0.3150901794433594, 0.324462890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 6.0, 11.0, 13.0, 8.0, 16.0, 26.0, 60.0, 109.0, 207.0, 198.0, 154.0, 79.0, 36.0, 29.0, 10.0, 8.0, 6.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014638900756835938, -0.00014153867959976196, -0.00013668835163116455, -0.00013183802366256714, -0.00012698769569396973, -0.00012213736772537231, -0.0001172870397567749, -0.00011243671178817749, -0.00010758638381958008, -0.00010273605585098267, -9.788572788238525e-05, -9.303539991378784e-05, -8.818507194519043e-05, -8.333474397659302e-05, -7.84844160079956e-05, -7.36340880393982e-05, -6.878376007080078e-05, -6.393343210220337e-05, -5.908310413360596e-05, -5.4232776165008545e-05, -4.938244819641113e-05, -4.453212022781372e-05, -3.968179225921631e-05, -3.4831464290618896e-05, -2.9981136322021484e-05, -2.5130808353424072e-05, -2.028048038482666e-05, -1.5430152416229248e-05, -1.0579824447631836e-05, -5.729496479034424e-06, -8.791685104370117e-07, 3.9711594581604e-06, 8.821487426757812e-06, 1.3671815395355225e-05, 1.8522143363952637e-05, 2.337247133255005e-05, 2.822279930114746e-05, 3.307312726974487e-05, 3.7923455238342285e-05, 4.27737832069397e-05, 4.762411117553711e-05, 5.247443914413452e-05, 5.7324767112731934e-05, 6.217509508132935e-05, 6.702542304992676e-05, 7.187575101852417e-05, 7.672607898712158e-05, 8.1576406955719e-05, 8.64267349243164e-05, 9.127706289291382e-05, 9.612739086151123e-05, 0.00010097771883010864, 0.00010582804679870605, 0.00011067837476730347, 0.00011552870273590088, 0.00012037903070449829, 0.0001252293586730957, 0.00013007968664169312, 0.00013493001461029053, 0.00013978034257888794, 0.00014463067054748535, 0.00014948099851608276, 0.00015433132648468018, 0.0001591816544532776, 0.000164031982421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 4.0, 11.0, 11.0, 15.0, 35.0, 52.0, 84.0, 153.0, 266.0, 589.0, 1218.0, 2864.0, 7284.0, 21310.0, 107282.0, 737428.0, 132176.0, 23938.0, 7979.0, 3136.0, 1372.0, 628.0, 314.0, 151.0, 84.0, 57.0, 32.0, 19.0, 22.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.55224609375, -0.5379180908203125, -0.523590087890625, -0.5092620849609375, -0.49493408203125, -0.4806060791015625, -0.466278076171875, -0.4519500732421875, -0.4376220703125, -0.4232940673828125, -0.408966064453125, -0.3946380615234375, -0.38031005859375, -0.3659820556640625, -0.351654052734375, -0.3373260498046875, -0.322998046875, -0.3086700439453125, -0.294342041015625, -0.2800140380859375, -0.26568603515625, -0.2513580322265625, -0.237030029296875, -0.2227020263671875, -0.2083740234375, -0.1940460205078125, -0.179718017578125, -0.1653900146484375, -0.15106201171875, -0.1367340087890625, -0.122406005859375, -0.1080780029296875, -0.09375, -0.0794219970703125, -0.065093994140625, -0.0507659912109375, -0.03643798828125, -0.0221099853515625, -0.007781982421875, 0.0065460205078125, 0.0208740234375, 0.0352020263671875, 0.049530029296875, 0.0638580322265625, 0.07818603515625, 0.0925140380859375, 0.106842041015625, 0.1211700439453125, 0.135498046875, 0.1498260498046875, 0.164154052734375, 0.1784820556640625, 0.19281005859375, 0.2071380615234375, 0.221466064453125, 0.2357940673828125, 0.2501220703125, 0.2644500732421875, 0.278778076171875, 0.2931060791015625, 0.30743408203125, 0.3217620849609375, 0.336090087890625, 0.3504180908203125, 0.36474609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 17.0, 12.0, 16.0, 25.0, 37.0, 66.0, 95.0, 132.0, 164.0, 129.0, 99.0, 65.0, 36.0, 24.0, 11.0, 10.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.09227275848388672, -0.08865928649902344, -0.08504581451416016, -0.08143234252929688, -0.0778188705444336, -0.07420539855957031, -0.07059192657470703, -0.06697845458984375, -0.06336498260498047, -0.05975151062011719, -0.056138038635253906, -0.052524566650390625, -0.048911094665527344, -0.04529762268066406, -0.04168415069580078, -0.0380706787109375, -0.03445720672607422, -0.030843734741210938, -0.027230262756347656, -0.023616790771484375, -0.020003318786621094, -0.016389846801757812, -0.012776374816894531, -0.00916290283203125, -0.005549430847167969, -0.0019359588623046875, 0.0016775131225585938, 0.005290985107421875, 0.008904457092285156, 0.012517929077148438, 0.01613140106201172, 0.019744873046875, 0.02335834503173828, 0.026971817016601562, 0.030585289001464844, 0.034198760986328125, 0.037812232971191406, 0.04142570495605469, 0.04503917694091797, 0.04865264892578125, 0.05226612091064453, 0.05587959289550781, 0.059493064880371094, 0.06310653686523438, 0.06672000885009766, 0.07033348083496094, 0.07394695281982422, 0.0775604248046875, 0.08117389678955078, 0.08478736877441406, 0.08840084075927734, 0.09201431274414062, 0.0956277847290039, 0.09924125671386719, 0.10285472869873047, 0.10646820068359375, 0.11008167266845703, 0.11369514465332031, 0.1173086166381836, 0.12092208862304688, 0.12453556060791016, 0.12814903259277344, 0.13176250457763672, 0.1353759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 14.0, 18.0, 31.0, 35.0, 62.0, 84.0, 135.0, 123.0, 131.0, 100.0, 95.0, 57.0, 54.0, 18.0, 25.0, 10.0, 10.0, 5.0, 0.0, 4.0], "bins": [-2.4272518157958984, -2.3806257247924805, -2.3339996337890625, -2.2873733043670654, -2.2407472133636475, -2.1941211223602295, -2.1474950313568115, -2.1008687019348145, -2.0542426109313965, -2.0076165199279785, -1.960990309715271, -1.914364218711853, -1.8677380084991455, -1.8211119174957275, -1.7744858264923096, -1.727859616279602, -1.681233525276184, -1.6346074342727661, -1.5879812240600586, -1.5413551330566406, -1.494728922843933, -1.4481028318405151, -1.4014766216278076, -1.3548505306243896, -1.3082244396209717, -1.2615983486175537, -1.2149721384048462, -1.1683460474014282, -1.1217198371887207, -1.0750937461853027, -1.0284676551818848, -0.9818414449691772, -0.9352153539657593, -0.8885892033576965, -0.8419630527496338, -0.7953369617462158, -0.7487107515335083, -0.7020846605300903, -0.6554585099220276, -0.6088323593139648, -0.5622062087059021, -0.5155800580978394, -0.4689539074897766, -0.42232778668403625, -0.3757016360759735, -0.32907548546791077, -0.2824493646621704, -0.23582321405410767, -0.18919706344604492, -0.14257091283798218, -0.09594477713108063, -0.04931864142417908, -0.002692490816116333, 0.04393365979194641, 0.09055978059768677, 0.1371859312057495, 0.18381208181381226, 0.230438232421875, 0.27706438302993774, 0.3236905038356781, 0.37031665444374084, 0.4169428050518036, 0.46356892585754395, 0.5101950764656067, 0.5568212270736694]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 22.0, 12.0, 19.0, 24.0, 21.0, 26.0, 40.0, 38.0, 24.0, 29.0, 36.0, 27.0, 42.0, 48.0, 42.0, 45.0, 34.0, 57.0, 34.0, 36.0, 33.0, 25.0, 33.0, 33.0, 24.0, 27.0, 17.0, 17.0, 15.0, 13.0, 10.0, 11.0, 8.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.6026099920272827, -0.5838498473167419, -0.5650897026062012, -0.5463295578956604, -0.5275694131851196, -0.5088092088699341, -0.4900490939617157, -0.47128891944885254, -0.45252877473831177, -0.433768630027771, -0.4150084853172302, -0.39624834060668945, -0.3774881660938263, -0.3587280213832855, -0.33996787667274475, -0.3212077021598816, -0.3024475872516632, -0.28368744254112244, -0.26492729783058167, -0.2461671382188797, -0.22740697860717773, -0.20864683389663696, -0.1898866891860962, -0.17112652957439423, -0.15236638486385345, -0.13360624015331268, -0.11484608054161072, -0.09608593583106995, -0.07732578366994858, -0.05856563150882721, -0.03980548679828644, -0.021045327186584473, -0.002285182476043701, 0.016474967822432518, 0.03523511812090874, 0.05399526655673981, 0.07275541871786118, 0.09151557087898254, 0.11027571558952332, 0.12903587520122528, 0.14779601991176605, 0.16655616462230682, 0.1853163242340088, 0.20407646894454956, 0.22283661365509033, 0.2415967732667923, 0.2603569030761719, 0.27911707758903503, 0.2978772222995758, 0.3166373670101166, 0.33539751172065735, 0.3541576862335205, 0.3729178309440613, 0.39167797565460205, 0.4104381203651428, 0.4291982650756836, 0.44795840978622437, 0.46671855449676514, 0.4854786992073059, 0.5042388439178467, 0.5229989886283875, 0.5417591333389282, 0.5605193376541138, 0.5792794823646545, 0.5980396270751953]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 16.0, 28.0, 27.0, 59.0, 76.0, 127.0, 155.0, 293.0, 439.0, 782.0, 1327.0, 2556.0, 5204.0, 10615.0, 22776.0, 56244.0, 194453.0, 467077.0, 187959.0, 54480.0, 22490.0, 10165.0, 5103.0, 2626.0, 1368.0, 804.0, 473.0, 278.0, 166.0, 125.0, 72.0, 52.0, 36.0, 24.0, 16.0, 12.0, 11.0, 4.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.9462890625, -0.9196243286132812, -0.8929595947265625, -0.8662948608398438, -0.839630126953125, -0.8129653930664062, -0.7863006591796875, -0.7596359252929688, -0.73297119140625, -0.7063064575195312, -0.6796417236328125, -0.6529769897460938, -0.626312255859375, -0.5996475219726562, -0.5729827880859375, -0.5463180541992188, -0.5196533203125, -0.49298858642578125, -0.4663238525390625, -0.43965911865234375, -0.412994384765625, -0.38632965087890625, -0.3596649169921875, -0.33300018310546875, -0.30633544921875, -0.27967071533203125, -0.2530059814453125, -0.22634124755859375, -0.199676513671875, -0.17301177978515625, -0.1463470458984375, -0.11968231201171875, -0.093017578125, -0.06635284423828125, -0.0396881103515625, -0.01302337646484375, 0.013641357421875, 0.04030609130859375, 0.0669708251953125, 0.09363555908203125, 0.12030029296875, 0.14696502685546875, 0.1736297607421875, 0.20029449462890625, 0.226959228515625, 0.25362396240234375, 0.2802886962890625, 0.30695343017578125, 0.3336181640625, 0.36028289794921875, 0.3869476318359375, 0.41361236572265625, 0.440277099609375, 0.46694183349609375, 0.4936065673828125, 0.5202713012695312, 0.54693603515625, 0.5736007690429688, 0.6002655029296875, 0.6269302368164062, 0.653594970703125, 0.6802597045898438, 0.7069244384765625, 0.7335891723632812, 0.76025390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 5.0, 10.0, 15.0, 13.0, 20.0, 22.0, 21.0, 20.0, 41.0, 32.0, 31.0, 39.0, 37.0, 42.0, 40.0, 51.0, 53.0, 40.0, 48.0, 37.0, 43.0, 42.0, 40.0, 30.0, 20.0, 30.0, 18.0, 17.0, 25.0, 17.0, 20.0, 14.0, 13.0, 10.0, 4.0, 8.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.1567535400390625, -1.115264892578125, -1.0737762451171875, -1.03228759765625, -0.9907989501953125, -0.949310302734375, -0.9078216552734375, -0.8663330078125, -0.8248443603515625, -0.783355712890625, -0.7418670654296875, -0.70037841796875, -0.6588897705078125, -0.617401123046875, -0.5759124755859375, -0.534423828125, -0.4929351806640625, -0.451446533203125, -0.4099578857421875, -0.36846923828125, -0.3269805908203125, -0.285491943359375, -0.2440032958984375, -0.2025146484375, -0.1610260009765625, -0.119537353515625, -0.0780487060546875, -0.03656005859375, 0.0049285888671875, 0.046417236328125, 0.0879058837890625, 0.12939453125, 0.1708831787109375, 0.212371826171875, 0.2538604736328125, 0.29534912109375, 0.3368377685546875, 0.378326416015625, 0.4198150634765625, 0.4613037109375, 0.5027923583984375, 0.544281005859375, 0.5857696533203125, 0.62725830078125, 0.6687469482421875, 0.710235595703125, 0.7517242431640625, 0.793212890625, 0.8347015380859375, 0.876190185546875, 0.9176788330078125, 0.95916748046875, 1.0006561279296875, 1.042144775390625, 1.0836334228515625, 1.1251220703125, 1.1666107177734375, 1.208099365234375, 1.2495880126953125, 1.29107666015625, 1.3325653076171875, 1.374053955078125, 1.4155426025390625, 1.45703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 13.0, 18.0, 23.0, 29.0, 49.0, 58.0, 76.0, 137.0, 221.0, 522.0, 1397.0, 4422.0, 17380.0, 94864.0, 677484.0, 211006.0, 30230.0, 6990.0, 2006.0, 750.0, 322.0, 165.0, 110.0, 76.0, 48.0, 38.0, 29.0, 19.0, 7.0, 11.0, 14.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7099609375, -1.6620330810546875, -1.614105224609375, -1.5661773681640625, -1.51824951171875, -1.4703216552734375, -1.422393798828125, -1.3744659423828125, -1.3265380859375, -1.2786102294921875, -1.230682373046875, -1.1827545166015625, -1.13482666015625, -1.0868988037109375, -1.038970947265625, -0.9910430908203125, -0.943115234375, -0.8951873779296875, -0.847259521484375, -0.7993316650390625, -0.75140380859375, -0.7034759521484375, -0.655548095703125, -0.6076202392578125, -0.5596923828125, -0.5117645263671875, -0.463836669921875, -0.4159088134765625, -0.36798095703125, -0.3200531005859375, -0.272125244140625, -0.2241973876953125, -0.17626953125, -0.1283416748046875, -0.080413818359375, -0.0324859619140625, 0.01544189453125, 0.0633697509765625, 0.111297607421875, 0.1592254638671875, 0.2071533203125, 0.2550811767578125, 0.303009033203125, 0.3509368896484375, 0.39886474609375, 0.4467926025390625, 0.494720458984375, 0.5426483154296875, 0.590576171875, 0.6385040283203125, 0.686431884765625, 0.7343597412109375, 0.78228759765625, 0.8302154541015625, 0.878143310546875, 0.9260711669921875, 0.9739990234375, 1.0219268798828125, 1.069854736328125, 1.1177825927734375, 1.16571044921875, 1.2136383056640625, 1.261566162109375, 1.3094940185546875, 1.357421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 10.0, 11.0, 13.0, 14.0, 13.0, 16.0, 20.0, 32.0, 32.0, 38.0, 33.0, 47.0, 50.0, 65.0, 58.0, 50.0, 54.0, 59.0, 52.0, 33.0, 53.0, 38.0, 36.0, 29.0, 18.0, 27.0, 20.0, 13.0, 11.0, 10.0, 5.0, 4.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.91796875, -1.865692138671875, -1.81341552734375, -1.761138916015625, -1.7088623046875, -1.656585693359375, -1.60430908203125, -1.552032470703125, -1.499755859375, -1.447479248046875, -1.39520263671875, -1.342926025390625, -1.2906494140625, -1.238372802734375, -1.18609619140625, -1.133819580078125, -1.08154296875, -1.029266357421875, -0.97698974609375, -0.924713134765625, -0.8724365234375, -0.820159912109375, -0.76788330078125, -0.715606689453125, -0.663330078125, -0.611053466796875, -0.55877685546875, -0.506500244140625, -0.4542236328125, -0.401947021484375, -0.34967041015625, -0.297393798828125, -0.2451171875, -0.192840576171875, -0.14056396484375, -0.088287353515625, -0.0360107421875, 0.016265869140625, 0.06854248046875, 0.120819091796875, 0.173095703125, 0.225372314453125, 0.27764892578125, 0.329925537109375, 0.3822021484375, 0.434478759765625, 0.48675537109375, 0.539031982421875, 0.59130859375, 0.643585205078125, 0.69586181640625, 0.748138427734375, 0.8004150390625, 0.852691650390625, 0.90496826171875, 0.957244873046875, 1.009521484375, 1.061798095703125, 1.11407470703125, 1.166351318359375, 1.2186279296875, 1.270904541015625, 1.32318115234375, 1.375457763671875, 1.427734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 7.0, 15.0, 16.0, 27.0, 50.0, 92.0, 160.0, 337.0, 779.0, 2106.0, 7879.0, 54057.0, 653840.0, 296322.0, 25576.0, 4686.0, 1463.0, 541.0, 277.0, 137.0, 70.0, 34.0, 28.0, 15.0, 9.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4185829162597656, -0.40454864501953125, -0.3905143737792969, -0.3764801025390625, -0.3624458312988281, -0.34841156005859375, -0.3343772888183594, -0.320343017578125, -0.3063087463378906, -0.29227447509765625, -0.2782402038574219, -0.2642059326171875, -0.2501716613769531, -0.23613739013671875, -0.22210311889648438, -0.20806884765625, -0.19403457641601562, -0.18000030517578125, -0.16596603393554688, -0.1519317626953125, -0.13789749145507812, -0.12386322021484375, -0.10982894897460938, -0.095794677734375, -0.08176040649414062, -0.06772613525390625, -0.053691864013671875, -0.0396575927734375, -0.025623321533203125, -0.01158905029296875, 0.002445220947265625, 0.0164794921875, 0.030513763427734375, 0.04454803466796875, 0.058582305908203125, 0.0726165771484375, 0.08665084838867188, 0.10068511962890625, 0.11471939086914062, 0.128753662109375, 0.14278793334960938, 0.15682220458984375, 0.17085647583007812, 0.1848907470703125, 0.19892501831054688, 0.21295928955078125, 0.22699356079101562, 0.24102783203125, 0.2550621032714844, 0.26909637451171875, 0.2831306457519531, 0.2971649169921875, 0.3111991882324219, 0.32523345947265625, 0.3392677307128906, 0.353302001953125, 0.3673362731933594, 0.38137054443359375, 0.3954048156738281, 0.4094390869140625, 0.4234733581542969, 0.43750762939453125, 0.4515419006347656, 0.465576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 11.0, 9.0, 6.0, 7.0, 9.0, 13.0, 21.0, 19.0, 34.0, 39.0, 38.0, 53.0, 66.0, 87.0, 81.0, 93.0, 65.0, 48.0, 44.0, 37.0, 44.0, 42.0, 17.0, 15.0, 15.0, 13.0, 11.0, 9.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.254413604736328e-05, -3.145821392536163e-05, -3.0372291803359985e-05, -2.9286369681358337e-05, -2.820044755935669e-05, -2.711452543735504e-05, -2.6028603315353394e-05, -2.4942681193351746e-05, -2.3856759071350098e-05, -2.277083694934845e-05, -2.1684914827346802e-05, -2.0598992705345154e-05, -1.9513070583343506e-05, -1.8427148461341858e-05, -1.734122633934021e-05, -1.6255304217338562e-05, -1.5169382095336914e-05, -1.4083459973335266e-05, -1.2997537851333618e-05, -1.191161572933197e-05, -1.0825693607330322e-05, -9.739771485328674e-06, -8.653849363327026e-06, -7.567927241325378e-06, -6.4820051193237305e-06, -5.3960829973220825e-06, -4.3101608753204346e-06, -3.2242387533187866e-06, -2.1383166313171387e-06, -1.0523945093154907e-06, 3.3527612686157227e-08, 1.1194497346878052e-06, 2.205371856689453e-06, 3.291293978691101e-06, 4.377216100692749e-06, 5.463138222694397e-06, 6.549060344696045e-06, 7.634982466697693e-06, 8.72090458869934e-06, 9.806826710700989e-06, 1.0892748832702637e-05, 1.1978670954704285e-05, 1.3064593076705933e-05, 1.415051519870758e-05, 1.5236437320709229e-05, 1.6322359442710876e-05, 1.7408281564712524e-05, 1.8494203686714172e-05, 1.958012580871582e-05, 2.0666047930717468e-05, 2.1751970052719116e-05, 2.2837892174720764e-05, 2.3923814296722412e-05, 2.500973641872406e-05, 2.6095658540725708e-05, 2.7181580662727356e-05, 2.8267502784729004e-05, 2.9353424906730652e-05, 3.04393470287323e-05, 3.152526915073395e-05, 3.2611191272735596e-05, 3.3697113394737244e-05, 3.478303551673889e-05, 3.586895763874054e-05, 3.695487976074219e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 4.0, 14.0, 10.0, 21.0, 30.0, 33.0, 48.0, 60.0, 88.0, 158.0, 274.0, 486.0, 850.0, 1876.0, 4035.0, 11653.0, 47616.0, 317325.0, 547726.0, 87567.0, 17972.0, 5687.0, 2454.0, 1124.0, 568.0, 324.0, 165.0, 113.0, 63.0, 43.0, 37.0, 26.0, 18.0, 14.0, 17.0, 11.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351318359375, -0.3392753601074219, -0.32723236083984375, -0.3151893615722656, -0.3031463623046875, -0.2911033630371094, -0.27906036376953125, -0.2670173645019531, -0.254974365234375, -0.24293136596679688, -0.23088836669921875, -0.21884536743164062, -0.2068023681640625, -0.19475936889648438, -0.18271636962890625, -0.17067337036132812, -0.15863037109375, -0.14658737182617188, -0.13454437255859375, -0.12250137329101562, -0.1104583740234375, -0.09841537475585938, -0.08637237548828125, -0.07432937622070312, -0.062286376953125, -0.050243377685546875, -0.03820037841796875, -0.026157379150390625, -0.0141143798828125, -0.002071380615234375, 0.00997161865234375, 0.022014617919921875, 0.0340576171875, 0.046100616455078125, 0.05814361572265625, 0.07018661499023438, 0.0822296142578125, 0.09427261352539062, 0.10631561279296875, 0.11835861206054688, 0.130401611328125, 0.14244461059570312, 0.15448760986328125, 0.16653060913085938, 0.1785736083984375, 0.19061660766601562, 0.20265960693359375, 0.21470260620117188, 0.22674560546875, 0.23878860473632812, 0.25083160400390625, 0.2628746032714844, 0.2749176025390625, 0.2869606018066406, 0.29900360107421875, 0.3110466003417969, 0.323089599609375, 0.3351325988769531, 0.34717559814453125, 0.3592185974121094, 0.3712615966796875, 0.3833045959472656, 0.39534759521484375, 0.4073905944824219, 0.41943359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 12.0, 18.0, 18.0, 21.0, 24.0, 49.0, 46.0, 67.0, 68.0, 78.0, 97.0, 89.0, 67.0, 65.0, 49.0, 37.0, 33.0, 30.0, 24.0, 15.0, 13.0, 11.0, 2.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134765625, -0.13036155700683594, -0.12595748901367188, -0.12155342102050781, -0.11714935302734375, -0.11274528503417969, -0.10834121704101562, -0.10393714904785156, -0.0995330810546875, -0.09512901306152344, -0.09072494506835938, -0.08632087707519531, -0.08191680908203125, -0.07751274108886719, -0.07310867309570312, -0.06870460510253906, -0.064300537109375, -0.05989646911621094, -0.055492401123046875, -0.05108833312988281, -0.04668426513671875, -0.04228019714355469, -0.037876129150390625, -0.03347206115722656, -0.0290679931640625, -0.024663925170898438, -0.020259857177734375, -0.015855789184570312, -0.01145172119140625, -0.0070476531982421875, -0.002643585205078125, 0.0017604827880859375, 0.00616455078125, 0.010568618774414062, 0.014972686767578125, 0.019376754760742188, 0.02378082275390625, 0.028184890747070312, 0.032588958740234375, 0.03699302673339844, 0.0413970947265625, 0.04580116271972656, 0.050205230712890625, 0.05460929870605469, 0.05901336669921875, 0.06341743469238281, 0.06782150268554688, 0.07222557067871094, 0.076629638671875, 0.08103370666503906, 0.08543777465820312, 0.08984184265136719, 0.09424591064453125, 0.09864997863769531, 0.10305404663085938, 0.10745811462402344, 0.1118621826171875, 0.11626625061035156, 0.12067031860351562, 0.1250743865966797, 0.12947845458984375, 0.1338825225830078, 0.13828659057617188, 0.14269065856933594, 0.1470947265625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 14.0, 22.0, 49.0, 79.0, 147.0, 159.0, 149.0, 125.0, 105.0, 67.0, 50.0, 12.0, 13.0, 9.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.4617156982421875, -6.337893962860107, -6.214072227478027, -6.090250492095947, -5.966428756713867, -5.842607498168945, -5.718785762786865, -5.594964027404785, -5.471142292022705, -5.347320556640625, -5.223498821258545, -5.099677085876465, -4.975855827331543, -4.852034091949463, -4.728212356567383, -4.604390621185303, -4.480568885803223, -4.356747150421143, -4.2329254150390625, -4.109103679656982, -3.9852821826934814, -3.8614604473114014, -3.7376389503479004, -3.6138172149658203, -3.4899954795837402, -3.36617374420166, -3.24235200881958, -3.118530511856079, -2.994708776473999, -2.870887041091919, -2.747065544128418, -2.623243808746338, -2.499422073364258, -2.3756003379821777, -2.2517786026000977, -2.1279571056365967, -2.0041353702545166, -1.8803136348724365, -1.756492018699646, -1.6326704025268555, -1.508848786354065, -1.3850271701812744, -1.2612054347991943, -1.1373836994171143, -1.0135620832443237, -0.8897404074668884, -0.7659187316894531, -0.6420970559120178, -0.5182753801345825, -0.3944537043571472, -0.2706320285797119, -0.1468103528022766, -0.02298867702484131, 0.100832998752594, 0.2246546745300293, 0.3484763503074646, 0.4722980260848999, 0.5961197018623352, 0.7199413776397705, 0.8437630534172058, 0.9675847291946411, 1.0914063453674316, 1.2152280807495117, 1.3390498161315918, 1.4628714323043823]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 6.0, 12.0, 10.0, 17.0, 18.0, 15.0, 14.0, 27.0, 34.0, 36.0, 37.0, 37.0, 28.0, 50.0, 53.0, 35.0, 41.0, 40.0, 43.0, 54.0, 44.0, 36.0, 36.0, 34.0, 25.0, 36.0, 35.0, 28.0, 25.0, 14.0, 9.0, 11.0, 10.0, 12.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.384341239929199, -2.3093955516815186, -2.234449863433838, -2.1595041751861572, -2.0845584869384766, -2.009612798690796, -1.9346672296524048, -1.8597215414047241, -1.7847758531570435, -1.7098301649093628, -1.6348844766616821, -1.5599387884140015, -1.4849932193756104, -1.4100475311279297, -1.335101842880249, -1.2601561546325684, -1.1852104663848877, -1.110264778137207, -1.0353190898895264, -0.9603734612464905, -0.8854277729988098, -0.8104820847511292, -0.7355364561080933, -0.6605907678604126, -0.5856450796127319, -0.5106993913650513, -0.435753732919693, -0.3608080744743347, -0.28586238622665405, -0.2109166979789734, -0.1359710395336151, -0.061025381088256836, 0.013920307159423828, 0.0888659805059433, 0.16381165385246277, 0.23875732719898224, 0.3137030005455017, 0.3886486887931824, 0.46359434723854065, 0.5385400056838989, 0.6134856939315796, 0.6884313821792603, 0.7633770704269409, 0.8383226990699768, 0.9132683873176575, 0.9882140755653381, 1.063159704208374, 1.1381053924560547, 1.2130510807037354, 1.287996768951416, 1.3629424571990967, 1.4378881454467773, 1.512833833694458, 1.5877795219421387, 1.6627250909805298, 1.7376707792282104, 1.8126164674758911, 1.8875621557235718, 1.9625078439712524, 2.0374534130096436, 2.112399101257324, 2.187344789505005, 2.2622904777526855, 2.337236166000366, 2.412181854248047]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 7.0, 12.0, 5.0, 16.0, 12.0, 8.0, 13.0, 29.0, 42.0, 42.0, 110.0, 208.0, 312.0, 681.0, 1583.0, 4381.0, 14957.0, 92776.0, 1474468.0, 2394435.0, 179532.0, 21512.0, 5528.0, 1955.0, 772.0, 343.0, 223.0, 110.0, 71.0, 36.0, 25.0, 23.0, 11.0, 11.0, 6.0, 5.0, 8.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9716796875, -1.91217041015625, -1.8526611328125, -1.79315185546875, -1.733642578125, -1.67413330078125, -1.6146240234375, -1.55511474609375, -1.49560546875, -1.43609619140625, -1.3765869140625, -1.31707763671875, -1.257568359375, -1.19805908203125, -1.1385498046875, -1.07904052734375, -1.01953125, -0.96002197265625, -0.9005126953125, -0.84100341796875, -0.781494140625, -0.72198486328125, -0.6624755859375, -0.60296630859375, -0.54345703125, -0.48394775390625, -0.4244384765625, -0.36492919921875, -0.305419921875, -0.24591064453125, -0.1864013671875, -0.12689208984375, -0.0673828125, -0.00787353515625, 0.0516357421875, 0.11114501953125, 0.170654296875, 0.23016357421875, 0.2896728515625, 0.34918212890625, 0.40869140625, 0.46820068359375, 0.5277099609375, 0.58721923828125, 0.646728515625, 0.70623779296875, 0.7657470703125, 0.82525634765625, 0.884765625, 0.94427490234375, 1.0037841796875, 1.06329345703125, 1.122802734375, 1.18231201171875, 1.2418212890625, 1.30133056640625, 1.36083984375, 1.42034912109375, 1.4798583984375, 1.53936767578125, 1.598876953125, 1.65838623046875, 1.7178955078125, 1.77740478515625, 1.8369140625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 12.0, 18.0, 25.0, 21.0, 15.0, 22.0, 31.0, 34.0, 45.0, 28.0, 33.0, 35.0, 54.0, 41.0, 45.0, 51.0, 42.0, 41.0, 31.0, 37.0, 35.0, 34.0, 31.0, 33.0, 28.0, 24.0, 22.0, 18.0, 6.0, 17.0, 14.0, 6.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.67724609375, -0.6538925170898438, -0.6305389404296875, -0.6071853637695312, -0.583831787109375, -0.5604782104492188, -0.5371246337890625, -0.5137710571289062, -0.49041748046875, -0.46706390380859375, -0.4437103271484375, -0.42035675048828125, -0.397003173828125, -0.37364959716796875, -0.3502960205078125, -0.32694244384765625, -0.3035888671875, -0.28023529052734375, -0.2568817138671875, -0.23352813720703125, -0.210174560546875, -0.18682098388671875, -0.1634674072265625, -0.14011383056640625, -0.11676025390625, -0.09340667724609375, -0.0700531005859375, -0.04669952392578125, -0.023345947265625, 7.62939453125e-06, 0.0233612060546875, 0.04671478271484375, 0.070068359375, 0.09342193603515625, 0.1167755126953125, 0.14012908935546875, 0.163482666015625, 0.18683624267578125, 0.2101898193359375, 0.23354339599609375, 0.25689697265625, 0.28025054931640625, 0.3036041259765625, 0.32695770263671875, 0.350311279296875, 0.37366485595703125, 0.3970184326171875, 0.42037200927734375, 0.4437255859375, 0.46707916259765625, 0.4904327392578125, 0.5137863159179688, 0.537139892578125, 0.5604934692382812, 0.5838470458984375, 0.6072006225585938, 0.63055419921875, 0.6539077758789062, 0.6772613525390625, 0.7006149291992188, 0.723968505859375, 0.7473220825195312, 0.7706756591796875, 0.7940292358398438, 0.8173828125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 9.0, 9.0, 27.0, 33.0, 66.0, 98.0, 225.0, 486.0, 1391.0, 5160.0, 36699.0, 2241169.0, 1867761.0, 34000.0, 4859.0, 1309.0, 440.0, 205.0, 111.0, 70.0, 43.0, 22.0, 21.0, 12.0, 10.0, 4.0, 9.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.49609375, -3.39892578125, -3.3017578125, -3.20458984375, -3.107421875, -3.01025390625, -2.9130859375, -2.81591796875, -2.71875, -2.62158203125, -2.5244140625, -2.42724609375, -2.330078125, -2.23291015625, -2.1357421875, -2.03857421875, -1.94140625, -1.84423828125, -1.7470703125, -1.64990234375, -1.552734375, -1.45556640625, -1.3583984375, -1.26123046875, -1.1640625, -1.06689453125, -0.9697265625, -0.87255859375, -0.775390625, -0.67822265625, -0.5810546875, -0.48388671875, -0.38671875, -0.28955078125, -0.1923828125, -0.09521484375, 0.001953125, 0.09912109375, 0.1962890625, 0.29345703125, 0.390625, 0.48779296875, 0.5849609375, 0.68212890625, 0.779296875, 0.87646484375, 0.9736328125, 1.07080078125, 1.16796875, 1.26513671875, 1.3623046875, 1.45947265625, 1.556640625, 1.65380859375, 1.7509765625, 1.84814453125, 1.9453125, 2.04248046875, 2.1396484375, 2.23681640625, 2.333984375, 2.43115234375, 2.5283203125, 2.62548828125, 2.72265625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 11.0, 10.0, 16.0, 20.0, 25.0, 52.0, 57.0, 109.0, 232.0, 377.0, 649.0, 775.0, 690.0, 464.0, 263.0, 123.0, 84.0, 31.0, 21.0, 17.0, 15.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.62353515625, -0.60009765625, -0.57666015625, -0.55322265625, -0.52978515625, -0.50634765625, -0.48291015625, -0.45947265625, -0.43603515625, -0.41259765625, -0.38916015625, -0.36572265625, -0.34228515625, -0.31884765625, -0.29541015625, -0.27197265625, -0.24853515625, -0.22509765625, -0.20166015625, -0.17822265625, -0.15478515625, -0.13134765625, -0.10791015625, -0.08447265625, -0.06103515625, -0.03759765625, -0.01416015625, 0.00927734375, 0.03271484375, 0.05615234375, 0.07958984375, 0.10302734375, 0.12646484375, 0.14990234375, 0.17333984375, 0.19677734375, 0.22021484375, 0.24365234375, 0.26708984375, 0.29052734375, 0.31396484375, 0.33740234375, 0.36083984375, 0.38427734375, 0.40771484375, 0.43115234375, 0.45458984375, 0.47802734375, 0.50146484375, 0.52490234375, 0.54833984375, 0.57177734375, 0.59521484375, 0.61865234375, 0.64208984375, 0.66552734375, 0.68896484375, 0.71240234375, 0.73583984375, 0.75927734375, 0.78271484375, 0.80615234375, 0.82958984375, 0.85302734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 9.0, 7.0, 11.0, 16.0, 12.0, 11.0, 16.0, 22.0, 25.0, 31.0, 33.0, 41.0, 50.0, 40.0, 49.0, 60.0, 51.0, 65.0, 53.0, 58.0, 45.0, 52.0, 35.0, 42.0, 32.0, 24.0, 20.0, 16.0, 15.0, 11.0, 10.0, 7.0, 10.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9333469271659851, -0.8966100811958313, -0.8598732352256775, -0.8231363892555237, -0.7863996028900146, -0.7496627569198608, -0.712925910949707, -0.6761890649795532, -0.6394522190093994, -0.6027153730392456, -0.5659785270690918, -0.529241681098938, -0.49250486493110657, -0.45576801896095276, -0.41903120279312134, -0.38229435682296753, -0.3455575108528137, -0.3088206648826599, -0.2720838189125061, -0.23534700274467468, -0.19861015677452087, -0.16187331080436707, -0.12513647973537445, -0.08839964866638184, -0.05166280269622803, -0.014925964176654816, 0.021810874342918396, 0.05854771286249161, 0.09528455138206482, 0.13202139735221863, 0.16875822842121124, 0.20549505949020386, 0.24223196506500244, 0.27896881103515625, 0.31570565700531006, 0.3524424731731415, 0.3891793191432953, 0.4259161651134491, 0.4626529812812805, 0.4993898272514343, 0.5361266732215881, 0.5728635191917419, 0.6096003651618958, 0.6463372111320496, 0.6830739974975586, 0.7198108434677124, 0.7565476894378662, 0.79328453540802, 0.8300213813781738, 0.8667582273483276, 0.9034950733184814, 0.9402319192886353, 0.9769687652587891, 1.0137056112289429, 1.0504424571990967, 1.087179183959961, 1.1239161491394043, 1.160652995109558, 1.197389841079712, 1.2341266870498657, 1.2708635330200195, 1.3076003789901733, 1.3443372249603271, 1.3810739517211914, 1.4178107976913452]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 13.0, 15.0, 17.0, 12.0, 17.0, 19.0, 22.0, 21.0, 23.0, 29.0, 32.0, 32.0, 37.0, 29.0, 42.0, 40.0, 43.0, 40.0, 41.0, 42.0, 37.0, 40.0, 34.0, 36.0, 34.0, 15.0, 13.0, 24.0, 31.0, 20.0, 29.0, 18.0, 14.0, 16.0, 9.0, 4.0, 10.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7717025876045227, -0.7422186732292175, -0.7127347588539124, -0.6832508444786072, -0.653766930103302, -0.6242830157279968, -0.5947991013526917, -0.5653151869773865, -0.5358312726020813, -0.5063473582267761, -0.47686344385147095, -0.44737952947616577, -0.4178956151008606, -0.3884117007255554, -0.35892778635025024, -0.32944387197494507, -0.2999599575996399, -0.2704760432243347, -0.24099212884902954, -0.21150821447372437, -0.1820243000984192, -0.152540385723114, -0.12305647134780884, -0.09357255697250366, -0.06408864259719849, -0.03460472822189331, -0.005120813846588135, 0.02436310052871704, 0.05384701490402222, 0.08333092927932739, 0.11281484365463257, 0.14229875802993774, 0.17178261280059814, 0.20126652717590332, 0.2307504415512085, 0.26023435592651367, 0.28971827030181885, 0.319202184677124, 0.3486860990524292, 0.3781700134277344, 0.40765392780303955, 0.4371378421783447, 0.4666217565536499, 0.4961056709289551, 0.5255895853042603, 0.5550734996795654, 0.5845574140548706, 0.6140413284301758, 0.643525242805481, 0.6730091571807861, 0.7024930715560913, 0.7319769859313965, 0.7614609003067017, 0.7909448146820068, 0.820428729057312, 0.8499126434326172, 0.8793965578079224, 0.9088804721832275, 0.9383643865585327, 0.9678483009338379, 0.9973322153091431, 1.0268161296844482, 1.0563000440597534, 1.0857839584350586, 1.1152678728103638]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 7.0, 14.0, 22.0, 29.0, 32.0, 37.0, 75.0, 97.0, 125.0, 202.0, 301.0, 494.0, 825.0, 1404.0, 2579.0, 5181.0, 13233.0, 67092.0, 477245.0, 404381.0, 52883.0, 11715.0, 4766.0, 2318.0, 1339.0, 737.0, 493.0, 306.0, 166.0, 113.0, 103.0, 67.0, 51.0, 42.0, 21.0, 18.0, 6.0, 5.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4017295837402344, -0.38915252685546875, -0.3765754699707031, -0.3639984130859375, -0.3514213562011719, -0.33884429931640625, -0.3262672424316406, -0.313690185546875, -0.3011131286621094, -0.28853607177734375, -0.2759590148925781, -0.2633819580078125, -0.2508049011230469, -0.23822784423828125, -0.22565078735351562, -0.21307373046875, -0.20049667358398438, -0.18791961669921875, -0.17534255981445312, -0.1627655029296875, -0.15018844604492188, -0.13761138916015625, -0.12503433227539062, -0.112457275390625, -0.09988021850585938, -0.08730316162109375, -0.07472610473632812, -0.0621490478515625, -0.049571990966796875, -0.03699493408203125, -0.024417877197265625, -0.0118408203125, 0.000736236572265625, 0.01331329345703125, 0.025890350341796875, 0.0384674072265625, 0.051044464111328125, 0.06362152099609375, 0.07619857788085938, 0.088775634765625, 0.10135269165039062, 0.11392974853515625, 0.12650680541992188, 0.1390838623046875, 0.15166091918945312, 0.16423797607421875, 0.17681503295898438, 0.18939208984375, 0.20196914672851562, 0.21454620361328125, 0.22712326049804688, 0.2397003173828125, 0.2522773742675781, 0.26485443115234375, 0.2774314880371094, 0.290008544921875, 0.3025856018066406, 0.31516265869140625, 0.3277397155761719, 0.3403167724609375, 0.3528938293457031, 0.36547088623046875, 0.3780479431152344, 0.390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 11.0, 16.0, 20.0, 28.0, 15.0, 28.0, 29.0, 32.0, 42.0, 37.0, 34.0, 41.0, 45.0, 48.0, 41.0, 41.0, 46.0, 54.0, 31.0, 32.0, 34.0, 33.0, 27.0, 32.0, 36.0, 23.0, 15.0, 22.0, 13.0, 11.0, 16.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62451171875, -0.604278564453125, -0.58404541015625, -0.563812255859375, -0.5435791015625, -0.523345947265625, -0.50311279296875, -0.482879638671875, -0.462646484375, -0.442413330078125, -0.42218017578125, -0.401947021484375, -0.3817138671875, -0.361480712890625, -0.34124755859375, -0.321014404296875, -0.30078125, -0.280548095703125, -0.26031494140625, -0.240081787109375, -0.2198486328125, -0.199615478515625, -0.17938232421875, -0.159149169921875, -0.138916015625, -0.118682861328125, -0.09844970703125, -0.078216552734375, -0.0579833984375, -0.037750244140625, -0.01751708984375, 0.002716064453125, 0.02294921875, 0.043182373046875, 0.06341552734375, 0.083648681640625, 0.1038818359375, 0.124114990234375, 0.14434814453125, 0.164581298828125, 0.184814453125, 0.205047607421875, 0.22528076171875, 0.245513916015625, 0.2657470703125, 0.285980224609375, 0.30621337890625, 0.326446533203125, 0.3466796875, 0.366912841796875, 0.38714599609375, 0.407379150390625, 0.4276123046875, 0.447845458984375, 0.46807861328125, 0.488311767578125, 0.508544921875, 0.528778076171875, 0.54901123046875, 0.569244384765625, 0.5894775390625, 0.609710693359375, 0.62994384765625, 0.650177001953125, 0.67041015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 19.0, 21.0, 30.0, 31.0, 49.0, 115.0, 151.0, 270.0, 481.0, 855.0, 1974.0, 5017.0, 23868.0, 431892.0, 542732.0, 30760.0, 5961.0, 2134.0, 965.0, 477.0, 255.0, 154.0, 105.0, 69.0, 48.0, 36.0, 16.0, 26.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6836967468261719, -0.6652450561523438, -0.6467933654785156, -0.6283416748046875, -0.6098899841308594, -0.5914382934570312, -0.5729866027832031, -0.554534912109375, -0.5360832214355469, -0.5176315307617188, -0.4991798400878906, -0.4807281494140625, -0.4622764587402344, -0.44382476806640625, -0.4253730773925781, -0.40692138671875, -0.3884696960449219, -0.37001800537109375, -0.3515663146972656, -0.3331146240234375, -0.3146629333496094, -0.29621124267578125, -0.2777595520019531, -0.259307861328125, -0.24085617065429688, -0.22240447998046875, -0.20395278930664062, -0.1855010986328125, -0.16704940795898438, -0.14859771728515625, -0.13014602661132812, -0.1116943359375, -0.09324264526367188, -0.07479095458984375, -0.056339263916015625, -0.0378875732421875, -0.019435882568359375, -0.00098419189453125, 0.017467498779296875, 0.035919189453125, 0.054370880126953125, 0.07282257080078125, 0.09127426147460938, 0.1097259521484375, 0.12817764282226562, 0.14662933349609375, 0.16508102416992188, 0.18353271484375, 0.20198440551757812, 0.22043609619140625, 0.23888778686523438, 0.2573394775390625, 0.2757911682128906, 0.29424285888671875, 0.3126945495605469, 0.331146240234375, 0.3495979309082031, 0.36804962158203125, 0.3865013122558594, 0.4049530029296875, 0.4234046936035156, 0.44185638427734375, 0.4603080749511719, 0.478759765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 23.0, 10.0, 13.0, 23.0, 23.0, 21.0, 30.0, 19.0, 24.0, 39.0, 42.0, 46.0, 50.0, 46.0, 55.0, 45.0, 31.0, 56.0, 42.0, 48.0, 33.0, 33.0, 23.0, 30.0, 25.0, 27.0, 25.0, 15.0, 11.0, 12.0, 11.0, 8.0, 9.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.9002532958984375, -1.845428466796875, -1.7906036376953125, -1.73577880859375, -1.6809539794921875, -1.626129150390625, -1.5713043212890625, -1.5164794921875, -1.4616546630859375, -1.406829833984375, -1.3520050048828125, -1.29718017578125, -1.2423553466796875, -1.187530517578125, -1.1327056884765625, -1.077880859375, -1.0230560302734375, -0.968231201171875, -0.9134063720703125, -0.85858154296875, -0.8037567138671875, -0.748931884765625, -0.6941070556640625, -0.6392822265625, -0.5844573974609375, -0.529632568359375, -0.4748077392578125, -0.41998291015625, -0.3651580810546875, -0.310333251953125, -0.2555084228515625, -0.20068359375, -0.1458587646484375, -0.091033935546875, -0.0362091064453125, 0.01861572265625, 0.0734405517578125, 0.128265380859375, 0.1830902099609375, 0.2379150390625, 0.2927398681640625, 0.347564697265625, 0.4023895263671875, 0.45721435546875, 0.5120391845703125, 0.566864013671875, 0.6216888427734375, 0.676513671875, 0.7313385009765625, 0.786163330078125, 0.8409881591796875, 0.89581298828125, 0.9506378173828125, 1.005462646484375, 1.0602874755859375, 1.1151123046875, 1.1699371337890625, 1.224761962890625, 1.2795867919921875, 1.33441162109375, 1.3892364501953125, 1.444061279296875, 1.4988861083984375, 1.5537109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 7.0, 12.0, 20.0, 16.0, 31.0, 55.0, 87.0, 111.0, 166.0, 232.0, 404.0, 690.0, 1309.0, 2353.0, 4997.0, 11820.0, 43870.0, 322179.0, 544866.0, 84250.0, 17594.0, 6592.0, 3000.0, 1592.0, 860.0, 528.0, 302.0, 204.0, 122.0, 93.0, 53.0, 35.0, 19.0, 20.0, 9.0, 10.0, 7.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1971435546875, -0.1906108856201172, -0.18407821655273438, -0.17754554748535156, -0.17101287841796875, -0.16448020935058594, -0.15794754028320312, -0.1514148712158203, -0.1448822021484375, -0.1383495330810547, -0.13181686401367188, -0.12528419494628906, -0.11875152587890625, -0.11221885681152344, -0.10568618774414062, -0.09915351867675781, -0.092620849609375, -0.08608818054199219, -0.07955551147460938, -0.07302284240722656, -0.06649017333984375, -0.05995750427246094, -0.053424835205078125, -0.04689216613769531, -0.0403594970703125, -0.03382682800292969, -0.027294158935546875, -0.020761489868164062, -0.01422882080078125, -0.0076961517333984375, -0.001163482666015625, 0.0053691864013671875, 0.01190185546875, 0.018434524536132812, 0.024967193603515625, 0.03149986267089844, 0.03803253173828125, 0.04456520080566406, 0.051097869873046875, 0.05763053894042969, 0.0641632080078125, 0.07069587707519531, 0.07722854614257812, 0.08376121520996094, 0.09029388427734375, 0.09682655334472656, 0.10335922241210938, 0.10989189147949219, 0.116424560546875, 0.12295722961425781, 0.12948989868164062, 0.13602256774902344, 0.14255523681640625, 0.14908790588378906, 0.15562057495117188, 0.1621532440185547, 0.1686859130859375, 0.1752185821533203, 0.18175125122070312, 0.18828392028808594, 0.19481658935546875, 0.20134925842285156, 0.20788192749023438, 0.2144145965576172, 0.220947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 10.0, 10.0, 33.0, 75.0, 204.0, 327.0, 178.0, 100.0, 32.0, 16.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002651214599609375, -0.0002587251365184784, -0.0002523288130760193, -0.0002459324896335602, -0.00023953616619110107, -0.00023313984274864197, -0.00022674351930618286, -0.00022034719586372375, -0.00021395087242126465, -0.00020755454897880554, -0.00020115822553634644, -0.00019476190209388733, -0.00018836557865142822, -0.00018196925520896912, -0.00017557293176651, -0.0001691766083240509, -0.0001627802848815918, -0.0001563839614391327, -0.00014998763799667358, -0.00014359131455421448, -0.00013719499111175537, -0.00013079866766929626, -0.00012440234422683716, -0.00011800602078437805, -0.00011160969734191895, -0.00010521337389945984, -9.881705045700073e-05, -9.242072701454163e-05, -8.602440357208252e-05, -7.962808012962341e-05, -7.32317566871643e-05, -6.68354332447052e-05, -6.0439109802246094e-05, -5.404278635978699e-05, -4.764646291732788e-05, -4.1250139474868774e-05, -3.485381603240967e-05, -2.845749258995056e-05, -2.2061169147491455e-05, -1.566484570503235e-05, -9.268522262573242e-06, -2.8721988201141357e-06, 3.5241246223449707e-06, 9.920448064804077e-06, 1.6316771507263184e-05, 2.271309494972229e-05, 2.9109418392181396e-05, 3.55057418346405e-05, 4.190206527709961e-05, 4.8298388719558716e-05, 5.469471216201782e-05, 6.109103560447693e-05, 6.748735904693604e-05, 7.388368248939514e-05, 8.028000593185425e-05, 8.667632937431335e-05, 9.307265281677246e-05, 9.946897625923157e-05, 0.00010586529970169067, 0.00011226162314414978, 0.00011865794658660889, 0.000125054270029068, 0.0001314505934715271, 0.0001378469169139862, 0.0001442432403564453]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 8.0, 22.0, 20.0, 50.0, 63.0, 97.0, 169.0, 268.0, 422.0, 637.0, 1029.0, 1621.0, 2652.0, 4441.0, 8081.0, 17270.0, 46584.0, 158922.0, 392091.0, 276361.0, 83983.0, 27004.0, 11276.0, 5968.0, 3505.0, 2133.0, 1399.0, 866.0, 541.0, 336.0, 268.0, 154.0, 109.0, 71.0, 36.0, 35.0, 12.0, 13.0, 13.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.136474609375, -0.13254642486572266, -0.1286182403564453, -0.12469005584716797, -0.12076187133789062, -0.11683368682861328, -0.11290550231933594, -0.1089773178100586, -0.10504913330078125, -0.1011209487915039, -0.09719276428222656, -0.09326457977294922, -0.08933639526367188, -0.08540821075439453, -0.08148002624511719, -0.07755184173583984, -0.0736236572265625, -0.06969547271728516, -0.06576728820800781, -0.06183910369873047, -0.057910919189453125, -0.05398273468017578, -0.05005455017089844, -0.046126365661621094, -0.04219818115234375, -0.038269996643066406, -0.03434181213378906, -0.03041362762451172, -0.026485443115234375, -0.02255725860595703, -0.018629074096679688, -0.014700889587402344, -0.010772705078125, -0.006844520568847656, -0.0029163360595703125, 0.0010118484497070312, 0.004940032958984375, 0.008868217468261719, 0.012796401977539062, 0.016724586486816406, 0.02065277099609375, 0.024580955505371094, 0.028509140014648438, 0.03243732452392578, 0.036365509033203125, 0.04029369354248047, 0.04422187805175781, 0.048150062561035156, 0.0520782470703125, 0.056006431579589844, 0.05993461608886719, 0.06386280059814453, 0.06779098510742188, 0.07171916961669922, 0.07564735412597656, 0.0795755386352539, 0.08350372314453125, 0.0874319076538086, 0.09136009216308594, 0.09528827667236328, 0.09921646118164062, 0.10314464569091797, 0.10707283020019531, 0.11100101470947266, 0.11492919921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 9.0, 8.0, 14.0, 13.0, 22.0, 38.0, 59.0, 74.0, 84.0, 88.0, 99.0, 112.0, 92.0, 65.0, 62.0, 37.0, 31.0, 16.0, 13.0, 15.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048187255859375, -0.04643869400024414, -0.04469013214111328, -0.04294157028198242, -0.04119300842285156, -0.0394444465637207, -0.037695884704589844, -0.035947322845458984, -0.034198760986328125, -0.032450199127197266, -0.030701637268066406, -0.028953075408935547, -0.027204513549804688, -0.025455951690673828, -0.02370738983154297, -0.02195882797241211, -0.02021026611328125, -0.01846170425415039, -0.01671314239501953, -0.014964580535888672, -0.013216018676757812, -0.011467456817626953, -0.009718894958496094, -0.007970333099365234, -0.006221771240234375, -0.004473209381103516, -0.0027246475219726562, -0.0009760856628417969, 0.0007724761962890625, 0.002521038055419922, 0.004269599914550781, 0.006018161773681641, 0.0077667236328125, 0.00951528549194336, 0.011263847351074219, 0.013012409210205078, 0.014760971069335938, 0.016509532928466797, 0.018258094787597656, 0.020006656646728516, 0.021755218505859375, 0.023503780364990234, 0.025252342224121094, 0.027000904083251953, 0.028749465942382812, 0.030498027801513672, 0.03224658966064453, 0.03399515151977539, 0.03574371337890625, 0.03749227523803711, 0.03924083709716797, 0.04098939895629883, 0.04273796081542969, 0.04448652267456055, 0.046235084533691406, 0.047983646392822266, 0.049732208251953125, 0.051480770111083984, 0.053229331970214844, 0.0549778938293457, 0.05672645568847656, 0.05847501754760742, 0.06022357940673828, 0.06197214126586914, 0.063720703125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 9.0, 10.0, 3.0, 16.0, 9.0, 16.0, 20.0, 8.0, 24.0, 23.0, 33.0, 56.0, 32.0, 40.0, 38.0, 42.0, 55.0, 54.0, 47.0, 52.0, 67.0, 57.0, 31.0, 31.0, 43.0, 30.0, 30.0, 27.0, 24.0, 14.0, 11.0, 7.0, 9.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5443191528320312, -0.5244734287261963, -0.5046277046203613, -0.48478201031684875, -0.4649362862110138, -0.4450905919075012, -0.42524486780166626, -0.4053991436958313, -0.38555341958999634, -0.3657076954841614, -0.3458620011806488, -0.32601627707481384, -0.3061705529689789, -0.2863248586654663, -0.26647913455963135, -0.2466334104537964, -0.2267877161502838, -0.20694200694561005, -0.18709628283977509, -0.16725057363510132, -0.14740484952926636, -0.1275591403245926, -0.10771343111991882, -0.08786770701408386, -0.0680219978094101, -0.04817628115415573, -0.028330568224191666, -0.0084848552942276, 0.011360861361026764, 0.031206578016281128, 0.051052287220954895, 0.07089801132678986, 0.09074372053146362, 0.11058943718671799, 0.13043515384197235, 0.15028086304664612, 0.17012658715248108, 0.18997229635715485, 0.2098180055618286, 0.22966372966766357, 0.24950943887233734, 0.2693551480770111, 0.28920087218284607, 0.30904656648635864, 0.3288922905921936, 0.34873801469802856, 0.3685837388038635, 0.3884294629096985, 0.40827515721321106, 0.428120881319046, 0.4479665756225586, 0.46781229972839355, 0.4876580238342285, 0.5075037479400635, 0.5273494720458984, 0.5471951961517334, 0.5670408606529236, 0.5868865847587585, 0.6067323088645935, 0.6265779733657837, 0.6464236974716187, 0.6662694215774536, 0.6861151456832886, 0.7059608697891235, 0.7258065938949585]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 5.0, 10.0, 8.0, 16.0, 4.0, 14.0, 11.0, 17.0, 24.0, 31.0, 19.0, 27.0, 24.0, 36.0, 26.0, 41.0, 41.0, 44.0, 35.0, 28.0, 50.0, 38.0, 46.0, 39.0, 44.0, 27.0, 38.0, 25.0, 17.0, 24.0, 22.0, 23.0, 20.0, 28.0, 18.0, 12.0, 12.0, 11.0, 8.0, 9.0, 2.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5060173273086548, -0.48837611079216003, -0.4707348942756653, -0.45309364795684814, -0.4354524314403534, -0.41781121492385864, -0.4001699686050415, -0.38252875208854675, -0.364887535572052, -0.34724631905555725, -0.3296051025390625, -0.31196385622024536, -0.2943226397037506, -0.27668142318725586, -0.2590401768684387, -0.24139896035194397, -0.22375774383544922, -0.20611652731895447, -0.18847529590129852, -0.17083406448364258, -0.15319284796714783, -0.13555163145065308, -0.11791040003299713, -0.10026917606592178, -0.08262795209884644, -0.06498672813177109, -0.04734550416469574, -0.029704280197620392, -0.012063056230545044, 0.005578167736530304, 0.023219391703605652, 0.040860615670681, 0.05850178003311157, 0.07614300400018692, 0.09378422796726227, 0.11142545193433762, 0.12906667590141296, 0.14670789241790771, 0.16434912383556366, 0.1819903552532196, 0.19963157176971436, 0.2172727882862091, 0.23491401970386505, 0.252555251121521, 0.27019646763801575, 0.2878376841545105, 0.30547893047332764, 0.3231201469898224, 0.34076136350631714, 0.3584025800228119, 0.37604379653930664, 0.3936850428581238, 0.41132625937461853, 0.4289674758911133, 0.4466087222099304, 0.46424993872642517, 0.4818911552429199, 0.4995323717594147, 0.5171735882759094, 0.5348148345947266, 0.5524560213088989, 0.5700972676277161, 0.5877385139465332, 0.6053797006607056, 0.6230209469795227]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 10.0, 21.0, 21.0, 21.0, 49.0, 64.0, 105.0, 114.0, 165.0, 265.0, 408.0, 686.0, 1126.0, 2045.0, 3581.0, 6429.0, 11831.0, 22300.0, 43841.0, 101899.0, 263866.0, 330599.0, 141017.0, 57318.0, 27740.0, 14721.0, 7947.0, 4247.0, 2418.0, 1396.0, 839.0, 484.0, 298.0, 186.0, 163.0, 90.0, 74.0, 40.0, 36.0, 23.0, 18.0, 5.0, 6.0, 11.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6786346435546875, -0.653656005859375, -0.6286773681640625, -0.60369873046875, -0.5787200927734375, -0.553741455078125, -0.5287628173828125, -0.5037841796875, -0.4788055419921875, -0.453826904296875, -0.4288482666015625, -0.40386962890625, -0.3788909912109375, -0.353912353515625, -0.3289337158203125, -0.303955078125, -0.2789764404296875, -0.253997802734375, -0.2290191650390625, -0.20404052734375, -0.1790618896484375, -0.154083251953125, -0.1291046142578125, -0.1041259765625, -0.0791473388671875, -0.054168701171875, -0.0291900634765625, -0.00421142578125, 0.0207672119140625, 0.045745849609375, 0.0707244873046875, 0.095703125, 0.1206817626953125, 0.145660400390625, 0.1706390380859375, 0.19561767578125, 0.2205963134765625, 0.245574951171875, 0.2705535888671875, 0.2955322265625, 0.3205108642578125, 0.345489501953125, 0.3704681396484375, 0.39544677734375, 0.4204254150390625, 0.445404052734375, 0.4703826904296875, 0.495361328125, 0.5203399658203125, 0.545318603515625, 0.5702972412109375, 0.59527587890625, 0.6202545166015625, 0.645233154296875, 0.6702117919921875, 0.6951904296875, 0.7201690673828125, 0.745147705078125, 0.7701263427734375, 0.79510498046875, 0.8200836181640625, 0.845062255859375, 0.8700408935546875, 0.89501953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 6.0, 1.0, 6.0, 1.0, 9.0, 7.0, 11.0, 10.0, 15.0, 15.0, 7.0, 18.0, 19.0, 21.0, 34.0, 24.0, 31.0, 37.0, 36.0, 24.0, 33.0, 44.0, 50.0, 45.0, 41.0, 54.0, 34.0, 32.0, 43.0, 27.0, 31.0, 21.0, 28.0, 28.0, 27.0, 20.0, 13.0, 17.0, 22.0, 14.0, 12.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8283462524414062, -0.7968292236328125, -0.7653121948242188, -0.733795166015625, -0.7022781372070312, -0.6707611083984375, -0.6392440795898438, -0.60772705078125, -0.5762100219726562, -0.5446929931640625, -0.5131759643554688, -0.481658935546875, -0.45014190673828125, -0.4186248779296875, -0.38710784912109375, -0.3555908203125, -0.32407379150390625, -0.2925567626953125, -0.26103973388671875, -0.229522705078125, -0.19800567626953125, -0.1664886474609375, -0.13497161865234375, -0.10345458984375, -0.07193756103515625, -0.0404205322265625, -0.00890350341796875, 0.022613525390625, 0.05413055419921875, 0.0856475830078125, 0.11716461181640625, 0.148681640625, 0.18019866943359375, 0.2117156982421875, 0.24323272705078125, 0.274749755859375, 0.30626678466796875, 0.3377838134765625, 0.36930084228515625, 0.40081787109375, 0.43233489990234375, 0.4638519287109375, 0.49536895751953125, 0.526885986328125, 0.5584030151367188, 0.5899200439453125, 0.6214370727539062, 0.6529541015625, 0.6844711303710938, 0.7159881591796875, 0.7475051879882812, 0.779022216796875, 0.8105392456054688, 0.8420562744140625, 0.8735733032226562, 0.90509033203125, 0.9366073608398438, 0.9681243896484375, 0.9996414184570312, 1.031158447265625, 1.0626754760742188, 1.0941925048828125, 1.1257095336914062, 1.1572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 16.0, 40.0, 34.0, 55.0, 84.0, 125.0, 175.0, 310.0, 514.0, 913.0, 1761.0, 3941.0, 10158.0, 27983.0, 90674.0, 361683.0, 398986.0, 100741.0, 30612.0, 10965.0, 4471.0, 1818.0, 949.0, 583.0, 333.0, 175.0, 141.0, 80.0, 62.0, 36.0, 28.0, 29.0, 16.0, 9.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.38507080078125, -1.3404541015625, -1.29583740234375, -1.251220703125, -1.20660400390625, -1.1619873046875, -1.11737060546875, -1.07275390625, -1.02813720703125, -0.9835205078125, -0.93890380859375, -0.894287109375, -0.84967041015625, -0.8050537109375, -0.76043701171875, -0.7158203125, -0.67120361328125, -0.6265869140625, -0.58197021484375, -0.537353515625, -0.49273681640625, -0.4481201171875, -0.40350341796875, -0.35888671875, -0.31427001953125, -0.2696533203125, -0.22503662109375, -0.180419921875, -0.13580322265625, -0.0911865234375, -0.04656982421875, -0.001953125, 0.04266357421875, 0.0872802734375, 0.13189697265625, 0.176513671875, 0.22113037109375, 0.2657470703125, 0.31036376953125, 0.35498046875, 0.39959716796875, 0.4442138671875, 0.48883056640625, 0.533447265625, 0.57806396484375, 0.6226806640625, 0.66729736328125, 0.7119140625, 0.75653076171875, 0.8011474609375, 0.84576416015625, 0.890380859375, 0.93499755859375, 0.9796142578125, 1.02423095703125, 1.06884765625, 1.11346435546875, 1.1580810546875, 1.20269775390625, 1.247314453125, 1.29193115234375, 1.3365478515625, 1.38116455078125, 1.42578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 8.0, 7.0, 16.0, 14.0, 23.0, 20.0, 26.0, 40.0, 31.0, 53.0, 51.0, 42.0, 53.0, 52.0, 49.0, 53.0, 57.0, 57.0, 34.0, 39.0, 34.0, 31.0, 40.0, 27.0, 32.0, 23.0, 14.0, 6.0, 12.0, 12.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4873046875, -1.44317626953125, -1.3990478515625, -1.35491943359375, -1.310791015625, -1.26666259765625, -1.2225341796875, -1.17840576171875, -1.13427734375, -1.09014892578125, -1.0460205078125, -1.00189208984375, -0.957763671875, -0.91363525390625, -0.8695068359375, -0.82537841796875, -0.78125, -0.73712158203125, -0.6929931640625, -0.64886474609375, -0.604736328125, -0.56060791015625, -0.5164794921875, -0.47235107421875, -0.42822265625, -0.38409423828125, -0.3399658203125, -0.29583740234375, -0.251708984375, -0.20758056640625, -0.1634521484375, -0.11932373046875, -0.0751953125, -0.03106689453125, 0.0130615234375, 0.05718994140625, 0.101318359375, 0.14544677734375, 0.1895751953125, 0.23370361328125, 0.27783203125, 0.32196044921875, 0.3660888671875, 0.41021728515625, 0.454345703125, 0.49847412109375, 0.5426025390625, 0.58673095703125, 0.630859375, 0.67498779296875, 0.7191162109375, 0.76324462890625, 0.807373046875, 0.85150146484375, 0.8956298828125, 0.93975830078125, 0.98388671875, 1.02801513671875, 1.0721435546875, 1.11627197265625, 1.160400390625, 1.20452880859375, 1.2486572265625, 1.29278564453125, 1.3369140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 1.0, 9.0, 8.0, 15.0, 17.0, 18.0, 21.0, 42.0, 43.0, 73.0, 106.0, 145.0, 177.0, 315.0, 422.0, 700.0, 1171.0, 2159.0, 4276.0, 8591.0, 19152.0, 48538.0, 130863.0, 358859.0, 277772.0, 117405.0, 43183.0, 17632.0, 7838.0, 3810.0, 2038.0, 1165.0, 659.0, 392.0, 247.0, 188.0, 137.0, 81.0, 98.0, 50.0, 43.0, 21.0, 18.0, 12.0, 11.0, 12.0, 8.0, 4.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.1705322265625, -0.16535568237304688, -0.16017913818359375, -0.15500259399414062, -0.1498260498046875, -0.14464950561523438, -0.13947296142578125, -0.13429641723632812, -0.129119873046875, -0.12394332885742188, -0.11876678466796875, -0.11359024047851562, -0.1084136962890625, -0.10323715209960938, -0.09806060791015625, -0.09288406372070312, -0.08770751953125, -0.08253097534179688, -0.07735443115234375, -0.07217788696289062, -0.0670013427734375, -0.061824798583984375, -0.05664825439453125, -0.051471710205078125, -0.046295166015625, -0.041118621826171875, -0.03594207763671875, -0.030765533447265625, -0.0255889892578125, -0.020412445068359375, -0.01523590087890625, -0.010059356689453125, -0.0048828125, 0.000293731689453125, 0.00547027587890625, 0.010646820068359375, 0.0158233642578125, 0.020999908447265625, 0.02617645263671875, 0.031352996826171875, 0.036529541015625, 0.041706085205078125, 0.04688262939453125, 0.052059173583984375, 0.0572357177734375, 0.062412261962890625, 0.06758880615234375, 0.07276535034179688, 0.07794189453125, 0.08311843872070312, 0.08829498291015625, 0.09347152709960938, 0.0986480712890625, 0.10382461547851562, 0.10900115966796875, 0.11417770385742188, 0.119354248046875, 0.12453079223632812, 0.12970733642578125, 0.13488388061523438, 0.1400604248046875, 0.14523696899414062, 0.15041351318359375, 0.15559005737304688, 0.1607666015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 7.0, 12.0, 12.0, 13.0, 22.0, 17.0, 17.0, 32.0, 38.0, 50.0, 60.0, 70.0, 102.0, 141.0, 76.0, 67.0, 63.0, 38.0, 49.0, 21.0, 22.0, 10.0, 13.0, 11.0, 9.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.738569259643555e-05, -4.587322473526001e-05, -4.436075687408447e-05, -4.2848289012908936e-05, -4.13358211517334e-05, -3.982335329055786e-05, -3.8310885429382324e-05, -3.679841756820679e-05, -3.528594970703125e-05, -3.377348184585571e-05, -3.2261013984680176e-05, -3.074854612350464e-05, -2.92360782623291e-05, -2.7723610401153564e-05, -2.6211142539978027e-05, -2.469867467880249e-05, -2.3186206817626953e-05, -2.1673738956451416e-05, -2.016127109527588e-05, -1.8648803234100342e-05, -1.7136335372924805e-05, -1.5623867511749268e-05, -1.411139965057373e-05, -1.2598931789398193e-05, -1.1086463928222656e-05, -9.573996067047119e-06, -8.061528205871582e-06, -6.549060344696045e-06, -5.036592483520508e-06, -3.5241246223449707e-06, -2.0116567611694336e-06, -4.991888999938965e-07, 1.0132789611816406e-06, 2.5257468223571777e-06, 4.038214683532715e-06, 5.550682544708252e-06, 7.063150405883789e-06, 8.575618267059326e-06, 1.0088086128234863e-05, 1.16005539894104e-05, 1.3113021850585938e-05, 1.4625489711761475e-05, 1.6137957572937012e-05, 1.765042543411255e-05, 1.9162893295288086e-05, 2.0675361156463623e-05, 2.218782901763916e-05, 2.3700296878814697e-05, 2.5212764739990234e-05, 2.672523260116577e-05, 2.823770046234131e-05, 2.9750168323516846e-05, 3.126263618469238e-05, 3.277510404586792e-05, 3.428757190704346e-05, 3.5800039768218994e-05, 3.731250762939453e-05, 3.882497549057007e-05, 4.0337443351745605e-05, 4.184991121292114e-05, 4.336237907409668e-05, 4.487484693527222e-05, 4.6387314796447754e-05, 4.789978265762329e-05, 4.941225051879883e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 5.0, 9.0, 7.0, 17.0, 21.0, 42.0, 44.0, 55.0, 78.0, 120.0, 201.0, 298.0, 436.0, 669.0, 1062.0, 1818.0, 3064.0, 5765.0, 11771.0, 29429.0, 104953.0, 495299.0, 288799.0, 63549.0, 20808.0, 9037.0, 4569.0, 2508.0, 1511.0, 892.0, 590.0, 388.0, 250.0, 170.0, 112.0, 65.0, 48.0, 37.0, 15.0, 16.0, 7.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.349853515625, -0.33919525146484375, -0.3285369873046875, -0.31787872314453125, -0.307220458984375, -0.29656219482421875, -0.2859039306640625, -0.27524566650390625, -0.26458740234375, -0.25392913818359375, -0.2432708740234375, -0.23261260986328125, -0.221954345703125, -0.21129608154296875, -0.2006378173828125, -0.18997955322265625, -0.1793212890625, -0.16866302490234375, -0.1580047607421875, -0.14734649658203125, -0.136688232421875, -0.12602996826171875, -0.1153717041015625, -0.10471343994140625, -0.09405517578125, -0.08339691162109375, -0.0727386474609375, -0.06208038330078125, -0.051422119140625, -0.04076385498046875, -0.0301055908203125, -0.01944732666015625, -0.0087890625, 0.00186920166015625, 0.0125274658203125, 0.02318572998046875, 0.033843994140625, 0.04450225830078125, 0.0551605224609375, 0.06581878662109375, 0.07647705078125, 0.08713531494140625, 0.0977935791015625, 0.10845184326171875, 0.119110107421875, 0.12976837158203125, 0.1404266357421875, 0.15108489990234375, 0.1617431640625, 0.17240142822265625, 0.1830596923828125, 0.19371795654296875, 0.204376220703125, 0.21503448486328125, 0.2256927490234375, 0.23635101318359375, 0.24700927734375, 0.25766754150390625, 0.2683258056640625, 0.27898406982421875, 0.289642333984375, 0.30030059814453125, 0.3109588623046875, 0.32161712646484375, 0.332275390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 8.0, 14.0, 16.0, 22.0, 46.0, 58.0, 83.0, 138.0, 185.0, 124.0, 84.0, 81.0, 37.0, 19.0, 20.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2648277282714844, -0.25670623779296875, -0.24858474731445312, -0.2404632568359375, -0.23234176635742188, -0.22422027587890625, -0.21609878540039062, -0.207977294921875, -0.19985580444335938, -0.19173431396484375, -0.18361282348632812, -0.1754913330078125, -0.16736984252929688, -0.15924835205078125, -0.15112686157226562, -0.14300537109375, -0.13488388061523438, -0.12676239013671875, -0.11864089965820312, -0.1105194091796875, -0.10239791870117188, -0.09427642822265625, -0.08615493774414062, -0.078033447265625, -0.06991195678710938, -0.06179046630859375, -0.053668975830078125, -0.0455474853515625, -0.037425994873046875, -0.02930450439453125, -0.021183013916015625, -0.0130615234375, -0.004940032958984375, 0.00318145751953125, 0.011302947998046875, 0.0194244384765625, 0.027545928955078125, 0.03566741943359375, 0.043788909912109375, 0.051910400390625, 0.060031890869140625, 0.06815338134765625, 0.07627487182617188, 0.0843963623046875, 0.09251785278320312, 0.10063934326171875, 0.10876083374023438, 0.11688232421875, 0.12500381469726562, 0.13312530517578125, 0.14124679565429688, 0.1493682861328125, 0.15748977661132812, 0.16561126708984375, 0.17373275756835938, 0.181854248046875, 0.18997573852539062, 0.19809722900390625, 0.20621871948242188, 0.2143402099609375, 0.22246170043945312, 0.23058319091796875, 0.23870468139648438, 0.246826171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 21.0, 24.0, 58.0, 71.0, 127.0, 128.0, 141.0, 126.0, 109.0, 75.0, 46.0, 25.0, 17.0, 11.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.467543601989746, -2.367278575897217, -2.2670133113861084, -2.166748285293579, -2.06648325920105, -1.966218113899231, -1.865952968597412, -1.7656879425048828, -1.665422797203064, -1.5651576519012451, -1.4648926258087158, -1.364627480506897, -1.2643623352050781, -1.1640973091125488, -1.06383216381073, -0.9635670781135559, -0.8633019924163818, -0.7630369067192078, -0.6627718210220337, -0.5625066757202148, -0.46224159002304077, -0.3619765043258667, -0.26171135902404785, -0.16144627332687378, -0.06118118762969971, 0.03908391296863556, 0.13934901356697083, 0.23961412906646729, 0.33987921476364136, 0.44014430046081543, 0.5404094457626343, 0.6406745314598083, 0.7409393787384033, 0.8412044644355774, 0.9414695501327515, 1.0417346954345703, 1.1419997215270996, 1.2422648668289185, 1.3425300121307373, 1.4427950382232666, 1.5430601835250854, 1.6433253288269043, 1.7435903549194336, 1.8438555002212524, 1.9441206455230713, 2.0443856716156006, 2.144650936126709, 2.2449159622192383, 2.3451809883117676, 2.445446014404297, 2.5457112789154053, 2.6459763050079346, 2.746241331100464, 2.8465065956115723, 2.9467716217041016, 3.047036647796631, 3.14730167388916, 3.2475666999816895, 3.347831964492798, 3.448096990585327, 3.5483620166778564, 3.648627281188965, 3.748892307281494, 3.8491573333740234, 3.949422597885132]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 9.0, 16.0, 16.0, 17.0, 16.0, 18.0, 25.0, 30.0, 29.0, 29.0, 33.0, 48.0, 52.0, 58.0, 46.0, 45.0, 43.0, 49.0, 46.0, 52.0, 39.0, 39.0, 36.0, 37.0, 30.0, 22.0, 18.0, 16.0, 20.0, 10.0, 9.0, 11.0, 10.0, 13.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4961495399475098, -2.424999475479126, -2.353849411010742, -2.2826995849609375, -2.2115495204925537, -2.14039945602417, -2.069249391555786, -1.9980993270874023, -1.9269492626190186, -1.8557991981506348, -1.7846492528915405, -1.7134991884231567, -1.642349123954773, -1.5711991786956787, -1.500049114227295, -1.4288990497589111, -1.357749104499817, -1.286599040031433, -1.2154490947723389, -1.144299030303955, -1.0731489658355713, -1.0019989013671875, -0.9308489561080933, -0.8596988916397095, -0.7885488867759705, -0.7173988819122314, -0.6462488174438477, -0.5750988125801086, -0.5039488077163696, -0.43279874324798584, -0.3616487383842468, -0.2904987037181854, -0.21934866905212402, -0.14819863438606262, -0.07704861462116241, -0.005898594856262207, 0.0652514398097992, 0.1364014744758606, 0.2075514793395996, 0.278701514005661, 0.3498515486717224, 0.4210015833377838, 0.4921516180038452, 0.5633016228675842, 0.6344516277313232, 0.705601692199707, 0.776751697063446, 0.8479017019271851, 0.9190517663955688, 0.9902017712593079, 1.0613517761230469, 1.1325018405914307, 1.2036519050598145, 1.2748019695281982, 1.3459519147872925, 1.4171019792556763, 1.4882519245147705, 1.5594019889831543, 1.6305519342422485, 1.7017019987106323, 1.7728520631790161, 1.8440020084381104, 1.9151520729064941, 1.986302137374878, 2.0574522018432617]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 9.0, 7.0, 10.0, 10.0, 13.0, 16.0, 21.0, 26.0, 35.0, 36.0, 45.0, 67.0, 102.0, 142.0, 130.0, 215.0, 275.0, 355.0, 508.0, 616.0, 892.0, 1111.0, 1515.0, 2084.0, 1033957.0, 2080.0, 1588.0, 1140.0, 879.0, 694.0, 500.0, 381.0, 271.0, 187.0, 156.0, 120.0, 107.0, 82.0, 51.0, 36.0, 25.0, 31.0, 21.0, 20.0, 14.0, 8.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0], "bins": [-2.2587437629699707, -2.1933069229125977, -2.1278700828552246, -2.0624332427978516, -1.9969964027404785, -1.9315595626831055, -1.866122841835022, -1.800686001777649, -1.7352491617202759, -1.6698123216629028, -1.6043754816055298, -1.5389386415481567, -1.4735019207000732, -1.4080650806427002, -1.3426282405853271, -1.277191400527954, -1.211754560470581, -1.146317720413208, -1.080880880355835, -1.015444040298462, -0.9500072598457336, -0.8845704197883606, -0.8191336393356323, -0.7536967992782593, -0.6882599592208862, -0.6228231191635132, -0.5573862791061401, -0.49194949865341187, -0.4265126585960388, -0.36107581853866577, -0.2956390082836151, -0.23020219802856445, -0.1647651195526123, -0.09932829439640045, -0.0338914692401886, 0.031545355916023254, 0.09698218107223511, 0.16241902112960815, 0.2278558313846588, 0.2932926416397095, 0.3587294816970825, 0.42416632175445557, 0.4896031320095062, 0.5550399422645569, 0.6204767823219299, 0.685913622379303, 0.7513504028320312, 0.8167872428894043, 0.8822240829467773, 0.9476609230041504, 1.0130977630615234, 1.0785346031188965, 1.1439714431762695, 1.2094082832336426, 1.274845004081726, 1.3402818441390991, 1.4057186841964722, 1.4711555242538452, 1.5365923643112183, 1.6020292043685913, 1.6674659252166748, 1.7329027652740479, 1.798339605331421, 1.863776445388794, 1.929213285446167]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 20.0, 29.0, 36.0, 22.0, 42.0, 70.0, 123.0, 251.0, 517.0, 1363.0, 3337.0, 8114.0, 23150.0, 51392964.0, 23931.0, 9734.0, 4346.0, 1814.0, 783.0, 346.0, 145.0, 76.0, 39.0, 25.0, 21.0, 11.0, 8.0, 1.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.072476387023926, -6.861478805541992, -6.650481700897217, -6.439484119415283, -6.22848653793335, -6.017489433288574, -5.806491851806641, -5.595494270324707, -5.384497165679932, -5.173499584197998, -4.962502479553223, -4.751504898071289, -4.5405073165893555, -4.32951021194458, -4.1185126304626465, -3.907515287399292, -3.6965177059173584, -3.485520362854004, -3.2745227813720703, -3.063525438308716, -2.8525280952453613, -2.6415305137634277, -2.4305331707000732, -2.2195358276367188, -2.008538246154785, -1.7975407838821411, -1.5865434408187866, -1.3755459785461426, -1.164548635482788, -0.953551173210144, -0.7425537109375, -0.5315563678741455, -0.320559024810791, -0.10956160724163055, 0.10143581032752991, 0.31243324279785156, 0.5234306454658508, 0.7344280481338501, 0.9454255104064941, 1.1564228534698486, 1.3674203157424927, 1.5784177780151367, 1.7894151210784912, 2.0004124641418457, 2.2114100456237793, 2.422407388687134, 2.6334047317504883, 2.844402313232422, 3.0553996562957764, 3.266396999359131, 3.4773945808410645, 3.688391923904419, 3.8993892669677734, 4.110386848449707, 4.321384429931641, 4.532381534576416, 4.74337911605835, 4.954376697540283, 5.165373802185059, 5.376371383666992, 5.587368965148926, 5.798366069793701, 6.009363651275635, 6.22036075592041, 6.431358337402344]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 9.0, 11.0, 20.0, 21.0, 25.0, 52.0, 90.0, 119.0, 159.0, 274.0, 369.0, 654.0, 989.0, 1713.0, 2702.0, 4597.0, 7737.0, 13427.0, 23386.0, 41755.0, 75000.0, 130735.0, 215733.0, 328222.0, 521927.0, 3131769.0, 819608.0, 366794.0, 247929.0, 152645.0, 87470.0, 49823.0, 27634.0, 15679.0, 8753.0, 5259.0, 3178.0, 1947.0, 1225.0, 725.0, 443.0, 283.0, 177.0, 137.0, 79.0, 54.0, 28.0, 20.0, 17.0, 15.0, 8.0, 9.0, 6.0, 2.0, 1.0], "bins": [-1.4921875, -1.449127197265625, -1.40606689453125, -1.363006591796875, -1.3199462890625, -1.276885986328125, -1.23382568359375, -1.190765380859375, -1.147705078125, -1.104644775390625, -1.06158447265625, -1.018524169921875, -0.9754638671875, -0.932403564453125, -0.88934326171875, -0.846282958984375, -0.80322265625, -0.760162353515625, -0.71710205078125, -0.674041748046875, -0.6309814453125, -0.587921142578125, -0.54486083984375, -0.501800537109375, -0.458740234375, -0.415679931640625, -0.37261962890625, -0.329559326171875, -0.2864990234375, -0.243438720703125, -0.20037841796875, -0.157318115234375, -0.1142578125, -0.071197509765625, -0.02813720703125, 0.014923095703125, 0.0579833984375, 0.101043701171875, 0.14410400390625, 0.187164306640625, 0.230224609375, 0.273284912109375, 0.31634521484375, 0.359405517578125, 0.4024658203125, 0.445526123046875, 0.48858642578125, 0.531646728515625, 0.57470703125, 0.617767333984375, 0.66082763671875, 0.703887939453125, 0.7469482421875, 0.790008544921875, 0.83306884765625, 0.876129150390625, 0.919189453125, 0.962249755859375, 1.00531005859375, 1.048370361328125, 1.0914306640625, 1.134490966796875, 1.17755126953125, 1.220611572265625, 1.263671875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 9.0, 11.0, 13.0, 10.0, 22.0, 16.0, 24.0, 22.0, 28.0, 25.0, 13.0, 38.0, 38.0, 53.0, 54.0, 54.0, 123.0, 779.0, 245.0, 59.0, 49.0, 42.0, 41.0, 36.0, 33.0, 30.0, 15.0, 20.0, 26.0, 14.0, 12.0, 10.0, 11.0, 8.0, 8.0, 9.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.55487060546875, -7.3089599609375, -7.06304931640625, -6.817138671875, -6.57122802734375, -6.3253173828125, -6.07940673828125, -5.83349609375, -5.58758544921875, -5.3416748046875, -5.09576416015625, -4.849853515625, -4.60394287109375, -4.3580322265625, -4.11212158203125, -3.8662109375, -3.62030029296875, -3.3743896484375, -3.12847900390625, -2.882568359375, -2.63665771484375, -2.3907470703125, -2.14483642578125, -1.89892578125, -1.65301513671875, -1.4071044921875, -1.16119384765625, -0.915283203125, -0.66937255859375, -0.4234619140625, -0.17755126953125, 0.068359375, 0.31427001953125, 0.5601806640625, 0.80609130859375, 1.052001953125, 1.29791259765625, 1.5438232421875, 1.78973388671875, 2.03564453125, 2.28155517578125, 2.5274658203125, 2.77337646484375, 3.019287109375, 3.26519775390625, 3.5111083984375, 3.75701904296875, 4.0029296875, 4.24884033203125, 4.4947509765625, 4.74066162109375, 4.986572265625, 5.23248291015625, 5.4783935546875, 5.72430419921875, 5.97021484375, 6.21612548828125, 6.4620361328125, 6.70794677734375, 6.953857421875, 7.19976806640625, 7.4456787109375, 7.69158935546875, 7.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 9.0, 7.0, 14.0, 20.0, 43.0, 77.0, 138.0, 205.0, 375.0, 616.0, 921.0, 1623.0, 2517.0, 3951.0, 6200.0, 9470.0, 14756.0, 21888.0, 31698.0, 45857.0, 64232.0, 87046.0, 115635.0, 146235.0, 179375.0, 211251.0, 257409.0, 727671.0, 2302403.0, 833116.0, 264815.0, 214065.0, 181660.0, 148634.0, 117885.0, 89314.0, 65568.0, 47631.0, 33031.0, 22369.0, 15004.0, 9839.0, 6316.0, 4126.0, 2461.0, 1607.0, 971.0, 569.0, 351.0, 200.0, 111.0, 63.0, 30.0, 29.0, 13.0, 9.0, 10.0, 4.0, 2.0, 2.0], "bins": [-0.63232421875, -0.6128921508789062, -0.5934600830078125, -0.5740280151367188, -0.554595947265625, -0.5351638793945312, -0.5157318115234375, -0.49629974365234375, -0.47686767578125, -0.45743560791015625, -0.4380035400390625, -0.41857147216796875, -0.399139404296875, -0.37970733642578125, -0.3602752685546875, -0.34084320068359375, -0.3214111328125, -0.30197906494140625, -0.2825469970703125, -0.26311492919921875, -0.243682861328125, -0.22425079345703125, -0.2048187255859375, -0.18538665771484375, -0.16595458984375, -0.14652252197265625, -0.1270904541015625, -0.10765838623046875, -0.088226318359375, -0.06879425048828125, -0.0493621826171875, -0.02993011474609375, -0.010498046875, 0.00893402099609375, 0.0283660888671875, 0.04779815673828125, 0.067230224609375, 0.08666229248046875, 0.1060943603515625, 0.12552642822265625, 0.14495849609375, 0.16439056396484375, 0.1838226318359375, 0.20325469970703125, 0.222686767578125, 0.24211883544921875, 0.2615509033203125, 0.28098297119140625, 0.3004150390625, 0.31984710693359375, 0.3392791748046875, 0.35871124267578125, 0.378143310546875, 0.39757537841796875, 0.4170074462890625, 0.43643951416015625, 0.45587158203125, 0.47530364990234375, 0.4947357177734375, 0.5141677856445312, 0.533599853515625, 0.5530319213867188, 0.5724639892578125, 0.5918960571289062, 0.611328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 10.0, 8.0, 12.0, 13.0, 15.0, 19.0, 31.0, 28.0, 34.0, 34.0, 36.0, 48.0, 47.0, 38.0, 57.0, 109.0, 731.0, 326.0, 48.0, 32.0, 46.0, 42.0, 34.0, 39.0, 22.0, 12.0, 27.0, 22.0, 21.0, 19.0, 14.0, 7.0, 11.0, 10.0, 6.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.846435546875, -4.66552734375, -4.484619140625, -4.3037109375, -4.122802734375, -3.94189453125, -3.760986328125, -3.580078125, -3.399169921875, -3.21826171875, -3.037353515625, -2.8564453125, -2.675537109375, -2.49462890625, -2.313720703125, -2.1328125, -1.951904296875, -1.77099609375, -1.590087890625, -1.4091796875, -1.228271484375, -1.04736328125, -0.866455078125, -0.685546875, -0.504638671875, -0.32373046875, -0.142822265625, 0.0380859375, 0.218994140625, 0.39990234375, 0.580810546875, 0.76171875, 0.942626953125, 1.12353515625, 1.304443359375, 1.4853515625, 1.666259765625, 1.84716796875, 2.028076171875, 2.208984375, 2.389892578125, 2.57080078125, 2.751708984375, 2.9326171875, 3.113525390625, 3.29443359375, 3.475341796875, 3.65625, 3.837158203125, 4.01806640625, 4.198974609375, 4.3798828125, 4.560791015625, 4.74169921875, 4.922607421875, 5.103515625, 5.284423828125, 5.46533203125, 5.646240234375, 5.8271484375, 6.008056640625, 6.18896484375, 6.369873046875, 6.55078125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 9.0, 18.0, 19.0, 37.0, 27.0, 37.0, 57.0, 77.0, 108.0, 140.0, 201.0, 305.0, 431.0, 558.0, 820.0, 1191.0, 1969.0, 3801.0, 8582.0, 24006.0, 71284.0, 201838.0, 477514.0, 2407099.0, 2307029.0, 474175.0, 198763.0, 69436.0, 23595.0, 8586.0, 3689.0, 1989.0, 1233.0, 848.0, 549.0, 414.0, 257.0, 202.0, 130.0, 117.0, 82.0, 55.0, 47.0, 31.0, 29.0, 11.0, 6.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-1.7333984375, -1.6808624267578125, -1.628326416015625, -1.5757904052734375, -1.52325439453125, -1.4707183837890625, -1.418182373046875, -1.3656463623046875, -1.3131103515625, -1.2605743408203125, -1.208038330078125, -1.1555023193359375, -1.10296630859375, -1.0504302978515625, -0.997894287109375, -0.9453582763671875, -0.892822265625, -0.8402862548828125, -0.787750244140625, -0.7352142333984375, -0.68267822265625, -0.6301422119140625, -0.577606201171875, -0.5250701904296875, -0.4725341796875, -0.4199981689453125, -0.367462158203125, -0.3149261474609375, -0.26239013671875, -0.2098541259765625, -0.157318115234375, -0.1047821044921875, -0.05224609375, 0.0002899169921875, 0.052825927734375, 0.1053619384765625, 0.15789794921875, 0.2104339599609375, 0.262969970703125, 0.3155059814453125, 0.3680419921875, 0.4205780029296875, 0.473114013671875, 0.5256500244140625, 0.57818603515625, 0.6307220458984375, 0.683258056640625, 0.7357940673828125, 0.788330078125, 0.8408660888671875, 0.893402099609375, 0.9459381103515625, 0.99847412109375, 1.0510101318359375, 1.103546142578125, 1.1560821533203125, 1.2086181640625, 1.2611541748046875, 1.313690185546875, 1.3662261962890625, 1.41876220703125, 1.4712982177734375, 1.523834228515625, 1.5763702392578125, 1.62890625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 4.0, 10.0, 14.0, 13.0, 12.0, 18.0, 16.0, 25.0, 21.0, 24.0, 28.0, 31.0, 31.0, 37.0, 31.0, 37.0, 35.0, 41.0, 214.0, 662.0, 266.0, 41.0, 40.0, 40.0, 38.0, 43.0, 37.0, 29.0, 26.0, 27.0, 19.0, 15.0, 19.0, 13.0, 12.0, 11.0, 6.0, 8.0, 9.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.90234375, -3.786468505859375, -3.67059326171875, -3.554718017578125, -3.4388427734375, -3.322967529296875, -3.20709228515625, -3.091217041015625, -2.975341796875, -2.859466552734375, -2.74359130859375, -2.627716064453125, -2.5118408203125, -2.395965576171875, -2.28009033203125, -2.164215087890625, -2.04833984375, -1.932464599609375, -1.81658935546875, -1.700714111328125, -1.5848388671875, -1.468963623046875, -1.35308837890625, -1.237213134765625, -1.121337890625, -1.005462646484375, -0.88958740234375, -0.773712158203125, -0.6578369140625, -0.541961669921875, -0.42608642578125, -0.310211181640625, -0.1943359375, -0.078460693359375, 0.03741455078125, 0.153289794921875, 0.2691650390625, 0.385040283203125, 0.50091552734375, 0.616790771484375, 0.732666015625, 0.848541259765625, 0.96441650390625, 1.080291748046875, 1.1961669921875, 1.312042236328125, 1.42791748046875, 1.543792724609375, 1.65966796875, 1.775543212890625, 1.89141845703125, 2.007293701171875, 2.1231689453125, 2.239044189453125, 2.35491943359375, 2.470794677734375, 2.586669921875, 2.702545166015625, 2.81842041015625, 2.934295654296875, 3.0501708984375, 3.166046142578125, 3.28192138671875, 3.397796630859375, 3.513671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 45.0, 102.0, 216.0, 316.0, 192.0, 93.0, 20.0, 12.0, 1.0], "bins": [-38.39568328857422, -37.740325927734375, -37.0849723815918, -36.42961502075195, -35.774261474609375, -35.11890411376953, -34.46355056762695, -33.80819320678711, -33.15283966064453, -32.49748229980469, -31.84212875366211, -31.1867733001709, -30.531417846679688, -29.876060485839844, -29.220705032348633, -28.565349578857422, -27.909992218017578, -27.254636764526367, -26.599281311035156, -25.943925857543945, -25.288570404052734, -24.63321304321289, -23.97785758972168, -23.32250213623047, -22.667146682739258, -22.011791229248047, -21.356435775756836, -20.701080322265625, -20.04572296142578, -19.39036750793457, -18.73501205444336, -18.07965660095215, -17.424301147460938, -16.768945693969727, -16.113590240478516, -15.458233833312988, -14.802878379821777, -14.147522926330566, -13.492166519165039, -12.836811065673828, -12.181456565856934, -11.526101112365723, -10.870744705200195, -10.215389251708984, -9.560033798217773, -8.904678344726562, -8.249322891235352, -7.593966484069824, -6.938611030578613, -6.283255577087402, -5.627899646759033, -4.972543716430664, -4.317188262939453, -3.661832571029663, -3.006476879119873, -2.351120948791504, -1.695765495300293, -1.040409803390503, -0.3850541114807129, 0.27030158042907715, 0.9256572723388672, 1.5810129642486572, 2.2363686561584473, 2.8917245864868164, 3.5470800399780273]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 12.0, 5.0, 10.0, 7.0, 10.0, 21.0, 14.0, 14.0, 22.0, 20.0, 27.0, 38.0, 41.0, 40.0, 40.0, 39.0, 38.0, 39.0, 36.0, 38.0, 42.0, 40.0, 37.0, 40.0, 38.0, 26.0, 20.0, 35.0, 23.0, 25.0, 21.0, 25.0, 17.0, 18.0, 10.0, 10.0, 17.0, 12.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-6.85384464263916, -6.670539379119873, -6.487234115600586, -6.303928375244141, -6.1206231117248535, -5.937317848205566, -5.754012584686279, -5.570707321166992, -5.387401580810547, -5.20409631729126, -5.020791053771973, -4.837485313415527, -4.65418004989624, -4.470874786376953, -4.287569522857666, -4.104264259338379, -3.920958995819092, -3.7376537322998047, -3.5543482303619385, -3.3710429668426514, -3.187737464904785, -3.004432201385498, -2.821126937866211, -2.637821674346924, -2.4545161724090576, -2.2712109088897705, -2.0879054069519043, -1.9046001434326172, -1.7212947607040405, -1.5379893779754639, -1.3546841144561768, -1.1713787317276, -0.9880733489990234, -0.8047679662704468, -0.6214626431465149, -0.438157320022583, -0.25485193729400635, -0.07154655456542969, 0.11175870895385742, 0.2950640916824341, 0.47836947441101074, 0.6616748571395874, 0.8449801802635193, 1.0282855033874512, 1.2115908861160278, 1.3948962688446045, 1.5782015323638916, 1.7615069150924683, 1.944812297821045, 2.128117561340332, 2.3114230632781982, 2.4947283267974854, 2.6780338287353516, 2.8613390922546387, 3.044644355773926, 3.227949619293213, 3.411255121231079, 3.594560384750366, 3.7778658866882324, 3.9611711502075195, 4.144476413726807, 4.327781677246094, 4.511087417602539, 4.694392681121826, 4.877697944641113]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 10.0, 3.0, 10.0, 10.0, 20.0, 22.0, 35.0, 61.0, 133.0, 231.0, 536.0, 1270.0, 2966.0, 7230.0, 22256.0, 102875.0, 1521857.0, 2315876.0, 174180.0, 28973.0, 9390.0, 3561.0, 1448.0, 643.0, 319.0, 151.0, 78.0, 57.0, 27.0, 16.0, 9.0, 13.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.2281970977783203, -0.21945571899414062, -0.21071434020996094, -0.20197296142578125, -0.19323158264160156, -0.18449020385742188, -0.1757488250732422, -0.1670074462890625, -0.1582660675048828, -0.14952468872070312, -0.14078330993652344, -0.13204193115234375, -0.12330055236816406, -0.11455917358398438, -0.10581779479980469, -0.097076416015625, -0.08833503723144531, -0.07959365844726562, -0.07085227966308594, -0.06211090087890625, -0.05336952209472656, -0.044628143310546875, -0.03588676452636719, -0.0271453857421875, -0.018404006958007812, -0.009662628173828125, -0.0009212493896484375, 0.00782012939453125, 0.016561508178710938, 0.025302886962890625, 0.03404426574707031, 0.04278564453125, 0.05152702331542969, 0.060268402099609375, 0.06900978088378906, 0.07775115966796875, 0.08649253845214844, 0.09523391723632812, 0.10397529602050781, 0.1127166748046875, 0.12145805358886719, 0.13019943237304688, 0.13894081115722656, 0.14768218994140625, 0.15642356872558594, 0.16516494750976562, 0.1739063262939453, 0.182647705078125, 0.1913890838623047, 0.20013046264648438, 0.20887184143066406, 0.21761322021484375, 0.22635459899902344, 0.23509597778320312, 0.2438373565673828, 0.2525787353515625, 0.2613201141357422, 0.2700614929199219, 0.27880287170410156, 0.28754425048828125, 0.29628562927246094, 0.3050270080566406, 0.3137683868408203, 0.322509765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 7.0, 11.0, 12.0, 11.0, 20.0, 20.0, 27.0, 37.0, 44.0, 50.0, 61.0, 43.0, 81.0, 78.0, 75.0, 53.0, 45.0, 59.0, 45.0, 59.0, 34.0, 27.0, 24.0, 13.0, 21.0, 13.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12065315246582031, -0.11618423461914062, -0.11171531677246094, -0.10724639892578125, -0.10277748107910156, -0.09830856323242188, -0.09383964538574219, -0.0893707275390625, -0.08490180969238281, -0.08043289184570312, -0.07596397399902344, -0.07149505615234375, -0.06702613830566406, -0.06255722045898438, -0.05808830261230469, -0.053619384765625, -0.04915046691894531, -0.044681549072265625, -0.04021263122558594, -0.03574371337890625, -0.03127479553222656, -0.026805877685546875, -0.022336959838867188, -0.0178680419921875, -0.013399124145507812, -0.008930206298828125, -0.0044612884521484375, 7.62939453125e-06, 0.0044765472412109375, 0.008945465087890625, 0.013414382934570312, 0.01788330078125, 0.022352218627929688, 0.026821136474609375, 0.03129005432128906, 0.03575897216796875, 0.04022789001464844, 0.044696807861328125, 0.04916572570800781, 0.0536346435546875, 0.05810356140136719, 0.06257247924804688, 0.06704139709472656, 0.07151031494140625, 0.07597923278808594, 0.08044815063476562, 0.08491706848144531, 0.089385986328125, 0.09385490417480469, 0.09832382202148438, 0.10279273986816406, 0.10726165771484375, 0.11173057556152344, 0.11619949340820312, 0.12066841125488281, 0.1251373291015625, 0.1296062469482422, 0.13407516479492188, 0.13854408264160156, 0.14301300048828125, 0.14748191833496094, 0.15195083618164062, 0.1564197540283203, 0.160888671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 2.0, 8.0, 5.0, 7.0, 13.0, 23.0, 28.0, 37.0, 54.0, 77.0, 162.0, 260.0, 501.0, 1235.0, 3669.0, 12347.0, 61325.0, 530538.0, 2703471.0, 774085.0, 83944.0, 15354.0, 4281.0, 1524.0, 584.0, 314.0, 144.0, 91.0, 46.0, 33.0, 31.0, 17.0, 11.0, 15.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17236328125, -0.1665363311767578, -0.16070938110351562, -0.15488243103027344, -0.14905548095703125, -0.14322853088378906, -0.13740158081054688, -0.1315746307373047, -0.1257476806640625, -0.11992073059082031, -0.11409378051757812, -0.10826683044433594, -0.10243988037109375, -0.09661293029785156, -0.09078598022460938, -0.08495903015136719, -0.079132080078125, -0.07330513000488281, -0.06747817993164062, -0.06165122985839844, -0.05582427978515625, -0.04999732971191406, -0.044170379638671875, -0.03834342956542969, -0.0325164794921875, -0.026689529418945312, -0.020862579345703125, -0.015035629272460938, -0.00920867919921875, -0.0033817291259765625, 0.002445220947265625, 0.008272171020507812, 0.01409912109375, 0.019926071166992188, 0.025753021240234375, 0.03157997131347656, 0.03740692138671875, 0.04323387145996094, 0.049060821533203125, 0.05488777160644531, 0.0607147216796875, 0.06654167175292969, 0.07236862182617188, 0.07819557189941406, 0.08402252197265625, 0.08984947204589844, 0.09567642211914062, 0.10150337219238281, 0.107330322265625, 0.11315727233886719, 0.11898422241210938, 0.12481117248535156, 0.13063812255859375, 0.13646507263183594, 0.14229202270507812, 0.1481189727783203, 0.1539459228515625, 0.1597728729248047, 0.16559982299804688, 0.17142677307128906, 0.17725372314453125, 0.18308067321777344, 0.18890762329101562, 0.1947345733642578, 0.2005615234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 13.0, 8.0, 23.0, 35.0, 34.0, 58.0, 87.0, 114.0, 200.0, 240.0, 325.0, 427.0, 447.0, 486.0, 413.0, 323.0, 221.0, 184.0, 114.0, 83.0, 56.0, 37.0, 31.0, 21.0, 23.0, 13.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12817859649658203, -0.12452125549316406, -0.1208639144897461, -0.11720657348632812, -0.11354923248291016, -0.10989189147949219, -0.10623455047607422, -0.10257720947265625, -0.09891986846923828, -0.09526252746582031, -0.09160518646240234, -0.08794784545898438, -0.0842905044555664, -0.08063316345214844, -0.07697582244873047, -0.0733184814453125, -0.06966114044189453, -0.06600379943847656, -0.062346458435058594, -0.058689117431640625, -0.055031776428222656, -0.05137443542480469, -0.04771709442138672, -0.04405975341796875, -0.04040241241455078, -0.03674507141113281, -0.033087730407714844, -0.029430389404296875, -0.025773048400878906, -0.022115707397460938, -0.01845836639404297, -0.014801025390625, -0.011143684387207031, -0.0074863433837890625, -0.0038290023803710938, -0.000171661376953125, 0.0034856796264648438, 0.0071430206298828125, 0.010800361633300781, 0.01445770263671875, 0.01811504364013672, 0.021772384643554688, 0.025429725646972656, 0.029087066650390625, 0.032744407653808594, 0.03640174865722656, 0.04005908966064453, 0.0437164306640625, 0.04737377166748047, 0.05103111267089844, 0.054688453674316406, 0.058345794677734375, 0.062003135681152344, 0.06566047668457031, 0.06931781768798828, 0.07297515869140625, 0.07663249969482422, 0.08028984069824219, 0.08394718170166016, 0.08760452270507812, 0.0912618637084961, 0.09491920471191406, 0.09857654571533203, 0.10223388671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 16.0, 38.0, 78.0, 122.0, 158.0, 188.0, 161.0, 95.0, 72.0, 30.0, 16.0, 9.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9050458669662476, -0.878834068775177, -0.8526222705841064, -0.8264104723930359, -0.8001986742019653, -0.77398681640625, -0.7477750182151794, -0.7215632200241089, -0.6953514218330383, -0.6691396236419678, -0.6429278254508972, -0.6167160272598267, -0.5905041694641113, -0.5642924308776855, -0.5380805730819702, -0.5118687748908997, -0.4856569766998291, -0.45944517850875854, -0.433233380317688, -0.40702155232429504, -0.3808097541332245, -0.35459795594215393, -0.328386127948761, -0.30217432975769043, -0.2759625315666199, -0.24975073337554932, -0.22353892028331757, -0.19732710719108582, -0.17111530900001526, -0.1449035108089447, -0.11869169771671295, -0.0924798846244812, -0.06626814603805542, -0.040056340396404266, -0.013844534754753113, 0.01236727088689804, 0.038579076528549194, 0.06479087471961975, 0.0910026878118515, 0.11721450090408325, 0.1434262990951538, 0.16963809728622437, 0.19584991037845612, 0.22206172347068787, 0.24827352166175842, 0.274485319852829, 0.3006971478462219, 0.3269089460372925, 0.35312074422836304, 0.3793325424194336, 0.40554434061050415, 0.4317561686038971, 0.45796796679496765, 0.4841797649860382, 0.5103915929794312, 0.5366033911705017, 0.5628151893615723, 0.5890269875526428, 0.6152387857437134, 0.6414505839347839, 0.6676623821258545, 0.6938742399215698, 0.7200860381126404, 0.7462978363037109, 0.7725096344947815]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 11.0, 7.0, 10.0, 14.0, 24.0, 16.0, 18.0, 23.0, 29.0, 27.0, 32.0, 47.0, 40.0, 41.0, 61.0, 47.0, 33.0, 40.0, 38.0, 53.0, 54.0, 35.0, 48.0, 33.0, 30.0, 34.0, 25.0, 21.0, 28.0, 16.0, 16.0, 11.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.37412774562835693, -0.36378976702690125, -0.35345175862312317, -0.3431137800216675, -0.3327757716178894, -0.3224377930164337, -0.31209978461265564, -0.30176180601119995, -0.2914237976074219, -0.2810858190059662, -0.2707478106021881, -0.2604098320007324, -0.25007182359695435, -0.23973384499549866, -0.22939585149288177, -0.2190578579902649, -0.2087198793888092, -0.19838188588619232, -0.18804389238357544, -0.17770589888095856, -0.16736790537834167, -0.157029926776886, -0.1466919332742691, -0.13635393977165222, -0.12601594626903534, -0.11567795276641846, -0.10533995926380157, -0.09500197321176529, -0.08466397970914841, -0.07432598620653152, -0.06398800015449524, -0.05365000665187836, -0.043312013149261475, -0.03297401964664459, -0.02263602986931801, -0.012298038229346275, -0.0019600465893745422, 0.00837794691324234, 0.018715936690568924, 0.029053926467895508, 0.03939191997051239, 0.04972991347312927, 0.060067903250455856, 0.07040589302778244, 0.08074388653039932, 0.0910818800330162, 0.10141986608505249, 0.11175785958766937, 0.12209585309028625, 0.13243384659290314, 0.14277184009552002, 0.1531098335981369, 0.16344782710075378, 0.17378580570220947, 0.18412379920482635, 0.19446179270744324, 0.20479978621006012, 0.215137779712677, 0.22547577321529388, 0.23581376671791077, 0.24615174531936646, 0.25648975372314453, 0.2668277323246002, 0.2771657109260559, 0.287503719329834]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 8.0, 12.0, 16.0, 19.0, 31.0, 45.0, 68.0, 70.0, 100.0, 163.0, 208.0, 338.0, 494.0, 759.0, 1415.0, 2609.0, 6048.0, 18030.0, 69424.0, 308558.0, 463738.0, 128898.0, 29919.0, 9258.0, 3568.0, 1824.0, 1045.0, 621.0, 348.0, 253.0, 178.0, 125.0, 83.0, 81.0, 38.0, 32.0, 18.0, 24.0, 11.0, 9.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18650245666503906, -0.17988967895507812, -0.1732769012451172, -0.16666412353515625, -0.1600513458251953, -0.15343856811523438, -0.14682579040527344, -0.1402130126953125, -0.13360023498535156, -0.12698745727539062, -0.12037467956542969, -0.11376190185546875, -0.10714912414550781, -0.10053634643554688, -0.09392356872558594, -0.087310791015625, -0.08069801330566406, -0.07408523559570312, -0.06747245788574219, -0.06085968017578125, -0.05424690246582031, -0.047634124755859375, -0.04102134704589844, -0.0344085693359375, -0.027795791625976562, -0.021183013916015625, -0.014570236206054688, -0.00795745849609375, -0.0013446807861328125, 0.005268096923828125, 0.011880874633789062, 0.01849365234375, 0.025106430053710938, 0.031719207763671875, 0.03833198547363281, 0.04494476318359375, 0.05155754089355469, 0.058170318603515625, 0.06478309631347656, 0.0713958740234375, 0.07800865173339844, 0.08462142944335938, 0.09123420715332031, 0.09784698486328125, 0.10445976257324219, 0.11107254028320312, 0.11768531799316406, 0.124298095703125, 0.13091087341308594, 0.13752365112304688, 0.1441364288330078, 0.15074920654296875, 0.1573619842529297, 0.16397476196289062, 0.17058753967285156, 0.1772003173828125, 0.18381309509277344, 0.19042587280273438, 0.1970386505126953, 0.20365142822265625, 0.2102642059326172, 0.21687698364257812, 0.22348976135253906, 0.2301025390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 9.0, 7.0, 9.0, 15.0, 16.0, 20.0, 16.0, 22.0, 29.0, 36.0, 41.0, 44.0, 55.0, 47.0, 54.0, 55.0, 76.0, 48.0, 56.0, 55.0, 32.0, 41.0, 28.0, 35.0, 36.0, 20.0, 20.0, 27.0, 8.0, 5.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12804889678955078, -0.12426185607910156, -0.12047481536865234, -0.11668777465820312, -0.1129007339477539, -0.10911369323730469, -0.10532665252685547, -0.10153961181640625, -0.09775257110595703, -0.09396553039550781, -0.0901784896850586, -0.08639144897460938, -0.08260440826416016, -0.07881736755371094, -0.07503032684326172, -0.0712432861328125, -0.06745624542236328, -0.06366920471191406, -0.059882164001464844, -0.056095123291015625, -0.052308082580566406, -0.04852104187011719, -0.04473400115966797, -0.04094696044921875, -0.03715991973876953, -0.03337287902832031, -0.029585838317871094, -0.025798797607421875, -0.022011756896972656, -0.018224716186523438, -0.014437675476074219, -0.010650634765625, -0.006863594055175781, -0.0030765533447265625, 0.0007104873657226562, 0.004497528076171875, 0.008284568786621094, 0.012071609497070312, 0.01585865020751953, 0.01964569091796875, 0.02343273162841797, 0.027219772338867188, 0.031006813049316406, 0.034793853759765625, 0.038580894470214844, 0.04236793518066406, 0.04615497589111328, 0.0499420166015625, 0.05372905731201172, 0.05751609802246094, 0.061303138732910156, 0.06509017944335938, 0.0688772201538086, 0.07266426086425781, 0.07645130157470703, 0.08023834228515625, 0.08402538299560547, 0.08781242370605469, 0.0915994644165039, 0.09538650512695312, 0.09917354583740234, 0.10296058654785156, 0.10674762725830078, 0.11053466796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 3.0, 9.0, 12.0, 11.0, 13.0, 13.0, 16.0, 25.0, 30.0, 57.0, 97.0, 202.0, 453.0, 1111.0, 3128.0, 9656.0, 32141.0, 106313.0, 279569.0, 356968.0, 176349.0, 57390.0, 16697.0, 5117.0, 1785.0, 697.0, 292.0, 135.0, 71.0, 49.0, 32.0, 22.0, 22.0, 7.0, 10.0, 17.0, 4.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16057395935058594, -0.15574264526367188, -0.1509113311767578, -0.14608001708984375, -0.1412487030029297, -0.13641738891601562, -0.13158607482910156, -0.1267547607421875, -0.12192344665527344, -0.11709213256835938, -0.11226081848144531, -0.10742950439453125, -0.10259819030761719, -0.09776687622070312, -0.09293556213378906, -0.088104248046875, -0.08327293395996094, -0.07844161987304688, -0.07361030578613281, -0.06877899169921875, -0.06394767761230469, -0.059116363525390625, -0.05428504943847656, -0.0494537353515625, -0.04462242126464844, -0.039791107177734375, -0.03495979309082031, -0.03012847900390625, -0.025297164916992188, -0.020465850830078125, -0.015634536743164062, -0.01080322265625, -0.0059719085693359375, -0.001140594482421875, 0.0036907196044921875, 0.00852203369140625, 0.013353347778320312, 0.018184661865234375, 0.023015975952148438, 0.0278472900390625, 0.03267860412597656, 0.037509918212890625, 0.04234123229980469, 0.04717254638671875, 0.05200386047363281, 0.056835174560546875, 0.06166648864746094, 0.066497802734375, 0.07132911682128906, 0.07616043090820312, 0.08099174499511719, 0.08582305908203125, 0.09065437316894531, 0.09548568725585938, 0.10031700134277344, 0.1051483154296875, 0.10997962951660156, 0.11481094360351562, 0.11964225769042969, 0.12447357177734375, 0.1293048858642578, 0.13413619995117188, 0.13896751403808594, 0.143798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 4.0, 9.0, 7.0, 10.0, 19.0, 30.0, 18.0, 29.0, 30.0, 25.0, 29.0, 33.0, 35.0, 41.0, 43.0, 49.0, 48.0, 49.0, 48.0, 49.0, 44.0, 51.0, 43.0, 29.0, 39.0, 22.0, 21.0, 21.0, 17.0, 13.0, 16.0, 12.0, 11.0, 12.0, 7.0, 7.0, 5.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23122215270996094, -0.22257614135742188, -0.2139301300048828, -0.20528411865234375, -0.1966381072998047, -0.18799209594726562, -0.17934608459472656, -0.1707000732421875, -0.16205406188964844, -0.15340805053710938, -0.1447620391845703, -0.13611602783203125, -0.1274700164794922, -0.11882400512695312, -0.11017799377441406, -0.101531982421875, -0.09288597106933594, -0.08423995971679688, -0.07559394836425781, -0.06694793701171875, -0.05830192565917969, -0.049655914306640625, -0.04100990295410156, -0.0323638916015625, -0.023717880249023438, -0.015071868896484375, -0.0064258575439453125, 0.00222015380859375, 0.010866165161132812, 0.019512176513671875, 0.028158187866210938, 0.03680419921875, 0.04545021057128906, 0.054096221923828125, 0.06274223327636719, 0.07138824462890625, 0.08003425598144531, 0.08868026733398438, 0.09732627868652344, 0.1059722900390625, 0.11461830139160156, 0.12326431274414062, 0.1319103240966797, 0.14055633544921875, 0.1492023468017578, 0.15784835815429688, 0.16649436950683594, 0.175140380859375, 0.18378639221191406, 0.19243240356445312, 0.2010784149169922, 0.20972442626953125, 0.2183704376220703, 0.22701644897460938, 0.23566246032714844, 0.2443084716796875, 0.25295448303222656, 0.2616004943847656, 0.2702465057373047, 0.27889251708984375, 0.2875385284423828, 0.2961845397949219, 0.30483055114746094, 0.3134765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 10.0, 10.0, 16.0, 14.0, 11.0, 18.0, 29.0, 59.0, 81.0, 112.0, 195.0, 304.0, 596.0, 1166.0, 2346.0, 5538.0, 15200.0, 52924.0, 212126.0, 459851.0, 217488.0, 54059.0, 15599.0, 5624.0, 2440.0, 1174.0, 630.0, 319.0, 197.0, 139.0, 94.0, 48.0, 34.0, 18.0, 23.0, 8.0, 12.0, 10.0, 3.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07391357421875, -0.0716400146484375, -0.069366455078125, -0.0670928955078125, -0.0648193359375, -0.0625457763671875, -0.060272216796875, -0.0579986572265625, -0.05572509765625, -0.0534515380859375, -0.051177978515625, -0.0489044189453125, -0.046630859375, -0.0443572998046875, -0.042083740234375, -0.0398101806640625, -0.03753662109375, -0.0352630615234375, -0.032989501953125, -0.0307159423828125, -0.0284423828125, -0.0261688232421875, -0.023895263671875, -0.0216217041015625, -0.01934814453125, -0.0170745849609375, -0.014801025390625, -0.0125274658203125, -0.01025390625, -0.0079803466796875, -0.005706787109375, -0.0034332275390625, -0.00115966796875, 0.0011138916015625, 0.003387451171875, 0.0056610107421875, 0.0079345703125, 0.0102081298828125, 0.012481689453125, 0.0147552490234375, 0.01702880859375, 0.0193023681640625, 0.021575927734375, 0.0238494873046875, 0.026123046875, 0.0283966064453125, 0.030670166015625, 0.0329437255859375, 0.03521728515625, 0.0374908447265625, 0.039764404296875, 0.0420379638671875, 0.0443115234375, 0.0465850830078125, 0.048858642578125, 0.0511322021484375, 0.05340576171875, 0.0556793212890625, 0.057952880859375, 0.0602264404296875, 0.0625, 0.0647735595703125, 0.067047119140625, 0.0693206787109375, 0.07159423828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 11.0, 17.0, 12.0, 21.0, 16.0, 33.0, 47.0, 48.0, 40.0, 60.0, 66.0, 65.0, 73.0, 48.0, 68.0, 57.0, 65.0, 39.0, 35.0, 35.0, 24.0, 14.0, 16.0, 23.0, 16.0, 14.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.046627044677734e-06, -7.821246981620789e-06, -7.595866918563843e-06, -7.370486855506897e-06, -7.145106792449951e-06, -6.919726729393005e-06, -6.6943466663360596e-06, -6.468966603279114e-06, -6.243586540222168e-06, -6.018206477165222e-06, -5.792826414108276e-06, -5.5674463510513306e-06, -5.342066287994385e-06, -5.116686224937439e-06, -4.891306161880493e-06, -4.665926098823547e-06, -4.4405460357666016e-06, -4.215165972709656e-06, -3.98978590965271e-06, -3.764405846595764e-06, -3.5390257835388184e-06, -3.3136457204818726e-06, -3.0882656574249268e-06, -2.862885594367981e-06, -2.637505531311035e-06, -2.4121254682540894e-06, -2.1867454051971436e-06, -1.9613653421401978e-06, -1.735985279083252e-06, -1.5106052160263062e-06, -1.2852251529693604e-06, -1.0598450899124146e-06, -8.344650268554688e-07, -6.09084963798523e-07, -3.8370490074157715e-07, -1.5832483768463135e-07, 6.705522537231445e-08, 2.9243528842926025e-07, 5.178153514862061e-07, 7.431954145431519e-07, 9.685754776000977e-07, 1.1939555406570435e-06, 1.4193356037139893e-06, 1.644715666770935e-06, 1.8700957298278809e-06, 2.0954757928848267e-06, 2.3208558559417725e-06, 2.5462359189987183e-06, 2.771615982055664e-06, 2.99699604511261e-06, 3.2223761081695557e-06, 3.4477561712265015e-06, 3.6731362342834473e-06, 3.898516297340393e-06, 4.123896360397339e-06, 4.349276423454285e-06, 4.5746564865112305e-06, 4.800036549568176e-06, 5.025416612625122e-06, 5.250796675682068e-06, 5.476176738739014e-06, 5.7015568017959595e-06, 5.926936864852905e-06, 6.152316927909851e-06, 6.377696990966797e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 20.0, 12.0, 35.0, 40.0, 44.0, 80.0, 143.0, 234.0, 382.0, 724.0, 1413.0, 3079.0, 7777.0, 22614.0, 80988.0, 307167.0, 425935.0, 141203.0, 36335.0, 11747.0, 4451.0, 1979.0, 916.0, 509.0, 289.0, 183.0, 86.0, 52.0, 33.0, 19.0, 20.0, 12.0, 8.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08306884765625, -0.08063983917236328, -0.07821083068847656, -0.07578182220458984, -0.07335281372070312, -0.0709238052368164, -0.06849479675292969, -0.06606578826904297, -0.06363677978515625, -0.06120777130126953, -0.05877876281738281, -0.056349754333496094, -0.053920745849609375, -0.051491737365722656, -0.04906272888183594, -0.04663372039794922, -0.0442047119140625, -0.04177570343017578, -0.03934669494628906, -0.036917686462402344, -0.034488677978515625, -0.032059669494628906, -0.029630661010742188, -0.02720165252685547, -0.02477264404296875, -0.02234363555908203, -0.019914627075195312, -0.017485618591308594, -0.015056610107421875, -0.012627601623535156, -0.010198593139648438, -0.007769584655761719, -0.005340576171875, -0.0029115676879882812, -0.0004825592041015625, 0.0019464492797851562, 0.004375457763671875, 0.006804466247558594, 0.009233474731445312, 0.011662483215332031, 0.01409149169921875, 0.01652050018310547, 0.018949508666992188, 0.021378517150878906, 0.023807525634765625, 0.026236534118652344, 0.028665542602539062, 0.03109455108642578, 0.0335235595703125, 0.03595256805419922, 0.03838157653808594, 0.040810585021972656, 0.043239593505859375, 0.045668601989746094, 0.04809761047363281, 0.05052661895751953, 0.05295562744140625, 0.05538463592529297, 0.05781364440917969, 0.060242652893066406, 0.06267166137695312, 0.06510066986083984, 0.06752967834472656, 0.06995868682861328, 0.0723876953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 14.0, 14.0, 13.0, 27.0, 28.0, 40.0, 41.0, 39.0, 71.0, 70.0, 64.0, 100.0, 75.0, 77.0, 64.0, 42.0, 46.0, 30.0, 29.0, 21.0, 16.0, 8.0, 8.0, 6.0, 4.0, 10.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.0656728744506836, -0.06359672546386719, -0.06152057647705078, -0.059444427490234375, -0.05736827850341797, -0.05529212951660156, -0.053215980529785156, -0.05113983154296875, -0.049063682556152344, -0.04698753356933594, -0.04491138458251953, -0.042835235595703125, -0.04075908660888672, -0.03868293762207031, -0.036606788635253906, -0.0345306396484375, -0.032454490661621094, -0.030378341674804688, -0.02830219268798828, -0.026226043701171875, -0.02414989471435547, -0.022073745727539062, -0.019997596740722656, -0.01792144775390625, -0.015845298767089844, -0.013769149780273438, -0.011693000793457031, -0.009616851806640625, -0.007540702819824219, -0.0054645538330078125, -0.0033884048461914062, -0.001312255859375, 0.0007638931274414062, 0.0028400421142578125, 0.004916191101074219, 0.006992340087890625, 0.009068489074707031, 0.011144638061523438, 0.013220787048339844, 0.01529693603515625, 0.017373085021972656, 0.019449234008789062, 0.02152538299560547, 0.023601531982421875, 0.02567768096923828, 0.027753829956054688, 0.029829978942871094, 0.0319061279296875, 0.033982276916503906, 0.03605842590332031, 0.03813457489013672, 0.040210723876953125, 0.04228687286376953, 0.04436302185058594, 0.046439170837402344, 0.04851531982421875, 0.050591468811035156, 0.05266761779785156, 0.05474376678466797, 0.056819915771484375, 0.05889606475830078, 0.06097221374511719, 0.0630483627319336, 0.06512451171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 15.0, 31.0, 78.0, 148.0, 219.0, 222.0, 155.0, 79.0, 30.0, 17.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7163475751876831, -0.6607193350791931, -0.6050910949707031, -0.5494627952575684, -0.49383458495140076, -0.43820634484291077, -0.3825780749320984, -0.3269498348236084, -0.2713215947151184, -0.21569335460662842, -0.16006509959697723, -0.10443684458732605, -0.04880860447883606, 0.006819635629653931, 0.06244790554046631, 0.1180761456489563, 0.1737043857574463, 0.22933262586593628, 0.28496086597442627, 0.34058913588523865, 0.39621737599372864, 0.45184561610221863, 0.507473886013031, 0.563102126121521, 0.618730366230011, 0.674358606338501, 0.729986846446991, 0.785615086555481, 0.8412433862686157, 0.8968715667724609, 0.9524998664855957, 1.0081281661987305, 1.0637564659118652, 1.119384765625, 1.1750129461288452, 1.23064124584198, 1.2862694263458252, 1.34189772605896, 1.3975260257720947, 1.45315420627594, 1.5087823867797852, 1.56441068649292, 1.6200388669967651, 1.6756671667099, 1.7312953472137451, 1.7869236469268799, 1.8425519466400146, 1.8981801271438599, 1.9538084268569946, 2.00943660736084, 2.0650649070739746, 2.1206932067871094, 2.176321506500244, 2.2319495677948, 2.2875778675079346, 2.3432061672210693, 2.398834466934204, 2.454462766647339, 2.5100910663604736, 2.5657191276550293, 2.621347427368164, 2.676975727081299, 2.7326040267944336, 2.7882323265075684, 2.843860387802124]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 10.0, 11.0, 13.0, 11.0, 19.0, 18.0, 18.0, 20.0, 31.0, 31.0, 31.0, 40.0, 30.0, 45.0, 31.0, 58.0, 47.0, 42.0, 33.0, 46.0, 46.0, 46.0, 38.0, 29.0, 42.0, 32.0, 27.0, 23.0, 17.0, 14.0, 15.0, 12.0, 12.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.2559125423431396, -1.2153220176696777, -1.1747313737869263, -1.1341408491134644, -1.0935503244400024, -1.0529597997665405, -1.012369155883789, -0.9717786312103271, -0.9311881065368652, -0.8905975222587585, -0.8500069975852966, -0.8094164133071899, -0.768825888633728, -0.7282353043556213, -0.6876447200775146, -0.6470541954040527, -0.606463611125946, -0.5658730268478394, -0.5252825021743774, -0.48469191789627075, -0.44410139322280884, -0.40351080894470215, -0.36292025446891785, -0.32232969999313354, -0.28173914551734924, -0.24114859104156494, -0.20055803656578064, -0.15996746718883514, -0.11937691271305084, -0.07878635823726654, -0.038195788860321045, 0.002394765615463257, 0.04298532009124756, 0.08357587456703186, 0.12416643649339676, 0.16475699841976166, 0.20534755289554596, 0.24593810737133026, 0.28652867674827576, 0.32711923122406006, 0.36770978569984436, 0.40830034017562866, 0.44889089465141296, 0.48948144912719727, 0.530072033405304, 0.5706625580787659, 0.6112531423568726, 0.6518436670303345, 0.6924342513084412, 0.7330248355865479, 0.7736153602600098, 0.8142059445381165, 0.8547964692115784, 0.8953870534896851, 0.935977578163147, 0.9765681624412537, 1.0171587467193604, 1.0577492713928223, 1.0983399152755737, 1.1389304399490356, 1.1795209646224976, 1.2201114892959595, 1.260702133178711, 1.3012926578521729, 1.3418831825256348]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 2.0, 6.0, 8.0, 5.0, 6.0, 14.0, 17.0, 16.0, 21.0, 32.0, 44.0, 57.0, 113.0, 239.0, 533.0, 1512.0, 5487.0, 28820.0, 415632.0, 3564301.0, 155508.0, 16689.0, 3376.0, 990.0, 383.0, 158.0, 74.0, 42.0, 36.0, 29.0, 24.0, 12.0, 18.0, 8.0, 14.0, 8.0, 6.0, 9.0, 1.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.6259765625, -0.6082687377929688, -0.5905609130859375, -0.5728530883789062, -0.555145263671875, -0.5374374389648438, -0.5197296142578125, -0.5020217895507812, -0.48431396484375, -0.46660614013671875, -0.4488983154296875, -0.43119049072265625, -0.413482666015625, -0.39577484130859375, -0.3780670166015625, -0.36035919189453125, -0.3426513671875, -0.32494354248046875, -0.3072357177734375, -0.28952789306640625, -0.271820068359375, -0.25411224365234375, -0.2364044189453125, -0.21869659423828125, -0.20098876953125, -0.18328094482421875, -0.1655731201171875, -0.14786529541015625, -0.130157470703125, -0.11244964599609375, -0.0947418212890625, -0.07703399658203125, -0.059326171875, -0.04161834716796875, -0.0239105224609375, -0.00620269775390625, 0.011505126953125, 0.02921295166015625, 0.0469207763671875, 0.06462860107421875, 0.08233642578125, 0.10004425048828125, 0.1177520751953125, 0.13545989990234375, 0.153167724609375, 0.17087554931640625, 0.1885833740234375, 0.20629119873046875, 0.2239990234375, 0.24170684814453125, 0.2594146728515625, 0.27712249755859375, 0.294830322265625, 0.31253814697265625, 0.3302459716796875, 0.34795379638671875, 0.36566162109375, 0.38336944580078125, 0.4010772705078125, 0.41878509521484375, 0.436492919921875, 0.45420074462890625, 0.4719085693359375, 0.48961639404296875, 0.50732421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 10.0, 9.0, 12.0, 16.0, 17.0, 18.0, 15.0, 29.0, 26.0, 38.0, 33.0, 36.0, 50.0, 51.0, 54.0, 61.0, 43.0, 41.0, 43.0, 34.0, 47.0, 41.0, 32.0, 40.0, 28.0, 32.0, 18.0, 14.0, 18.0, 9.0, 17.0, 12.0, 5.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.12469482421875, -0.12134075164794922, -0.11798667907714844, -0.11463260650634766, -0.11127853393554688, -0.1079244613647461, -0.10457038879394531, -0.10121631622314453, -0.09786224365234375, -0.09450817108154297, -0.09115409851074219, -0.0878000259399414, -0.08444595336914062, -0.08109188079833984, -0.07773780822753906, -0.07438373565673828, -0.0710296630859375, -0.06767559051513672, -0.06432151794433594, -0.060967445373535156, -0.057613372802734375, -0.054259300231933594, -0.05090522766113281, -0.04755115509033203, -0.04419708251953125, -0.04084300994873047, -0.03748893737792969, -0.034134864807128906, -0.030780792236328125, -0.027426719665527344, -0.024072647094726562, -0.02071857452392578, -0.017364501953125, -0.014010429382324219, -0.010656356811523438, -0.007302284240722656, -0.003948211669921875, -0.0005941390991210938, 0.0027599334716796875, 0.006114006042480469, 0.00946807861328125, 0.012822151184082031, 0.016176223754882812, 0.019530296325683594, 0.022884368896484375, 0.026238441467285156, 0.029592514038085938, 0.03294658660888672, 0.0363006591796875, 0.03965473175048828, 0.04300880432128906, 0.046362876892089844, 0.049716949462890625, 0.053071022033691406, 0.05642509460449219, 0.05977916717529297, 0.06313323974609375, 0.06648731231689453, 0.06984138488769531, 0.0731954574584961, 0.07654953002929688, 0.07990360260009766, 0.08325767517089844, 0.08661174774169922, 0.0899658203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 7.0, 23.0, 18.0, 35.0, 39.0, 93.0, 128.0, 223.0, 392.0, 757.0, 1545.0, 3039.0, 6858.0, 15832.0, 41137.0, 120240.0, 411574.0, 1532211.0, 1478753.0, 395509.0, 117425.0, 40013.0, 15728.0, 6516.0, 3091.0, 1499.0, 711.0, 353.0, 212.0, 105.0, 81.0, 39.0, 25.0, 20.0, 16.0, 10.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251953125, -0.2445392608642578, -0.23712539672851562, -0.22971153259277344, -0.22229766845703125, -0.21488380432128906, -0.20746994018554688, -0.2000560760498047, -0.1926422119140625, -0.1852283477783203, -0.17781448364257812, -0.17040061950683594, -0.16298675537109375, -0.15557289123535156, -0.14815902709960938, -0.1407451629638672, -0.133331298828125, -0.1259174346923828, -0.11850357055664062, -0.11108970642089844, -0.10367584228515625, -0.09626197814941406, -0.08884811401367188, -0.08143424987792969, -0.0740203857421875, -0.06660652160644531, -0.059192657470703125, -0.05177879333496094, -0.04436492919921875, -0.03695106506347656, -0.029537200927734375, -0.022123336791992188, -0.01470947265625, -0.0072956085205078125, 0.000118255615234375, 0.0075321197509765625, 0.01494598388671875, 0.022359848022460938, 0.029773712158203125, 0.03718757629394531, 0.0446014404296875, 0.05201530456542969, 0.059429168701171875, 0.06684303283691406, 0.07425689697265625, 0.08167076110839844, 0.08908462524414062, 0.09649848937988281, 0.103912353515625, 0.11132621765136719, 0.11874008178710938, 0.12615394592285156, 0.13356781005859375, 0.14098167419433594, 0.14839553833007812, 0.1558094024658203, 0.1632232666015625, 0.1706371307373047, 0.17805099487304688, 0.18546485900878906, 0.19287872314453125, 0.20029258728027344, 0.20770645141601562, 0.2151203155517578, 0.2225341796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 3.0, 6.0, 12.0, 13.0, 11.0, 19.0, 32.0, 35.0, 49.0, 90.0, 100.0, 139.0, 227.0, 258.0, 378.0, 503.0, 556.0, 497.0, 320.0, 213.0, 153.0, 133.0, 87.0, 58.0, 37.0, 31.0, 22.0, 19.0, 13.0, 14.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1646728515625, -0.1595745086669922, -0.15447616577148438, -0.14937782287597656, -0.14427947998046875, -0.13918113708496094, -0.13408279418945312, -0.1289844512939453, -0.1238861083984375, -0.11878776550292969, -0.11368942260742188, -0.10859107971191406, -0.10349273681640625, -0.09839439392089844, -0.09329605102539062, -0.08819770812988281, -0.083099365234375, -0.07800102233886719, -0.07290267944335938, -0.06780433654785156, -0.06270599365234375, -0.05760765075683594, -0.052509307861328125, -0.04741096496582031, -0.0423126220703125, -0.03721427917480469, -0.032115936279296875, -0.027017593383789062, -0.02191925048828125, -0.016820907592773438, -0.011722564697265625, -0.0066242218017578125, -0.00152587890625, 0.0035724639892578125, 0.008670806884765625, 0.013769149780273438, 0.01886749267578125, 0.023965835571289062, 0.029064178466796875, 0.03416252136230469, 0.0392608642578125, 0.04435920715332031, 0.049457550048828125, 0.05455589294433594, 0.05965423583984375, 0.06475257873535156, 0.06985092163085938, 0.07494926452636719, 0.080047607421875, 0.08514595031738281, 0.09024429321289062, 0.09534263610839844, 0.10044097900390625, 0.10553932189941406, 0.11063766479492188, 0.11573600769042969, 0.1208343505859375, 0.1259326934814453, 0.13103103637695312, 0.13612937927246094, 0.14122772216796875, 0.14632606506347656, 0.15142440795898438, 0.1565227508544922, 0.16162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 22.0, 68.0, 155.0, 256.0, 261.0, 140.0, 67.0, 21.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3985989093780518, -1.3351898193359375, -1.2717807292938232, -1.2083717584609985, -1.1449626684188843, -1.08155357837677, -1.0181446075439453, -0.954735517501831, -0.8913264274597168, -0.8279173374176025, -0.7645083069801331, -0.7010992765426636, -0.6376901865005493, -0.5742810964584351, -0.5108720660209656, -0.4474630057811737, -0.38405394554138184, -0.32064488530158997, -0.2572358250617981, -0.19382676482200623, -0.13041770458221436, -0.06700864434242249, -0.0035995841026306152, 0.059809476137161255, 0.12321853637695312, 0.186627596616745, 0.25003665685653687, 0.31344571709632874, 0.3768547773361206, 0.4402638375759125, 0.5036728978157043, 0.5670819282531738, 0.630490779876709, 0.6938998699188232, 0.7573089003562927, 0.8207179307937622, 0.8841270208358765, 0.9475361108779907, 1.0109450817108154, 1.0743541717529297, 1.137763261795044, 1.2011723518371582, 1.2645814418792725, 1.3279904127120972, 1.3913995027542114, 1.4548085927963257, 1.5182175636291504, 1.5816266536712646, 1.645035743713379, 1.7084448337554932, 1.7718539237976074, 1.8352628946304321, 1.8986719846725464, 1.9620810747146606, 2.0254900455474854, 2.0888991355895996, 2.152308225631714, 2.215717315673828, 2.2791264057159424, 2.3425354957580566, 2.405944347381592, 2.469353437423706, 2.5327625274658203, 2.5961716175079346, 2.659580707550049]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 9.0, 8.0, 8.0, 7.0, 18.0, 19.0, 25.0, 25.0, 32.0, 47.0, 47.0, 32.0, 60.0, 58.0, 55.0, 52.0, 53.0, 52.0, 62.0, 50.0, 36.0, 32.0, 45.0, 31.0, 21.0, 25.0, 23.0, 14.0, 10.0, 11.0, 4.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611383855342865, -0.5926598310470581, -0.573935866355896, -0.5552118420600891, -0.536487877368927, -0.5177638530731201, -0.499039888381958, -0.4803158640861511, -0.461591899394989, -0.4428679049015045, -0.42414391040802, -0.4054199159145355, -0.386695921421051, -0.36797192692756653, -0.34924793243408203, -0.33052390813827515, -0.31179991364479065, -0.29307591915130615, -0.27435192465782166, -0.25562793016433716, -0.23690393567085266, -0.21817994117736816, -0.19945593178272247, -0.18073193728923798, -0.16200794279575348, -0.14328394830226898, -0.12455995380878448, -0.10583595186471939, -0.0871119573712349, -0.0683879628777504, -0.0496639609336853, -0.030939966440200806, -0.012215971946716309, 0.006508024409413338, 0.025232020765542984, 0.04395601898431778, 0.06268001347780228, 0.08140400797128677, 0.10012800991535187, 0.11885200440883636, 0.13757599890232086, 0.15629999339580536, 0.17502398788928986, 0.19374799728393555, 0.21247199177742004, 0.23119598627090454, 0.24991998076438904, 0.26864397525787354, 0.28736796975135803, 0.30609196424484253, 0.324815958738327, 0.3435399532318115, 0.362263947725296, 0.3809879422187805, 0.3997119665145874, 0.4184359312057495, 0.4371599555015564, 0.4558839499950409, 0.4746079444885254, 0.4933319389820099, 0.5120559334754944, 0.5307799577713013, 0.5495039224624634, 0.5682279467582703, 0.5869519114494324]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 14.0, 17.0, 11.0, 29.0, 56.0, 67.0, 116.0, 174.0, 293.0, 498.0, 866.0, 1601.0, 3270.0, 6739.0, 14837.0, 34984.0, 86057.0, 204365.0, 323574.0, 212437.0, 90939.0, 37514.0, 15655.0, 7114.0, 3476.0, 1663.0, 887.0, 504.0, 272.0, 176.0, 110.0, 82.0, 49.0, 39.0, 22.0, 10.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19287109375, -0.1867542266845703, -0.18063735961914062, -0.17452049255371094, -0.16840362548828125, -0.16228675842285156, -0.15616989135742188, -0.1500530242919922, -0.1439361572265625, -0.1378192901611328, -0.13170242309570312, -0.12558555603027344, -0.11946868896484375, -0.11335182189941406, -0.10723495483398438, -0.10111808776855469, -0.095001220703125, -0.08888435363769531, -0.08276748657226562, -0.07665061950683594, -0.07053375244140625, -0.06441688537597656, -0.058300018310546875, -0.05218315124511719, -0.0460662841796875, -0.03994941711425781, -0.033832550048828125, -0.027715682983398438, -0.02159881591796875, -0.015481948852539062, -0.009365081787109375, -0.0032482147216796875, 0.00286865234375, 0.008985519409179688, 0.015102386474609375, 0.021219253540039062, 0.02733612060546875, 0.03345298767089844, 0.039569854736328125, 0.04568672180175781, 0.0518035888671875, 0.05792045593261719, 0.06403732299804688, 0.07015419006347656, 0.07627105712890625, 0.08238792419433594, 0.08850479125976562, 0.09462165832519531, 0.100738525390625, 0.10685539245605469, 0.11297225952148438, 0.11908912658691406, 0.12520599365234375, 0.13132286071777344, 0.13743972778320312, 0.1435565948486328, 0.1496734619140625, 0.1557903289794922, 0.16190719604492188, 0.16802406311035156, 0.17414093017578125, 0.18025779724121094, 0.18637466430664062, 0.1924915313720703, 0.1986083984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 3.0, 9.0, 17.0, 9.0, 16.0, 19.0, 22.0, 24.0, 26.0, 18.0, 36.0, 44.0, 36.0, 46.0, 49.0, 55.0, 45.0, 58.0, 50.0, 39.0, 40.0, 39.0, 38.0, 41.0, 38.0, 36.0, 21.0, 20.0, 20.0, 13.0, 7.0, 13.0, 9.0, 7.0, 9.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12249755859375, -0.11919498443603516, -0.11589241027832031, -0.11258983612060547, -0.10928726196289062, -0.10598468780517578, -0.10268211364746094, -0.0993795394897461, -0.09607696533203125, -0.0927743911743164, -0.08947181701660156, -0.08616924285888672, -0.08286666870117188, -0.07956409454345703, -0.07626152038574219, -0.07295894622802734, -0.0696563720703125, -0.06635379791259766, -0.06305122375488281, -0.05974864959716797, -0.056446075439453125, -0.05314350128173828, -0.04984092712402344, -0.046538352966308594, -0.04323577880859375, -0.039933204650878906, -0.03663063049316406, -0.03332805633544922, -0.030025482177734375, -0.02672290802001953, -0.023420333862304688, -0.020117759704589844, -0.016815185546875, -0.013512611389160156, -0.010210037231445312, -0.006907463073730469, -0.003604888916015625, -0.00030231475830078125, 0.0030002593994140625, 0.006302833557128906, 0.00960540771484375, 0.012907981872558594, 0.016210556030273438, 0.01951313018798828, 0.022815704345703125, 0.02611827850341797, 0.029420852661132812, 0.032723426818847656, 0.0360260009765625, 0.039328575134277344, 0.04263114929199219, 0.04593372344970703, 0.049236297607421875, 0.05253887176513672, 0.05584144592285156, 0.059144020080566406, 0.06244659423828125, 0.0657491683959961, 0.06905174255371094, 0.07235431671142578, 0.07565689086914062, 0.07895946502685547, 0.08226203918457031, 0.08556461334228516, 0.0888671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 13.0, 8.0, 11.0, 14.0, 11.0, 12.0, 26.0, 36.0, 28.0, 37.0, 60.0, 82.0, 183.0, 624.0, 7171.0, 252236.0, 761437.0, 24430.0, 1444.0, 224.0, 82.0, 55.0, 38.0, 44.0, 35.0, 35.0, 24.0, 16.0, 13.0, 20.0, 11.0, 15.0, 13.0, 14.0, 11.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1572265625, -1.1261138916015625, -1.095001220703125, -1.0638885498046875, -1.03277587890625, -1.0016632080078125, -0.970550537109375, -0.9394378662109375, -0.9083251953125, -0.8772125244140625, -0.846099853515625, -0.8149871826171875, -0.78387451171875, -0.7527618408203125, -0.721649169921875, -0.6905364990234375, -0.659423828125, -0.6283111572265625, -0.597198486328125, -0.5660858154296875, -0.53497314453125, -0.5038604736328125, -0.472747802734375, -0.4416351318359375, -0.4105224609375, -0.3794097900390625, -0.348297119140625, -0.3171844482421875, -0.28607177734375, -0.2549591064453125, -0.223846435546875, -0.1927337646484375, -0.16162109375, -0.1305084228515625, -0.099395751953125, -0.0682830810546875, -0.03717041015625, -0.0060577392578125, 0.025054931640625, 0.0561676025390625, 0.0872802734375, 0.1183929443359375, 0.149505615234375, 0.1806182861328125, 0.21173095703125, 0.2428436279296875, 0.273956298828125, 0.3050689697265625, 0.336181640625, 0.3672943115234375, 0.398406982421875, 0.4295196533203125, 0.46063232421875, 0.4917449951171875, 0.522857666015625, 0.5539703369140625, 0.5850830078125, 0.6161956787109375, 0.647308349609375, 0.6784210205078125, 0.70953369140625, 0.7406463623046875, 0.771759033203125, 0.8028717041015625, 0.833984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 1.0, 12.0, 2.0, 15.0, 9.0, 10.0, 14.0, 13.0, 18.0, 16.0, 37.0, 32.0, 29.0, 55.0, 34.0, 33.0, 40.0, 50.0, 51.0, 51.0, 42.0, 30.0, 49.0, 32.0, 30.0, 28.0, 38.0, 30.0, 33.0, 25.0, 18.0, 15.0, 19.0, 13.0, 13.0, 13.0, 13.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.249755859375, -0.24301910400390625, -0.2362823486328125, -0.22954559326171875, -0.222808837890625, -0.21607208251953125, -0.2093353271484375, -0.20259857177734375, -0.19586181640625, -0.18912506103515625, -0.1823883056640625, -0.17565155029296875, -0.168914794921875, -0.16217803955078125, -0.1554412841796875, -0.14870452880859375, -0.1419677734375, -0.13523101806640625, -0.1284942626953125, -0.12175750732421875, -0.115020751953125, -0.10828399658203125, -0.1015472412109375, -0.09481048583984375, -0.08807373046875, -0.08133697509765625, -0.0746002197265625, -0.06786346435546875, -0.061126708984375, -0.05438995361328125, -0.0476531982421875, -0.04091644287109375, -0.0341796875, -0.02744293212890625, -0.0207061767578125, -0.01396942138671875, -0.007232666015625, -0.00049591064453125, 0.0062408447265625, 0.01297760009765625, 0.01971435546875, 0.02645111083984375, 0.0331878662109375, 0.03992462158203125, 0.046661376953125, 0.05339813232421875, 0.0601348876953125, 0.06687164306640625, 0.0736083984375, 0.08034515380859375, 0.0870819091796875, 0.09381866455078125, 0.100555419921875, 0.10729217529296875, 0.1140289306640625, 0.12076568603515625, 0.12750244140625, 0.13423919677734375, 0.1409759521484375, 0.14771270751953125, 0.154449462890625, 0.16118621826171875, 0.1679229736328125, 0.17465972900390625, 0.181396484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 5.0, 12.0, 14.0, 21.0, 31.0, 63.0, 112.0, 148.0, 267.0, 524.0, 898.0, 1841.0, 3986.0, 8975.0, 23430.0, 70192.0, 236759.0, 427909.0, 184552.0, 55205.0, 19139.0, 7550.0, 3448.0, 1600.0, 784.0, 436.0, 263.0, 125.0, 86.0, 43.0, 46.0, 24.0, 16.0, 9.0, 9.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.15003204345703125, -0.1454010009765625, -0.14076995849609375, -0.136138916015625, -0.13150787353515625, -0.1268768310546875, -0.12224578857421875, -0.11761474609375, -0.11298370361328125, -0.1083526611328125, -0.10372161865234375, -0.099090576171875, -0.09445953369140625, -0.0898284912109375, -0.08519744873046875, -0.08056640625, -0.07593536376953125, -0.0713043212890625, -0.06667327880859375, -0.062042236328125, -0.05741119384765625, -0.0527801513671875, -0.04814910888671875, -0.04351806640625, -0.03888702392578125, -0.0342559814453125, -0.02962493896484375, -0.024993896484375, -0.02036285400390625, -0.0157318115234375, -0.01110076904296875, -0.0064697265625, -0.00183868408203125, 0.0027923583984375, 0.00742340087890625, 0.012054443359375, 0.01668548583984375, 0.0213165283203125, 0.02594757080078125, 0.03057861328125, 0.03520965576171875, 0.0398406982421875, 0.04447174072265625, 0.049102783203125, 0.05373382568359375, 0.0583648681640625, 0.06299591064453125, 0.067626953125, 0.07225799560546875, 0.0768890380859375, 0.08152008056640625, 0.086151123046875, 0.09078216552734375, 0.0954132080078125, 0.10004425048828125, 0.10467529296875, 0.10930633544921875, 0.1139373779296875, 0.11856842041015625, 0.123199462890625, 0.12783050537109375, 0.1324615478515625, 0.13709259033203125, 0.1417236328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 10.0, 16.0, 21.0, 23.0, 36.0, 47.0, 63.0, 75.0, 107.0, 112.0, 88.0, 89.0, 72.0, 65.0, 37.0, 33.0, 12.0, 15.0, 13.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.87847763299942e-05, -1.807883381843567e-05, -1.7372891306877136e-05, -1.6666948795318604e-05, -1.596100628376007e-05, -1.5255063772201538e-05, -1.4549121260643005e-05, -1.3843178749084473e-05, -1.313723623752594e-05, -1.2431293725967407e-05, -1.1725351214408875e-05, -1.1019408702850342e-05, -1.0313466191291809e-05, -9.607523679733276e-06, -8.901581168174744e-06, -8.195638656616211e-06, -7.489696145057678e-06, -6.7837536334991455e-06, -6.077811121940613e-06, -5.37186861038208e-06, -4.665926098823547e-06, -3.959983587265015e-06, -3.254041075706482e-06, -2.5480985641479492e-06, -1.8421560525894165e-06, -1.1362135410308838e-06, -4.302710294723511e-07, 2.7567148208618164e-07, 9.816139936447144e-07, 1.687556505203247e-06, 2.3934990167617798e-06, 3.0994415283203125e-06, 3.8053840398788452e-06, 4.511326551437378e-06, 5.217269062995911e-06, 5.923211574554443e-06, 6.629154086112976e-06, 7.335096597671509e-06, 8.041039109230042e-06, 8.746981620788574e-06, 9.452924132347107e-06, 1.015886664390564e-05, 1.0864809155464172e-05, 1.1570751667022705e-05, 1.2276694178581238e-05, 1.298263669013977e-05, 1.3688579201698303e-05, 1.4394521713256836e-05, 1.5100464224815369e-05, 1.58064067363739e-05, 1.6512349247932434e-05, 1.7218291759490967e-05, 1.79242342710495e-05, 1.8630176782608032e-05, 1.9336119294166565e-05, 2.0042061805725098e-05, 2.074800431728363e-05, 2.1453946828842163e-05, 2.2159889340400696e-05, 2.286583185195923e-05, 2.357177436351776e-05, 2.4277716875076294e-05, 2.4983659386634827e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 7.0, 11.0, 6.0, 5.0, 9.0, 13.0, 20.0, 24.0, 33.0, 65.0, 158.0, 732.0, 6684.0, 153239.0, 835993.0, 47746.0, 3047.0, 421.0, 108.0, 63.0, 44.0, 26.0, 21.0, 14.0, 11.0, 20.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.414306640625, -0.4034996032714844, -0.39269256591796875, -0.3818855285644531, -0.3710784912109375, -0.3602714538574219, -0.34946441650390625, -0.3386573791503906, -0.327850341796875, -0.3170433044433594, -0.30623626708984375, -0.2954292297363281, -0.2846221923828125, -0.2738151550292969, -0.26300811767578125, -0.2522010803222656, -0.24139404296875, -0.23058700561523438, -0.21977996826171875, -0.20897293090820312, -0.1981658935546875, -0.18735885620117188, -0.17655181884765625, -0.16574478149414062, -0.154937744140625, -0.14413070678710938, -0.13332366943359375, -0.12251663208007812, -0.1117095947265625, -0.10090255737304688, -0.09009552001953125, -0.07928848266601562, -0.0684814453125, -0.057674407958984375, -0.04686737060546875, -0.036060333251953125, -0.0252532958984375, -0.014446258544921875, -0.00363922119140625, 0.007167816162109375, 0.017974853515625, 0.028781890869140625, 0.03958892822265625, 0.050395965576171875, 0.0612030029296875, 0.07201004028320312, 0.08281707763671875, 0.09362411499023438, 0.10443115234375, 0.11523818969726562, 0.12604522705078125, 0.13685226440429688, 0.1476593017578125, 0.15846633911132812, 0.16927337646484375, 0.18008041381835938, 0.190887451171875, 0.20169448852539062, 0.21250152587890625, 0.22330856323242188, 0.2341156005859375, 0.24492263793945312, 0.25572967529296875, 0.2665367126464844, 0.27734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 10.0, 8.0, 5.0, 11.0, 6.0, 23.0, 22.0, 23.0, 41.0, 59.0, 42.0, 65.0, 80.0, 83.0, 74.0, 106.0, 63.0, 50.0, 41.0, 49.0, 28.0, 22.0, 18.0, 12.0, 19.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.08514404296875, -0.0829463005065918, -0.0807485580444336, -0.07855081558227539, -0.07635307312011719, -0.07415533065795898, -0.07195758819580078, -0.06975984573364258, -0.06756210327148438, -0.06536436080932617, -0.06316661834716797, -0.060968875885009766, -0.05877113342285156, -0.05657339096069336, -0.054375648498535156, -0.05217790603637695, -0.04998016357421875, -0.04778242111206055, -0.045584678649902344, -0.04338693618774414, -0.04118919372558594, -0.038991451263427734, -0.03679370880126953, -0.03459596633911133, -0.032398223876953125, -0.030200481414794922, -0.02800273895263672, -0.025804996490478516, -0.023607254028320312, -0.02140951156616211, -0.019211769104003906, -0.017014026641845703, -0.0148162841796875, -0.012618541717529297, -0.010420799255371094, -0.00822305679321289, -0.0060253143310546875, -0.0038275718688964844, -0.0016298294067382812, 0.0005679130554199219, 0.002765655517578125, 0.004963397979736328, 0.007161140441894531, 0.009358882904052734, 0.011556625366210938, 0.01375436782836914, 0.015952110290527344, 0.018149852752685547, 0.02034759521484375, 0.022545337677001953, 0.024743080139160156, 0.02694082260131836, 0.029138565063476562, 0.031336307525634766, 0.03353404998779297, 0.03573179244995117, 0.037929534912109375, 0.04012727737426758, 0.04232501983642578, 0.044522762298583984, 0.04672050476074219, 0.04891824722290039, 0.051115989685058594, 0.0533137321472168, 0.055511474609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 15.0, 169.0, 752.0, 75.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0834548473358154, -0.8841234445571899, -0.6847920417785645, -0.48546063899993896, -0.2861292362213135, -0.08679783344268799, 0.1125335693359375, 0.311864972114563, 0.5111963748931885, 0.710527777671814, 0.9098591804504395, 1.109190583229065, 1.3085219860076904, 1.507853388786316, 1.7071847915649414, 1.906516194343567, 2.1058475971221924, 2.3051791191101074, 2.5045104026794434, 2.7038416862487793, 2.9031732082366943, 3.1025047302246094, 3.3018360137939453, 3.5011672973632812, 3.7004988193511963, 3.8998303413391113, 4.099161624908447, 4.298492908477783, 4.497824668884277, 4.697155952453613, 4.896487236022949, 5.095818519592285, 5.295149803161621, 5.494481086730957, 5.693812370300293, 5.893144130706787, 6.092475414276123, 6.291806697845459, 6.491138458251953, 6.690469741821289, 6.889801025390625, 7.089132308959961, 7.288463592529297, 7.487795352935791, 7.687126636505127, 7.886457920074463, 8.085789680480957, 8.285120964050293, 8.484452247619629, 8.683783531188965, 8.8831148147583, 9.082446098327637, 9.281778335571289, 9.481109619140625, 9.680440902709961, 9.879772186279297, 10.079103469848633, 10.278434753417969, 10.477766036987305, 10.67709732055664, 10.876428604125977, 11.075760841369629, 11.275092124938965, 11.4744234085083, 11.673754692077637]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 6.0, 10.0, 10.0, 12.0, 14.0, 26.0, 27.0, 24.0, 21.0, 31.0, 29.0, 44.0, 40.0, 33.0, 50.0, 47.0, 32.0, 55.0, 30.0, 47.0, 40.0, 42.0, 33.0, 37.0, 34.0, 25.0, 22.0, 26.0, 21.0, 17.0, 19.0, 14.0, 9.0, 11.0, 3.0, 6.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8769701719284058, -0.8489359021186829, -0.8209016919136047, -0.7928674221038818, -0.7648331522941589, -0.736798882484436, -0.7087646722793579, -0.680730402469635, -0.6526961326599121, -0.6246618628501892, -0.5966276526451111, -0.5685933828353882, -0.5405591130256653, -0.5125248432159424, -0.48449063301086426, -0.45645636320114136, -0.42842215299606323, -0.4003879129886627, -0.3723536431789398, -0.3443194031715393, -0.3162851333618164, -0.2882508933544159, -0.2602166533470154, -0.23218239843845367, -0.20414814352989197, -0.17611388862133026, -0.14807963371276855, -0.12004539370536804, -0.09201113879680634, -0.06397688388824463, -0.035942643880844116, -0.00790838897228241, 0.020125925540924072, 0.04816017672419548, 0.07619442790746689, 0.104228675365448, 0.1322629302740097, 0.1602971851825714, 0.18833142518997192, 0.21636568009853363, 0.24439993500709534, 0.27243417501449585, 0.30046844482421875, 0.32850268483161926, 0.3565369248390198, 0.3845711946487427, 0.4126054346561432, 0.4406396746635437, 0.4686739444732666, 0.4967081844806671, 0.5247424244880676, 0.5527766942977905, 0.5808109641075134, 0.6088452339172363, 0.6368794441223145, 0.6649137139320374, 0.6929479837417603, 0.7209822535514832, 0.7490164637565613, 0.7770507335662842, 0.8050850033760071, 0.83311927318573, 0.8611534833908081, 0.889187753200531, 0.9172219634056091]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 9.0, 5.0, 9.0, 12.0, 21.0, 22.0, 41.0, 40.0, 67.0, 102.0, 135.0, 256.0, 396.0, 632.0, 1232.0, 2245.0, 4588.0, 10214.0, 24890.0, 68859.0, 241632.0, 1391338.0, 1968226.0, 338071.0, 88808.0, 30142.0, 11807.0, 5209.0, 2392.0, 1165.0, 675.0, 359.0, 229.0, 153.0, 101.0, 57.0, 38.0, 41.0, 17.0, 16.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.295166015625, -0.28721046447753906, -0.2792549133300781, -0.2712993621826172, -0.26334381103515625, -0.2553882598876953, -0.24743270874023438, -0.23947715759277344, -0.2315216064453125, -0.22356605529785156, -0.21561050415039062, -0.2076549530029297, -0.19969940185546875, -0.1917438507080078, -0.18378829956054688, -0.17583274841308594, -0.167877197265625, -0.15992164611816406, -0.15196609497070312, -0.1440105438232422, -0.13605499267578125, -0.1280994415283203, -0.12014389038085938, -0.11218833923339844, -0.1042327880859375, -0.09627723693847656, -0.08832168579101562, -0.08036613464355469, -0.07241058349609375, -0.06445503234863281, -0.056499481201171875, -0.04854393005371094, -0.04058837890625, -0.03263282775878906, -0.024677276611328125, -0.016721725463867188, -0.00876617431640625, -0.0008106231689453125, 0.007144927978515625, 0.015100479125976562, 0.0230560302734375, 0.031011581420898438, 0.038967132568359375, 0.04692268371582031, 0.05487823486328125, 0.06283378601074219, 0.07078933715820312, 0.07874488830566406, 0.086700439453125, 0.09465599060058594, 0.10261154174804688, 0.11056709289550781, 0.11852264404296875, 0.1264781951904297, 0.13443374633789062, 0.14238929748535156, 0.1503448486328125, 0.15830039978027344, 0.16625595092773438, 0.1742115020751953, 0.18216705322265625, 0.1901226043701172, 0.19807815551757812, 0.20603370666503906, 0.2139892578125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 6.0, 4.0, 10.0, 8.0, 9.0, 13.0, 13.0, 15.0, 25.0, 29.0, 28.0, 35.0, 33.0, 44.0, 43.0, 57.0, 59.0, 47.0, 60.0, 43.0, 43.0, 57.0, 39.0, 42.0, 40.0, 33.0, 25.0, 29.0, 23.0, 14.0, 20.0, 11.0, 9.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.14208984375, -0.13835620880126953, -0.13462257385253906, -0.1308889389038086, -0.12715530395507812, -0.12342166900634766, -0.11968803405761719, -0.11595439910888672, -0.11222076416015625, -0.10848712921142578, -0.10475349426269531, -0.10101985931396484, -0.09728622436523438, -0.0935525894165039, -0.08981895446777344, -0.08608531951904297, -0.0823516845703125, -0.07861804962158203, -0.07488441467285156, -0.0711507797241211, -0.06741714477539062, -0.06368350982666016, -0.05994987487792969, -0.05621623992919922, -0.05248260498046875, -0.04874897003173828, -0.04501533508300781, -0.041281700134277344, -0.037548065185546875, -0.033814430236816406, -0.030080795288085938, -0.02634716033935547, -0.022613525390625, -0.01887989044189453, -0.015146255493164062, -0.011412620544433594, -0.007678985595703125, -0.003945350646972656, -0.0002117156982421875, 0.0035219192504882812, 0.00725555419921875, 0.010989189147949219, 0.014722824096679688, 0.018456459045410156, 0.022190093994140625, 0.025923728942871094, 0.029657363891601562, 0.03339099884033203, 0.0371246337890625, 0.04085826873779297, 0.04459190368652344, 0.048325538635253906, 0.052059173583984375, 0.055792808532714844, 0.05952644348144531, 0.06326007843017578, 0.06699371337890625, 0.07072734832763672, 0.07446098327636719, 0.07819461822509766, 0.08192825317382812, 0.0856618881225586, 0.08939552307128906, 0.09312915802001953, 0.09686279296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 2.0, 6.0, 12.0, 12.0, 33.0, 51.0, 76.0, 166.0, 327.0, 886.0, 3071.0, 16364.0, 123553.0, 1209425.0, 2517439.0, 281468.0, 33595.0, 5546.0, 1366.0, 473.0, 182.0, 95.0, 50.0, 35.0, 24.0, 16.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5436553955078125, -0.526763916015625, -0.5098724365234375, -0.49298095703125, -0.4760894775390625, -0.459197998046875, -0.4423065185546875, -0.4254150390625, -0.4085235595703125, -0.391632080078125, -0.3747406005859375, -0.35784912109375, -0.3409576416015625, -0.324066162109375, -0.3071746826171875, -0.290283203125, -0.2733917236328125, -0.256500244140625, -0.2396087646484375, -0.22271728515625, -0.2058258056640625, -0.188934326171875, -0.1720428466796875, -0.1551513671875, -0.1382598876953125, -0.121368408203125, -0.1044769287109375, -0.08758544921875, -0.0706939697265625, -0.053802490234375, -0.0369110107421875, -0.02001953125, -0.0031280517578125, 0.013763427734375, 0.0306549072265625, 0.04754638671875, 0.0644378662109375, 0.081329345703125, 0.0982208251953125, 0.1151123046875, 0.1320037841796875, 0.148895263671875, 0.1657867431640625, 0.18267822265625, 0.1995697021484375, 0.216461181640625, 0.2333526611328125, 0.250244140625, 0.2671356201171875, 0.284027099609375, 0.3009185791015625, 0.31781005859375, 0.3347015380859375, 0.351593017578125, 0.3684844970703125, 0.3853759765625, 0.4022674560546875, 0.419158935546875, 0.4360504150390625, 0.45294189453125, 0.4698333740234375, 0.486724853515625, 0.5036163330078125, 0.5205078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 15.0, 24.0, 41.0, 63.0, 104.0, 164.0, 237.0, 378.0, 551.0, 821.0, 614.0, 379.0, 259.0, 142.0, 86.0, 60.0, 52.0, 19.0, 13.0, 10.0, 5.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17276763916015625, -0.1634063720703125, -0.15404510498046875, -0.144683837890625, -0.13532257080078125, -0.1259613037109375, -0.11660003662109375, -0.10723876953125, -0.09787750244140625, -0.0885162353515625, -0.07915496826171875, -0.069793701171875, -0.06043243408203125, -0.0510711669921875, -0.04170989990234375, -0.0323486328125, -0.02298736572265625, -0.0136260986328125, -0.00426483154296875, 0.005096435546875, 0.01445770263671875, 0.0238189697265625, 0.03318023681640625, 0.04254150390625, 0.05190277099609375, 0.0612640380859375, 0.07062530517578125, 0.079986572265625, 0.08934783935546875, 0.0987091064453125, 0.10807037353515625, 0.117431640625, 0.12679290771484375, 0.1361541748046875, 0.14551544189453125, 0.154876708984375, 0.16423797607421875, 0.1735992431640625, 0.18296051025390625, 0.19232177734375, 0.20168304443359375, 0.2110443115234375, 0.22040557861328125, 0.229766845703125, 0.23912811279296875, 0.2484893798828125, 0.25785064697265625, 0.2672119140625, 0.27657318115234375, 0.2859344482421875, 0.29529571533203125, 0.304656982421875, 0.31401824951171875, 0.3233795166015625, 0.33274078369140625, 0.34210205078125, 0.35146331787109375, 0.3608245849609375, 0.37018585205078125, 0.379547119140625, 0.38890838623046875, 0.3982696533203125, 0.40763092041015625, 0.4169921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 43.0, 281.0, 462.0, 177.0, 29.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2849271297454834, -2.1603193283081055, -2.0357117652893066, -1.9111040830612183, -1.7864964008331299, -1.6618887186050415, -1.5372810363769531, -1.4126733541488647, -1.2880656719207764, -1.163457989692688, -1.0388503074645996, -0.9142426252365112, -0.7896349430084229, -0.6650272607803345, -0.5404195785522461, -0.4158118963241577, -0.29120421409606934, -0.16659653186798096, -0.04198884963989258, 0.0826188325881958, 0.20722651481628418, 0.33183419704437256, 0.45644187927246094, 0.5810495615005493, 0.7056572437286377, 0.8302649259567261, 0.9548726081848145, 1.0794802904129028, 1.2040879726409912, 1.3286956548690796, 1.453303337097168, 1.5779110193252563, 1.7025184631347656, 1.827126145362854, 1.9517338275909424, 2.0763416290283203, 2.200949192047119, 2.325556755065918, 2.450164556503296, 2.574772357940674, 2.6993799209594727, 2.8239874839782715, 2.9485952854156494, 3.0732030868530273, 3.197810649871826, 3.322418212890625, 3.447026014328003, 3.571633815765381, 3.6962413787841797, 3.8208489418029785, 3.9454567432403564, 4.070064544677734, 4.194672107696533, 4.319279670715332, 4.443887710571289, 4.568495273590088, 4.693102836608887, 4.8177103996276855, 4.942317962646484, 5.066926002502441, 5.19153356552124, 5.316141128540039, 5.440749168395996, 5.565356731414795, 5.689964294433594]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 9.0, 9.0, 16.0, 18.0, 10.0, 15.0, 23.0, 17.0, 21.0, 28.0, 28.0, 34.0, 48.0, 38.0, 41.0, 41.0, 47.0, 40.0, 35.0, 38.0, 28.0, 30.0, 42.0, 34.0, 39.0, 32.0, 28.0, 31.0, 26.0, 16.0, 20.0, 15.0, 21.0, 15.0, 9.0, 5.0, 6.0, 3.0, 7.0, 8.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5839733481407166, -0.5656446814537048, -0.5473159551620483, -0.5289872884750366, -0.5106586217880249, -0.4923299551010132, -0.4740012586116791, -0.45567256212234497, -0.43734389543533325, -0.41901522874832153, -0.4006865322589874, -0.3823578357696533, -0.3640291690826416, -0.3457005023956299, -0.3273718059062958, -0.30904310941696167, -0.29071444272994995, -0.27238577604293823, -0.2540570795536041, -0.2357283979654312, -0.2173997163772583, -0.1990710347890854, -0.18074235320091248, -0.16241367161273956, -0.14408499002456665, -0.12575630843639374, -0.10742762684822083, -0.08909894526004791, -0.070770263671875, -0.05244158208370209, -0.034112900495529175, -0.015784218907356262, 0.002544403076171875, 0.020873084664344788, 0.0392017662525177, 0.05753044784069061, 0.07585912942886353, 0.09418781101703644, 0.11251649260520935, 0.13084517419338226, 0.14917385578155518, 0.1675025373697281, 0.185831218957901, 0.2041599005460739, 0.22248858213424683, 0.24081726372241974, 0.25914594531059265, 0.27747464179992676, 0.2958033084869385, 0.3141319751739502, 0.3324606716632843, 0.3507893681526184, 0.3691180348396301, 0.38744670152664185, 0.40577539801597595, 0.42410409450531006, 0.4424327611923218, 0.4607614278793335, 0.4790901243686676, 0.4974188208580017, 0.5157474875450134, 0.5340761542320251, 0.5524048805236816, 0.5707335472106934, 0.5890622138977051]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 10.0, 13.0, 12.0, 12.0, 25.0, 42.0, 59.0, 79.0, 132.0, 163.0, 244.0, 322.0, 538.0, 774.0, 1127.0, 1701.0, 2447.0, 3905.0, 5991.0, 9885.0, 18215.0, 35669.0, 75853.0, 162177.0, 264072.0, 228729.0, 118748.0, 54329.0, 26406.0, 14030.0, 7982.0, 5023.0, 3207.0, 2187.0, 1397.0, 921.0, 684.0, 471.0, 276.0, 204.0, 159.0, 106.0, 71.0, 51.0, 34.0, 28.0, 15.0, 10.0, 12.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.229736328125, -0.22250938415527344, -0.21528244018554688, -0.2080554962158203, -0.20082855224609375, -0.1936016082763672, -0.18637466430664062, -0.17914772033691406, -0.1719207763671875, -0.16469383239746094, -0.15746688842773438, -0.1502399444580078, -0.14301300048828125, -0.1357860565185547, -0.12855911254882812, -0.12133216857910156, -0.114105224609375, -0.10687828063964844, -0.09965133666992188, -0.09242439270019531, -0.08519744873046875, -0.07797050476074219, -0.07074356079101562, -0.06351661682128906, -0.0562896728515625, -0.04906272888183594, -0.041835784912109375, -0.03460884094238281, -0.02738189697265625, -0.020154953002929688, -0.012928009033203125, -0.0057010650634765625, 0.00152587890625, 0.008752822875976562, 0.015979766845703125, 0.023206710815429688, 0.03043365478515625, 0.03766059875488281, 0.044887542724609375, 0.05211448669433594, 0.0593414306640625, 0.06656837463378906, 0.07379531860351562, 0.08102226257324219, 0.08824920654296875, 0.09547615051269531, 0.10270309448242188, 0.10993003845214844, 0.117156982421875, 0.12438392639160156, 0.13161087036132812, 0.1388378143310547, 0.14606475830078125, 0.1532917022705078, 0.16051864624023438, 0.16774559020996094, 0.1749725341796875, 0.18219947814941406, 0.18942642211914062, 0.1966533660888672, 0.20388031005859375, 0.2111072540283203, 0.21833419799804688, 0.22556114196777344, 0.2327880859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 2.0, 7.0, 13.0, 12.0, 27.0, 18.0, 10.0, 14.0, 31.0, 23.0, 34.0, 31.0, 32.0, 42.0, 38.0, 50.0, 39.0, 43.0, 57.0, 53.0, 42.0, 54.0, 44.0, 45.0, 39.0, 28.0, 34.0, 21.0, 17.0, 19.0, 7.0, 16.0, 8.0, 10.0, 6.0, 10.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.11444091796875, -0.11114501953125, -0.10784912109375, -0.10455322265625, -0.10125732421875, -0.09796142578125, -0.09466552734375, -0.09136962890625, -0.08807373046875, -0.08477783203125, -0.08148193359375, -0.07818603515625, -0.07489013671875, -0.07159423828125, -0.06829833984375, -0.06500244140625, -0.06170654296875, -0.05841064453125, -0.05511474609375, -0.05181884765625, -0.04852294921875, -0.04522705078125, -0.04193115234375, -0.03863525390625, -0.03533935546875, -0.03204345703125, -0.02874755859375, -0.02545166015625, -0.02215576171875, -0.01885986328125, -0.01556396484375, -0.01226806640625, -0.00897216796875, -0.00567626953125, -0.00238037109375, 0.00091552734375, 0.00421142578125, 0.00750732421875, 0.01080322265625, 0.01409912109375, 0.01739501953125, 0.02069091796875, 0.02398681640625, 0.02728271484375, 0.03057861328125, 0.03387451171875, 0.03717041015625, 0.04046630859375, 0.04376220703125, 0.04705810546875, 0.05035400390625, 0.05364990234375, 0.05694580078125, 0.06024169921875, 0.06353759765625, 0.06683349609375, 0.07012939453125, 0.07342529296875, 0.07672119140625, 0.08001708984375, 0.08331298828125, 0.08660888671875, 0.08990478515625, 0.09320068359375, 0.09649658203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 16.0, 12.0, 22.0, 27.0, 35.0, 53.0, 75.0, 109.0, 200.0, 330.0, 622.0, 1247.0, 2697.0, 6321.0, 14896.0, 39916.0, 128249.0, 363345.0, 326719.0, 106444.0, 33631.0, 12976.0, 5603.0, 2385.0, 1170.0, 621.0, 275.0, 179.0, 102.0, 73.0, 57.0, 39.0, 26.0, 20.0, 16.0, 12.0, 8.0, 8.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.369384765625, -0.3581657409667969, -0.34694671630859375, -0.3357276916503906, -0.3245086669921875, -0.3132896423339844, -0.30207061767578125, -0.2908515930175781, -0.279632568359375, -0.2684135437011719, -0.25719451904296875, -0.24597549438476562, -0.2347564697265625, -0.22353744506835938, -0.21231842041015625, -0.20109939575195312, -0.18988037109375, -0.17866134643554688, -0.16744232177734375, -0.15622329711914062, -0.1450042724609375, -0.13378524780273438, -0.12256622314453125, -0.11134719848632812, -0.100128173828125, -0.08890914916992188, -0.07769012451171875, -0.06647109985351562, -0.0552520751953125, -0.044033050537109375, -0.03281402587890625, -0.021595001220703125, -0.0103759765625, 0.000843048095703125, 0.01206207275390625, 0.023281097412109375, 0.0345001220703125, 0.045719146728515625, 0.05693817138671875, 0.06815719604492188, 0.079376220703125, 0.09059524536132812, 0.10181427001953125, 0.11303329467773438, 0.1242523193359375, 0.13547134399414062, 0.14669036865234375, 0.15790939331054688, 0.16912841796875, 0.18034744262695312, 0.19156646728515625, 0.20278549194335938, 0.2140045166015625, 0.22522354125976562, 0.23644256591796875, 0.24766159057617188, 0.258880615234375, 0.2700996398925781, 0.28131866455078125, 0.2925376892089844, 0.3037567138671875, 0.3149757385253906, 0.32619476318359375, 0.3374137878417969, 0.3486328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 9.0, 7.0, 5.0, 10.0, 8.0, 12.0, 12.0, 10.0, 28.0, 25.0, 18.0, 30.0, 38.0, 47.0, 42.0, 44.0, 40.0, 47.0, 58.0, 40.0, 41.0, 53.0, 42.0, 29.0, 43.0, 45.0, 33.0, 32.0, 20.0, 17.0, 28.0, 20.0, 20.0, 15.0, 9.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25048828125, -0.24302291870117188, -0.23555755615234375, -0.22809219360351562, -0.2206268310546875, -0.21316146850585938, -0.20569610595703125, -0.19823074340820312, -0.190765380859375, -0.18330001831054688, -0.17583465576171875, -0.16836929321289062, -0.1609039306640625, -0.15343856811523438, -0.14597320556640625, -0.13850784301757812, -0.13104248046875, -0.12357711791992188, -0.11611175537109375, -0.10864639282226562, -0.1011810302734375, -0.09371566772460938, -0.08625030517578125, -0.07878494262695312, -0.071319580078125, -0.06385421752929688, -0.05638885498046875, -0.048923492431640625, -0.0414581298828125, -0.033992767333984375, -0.02652740478515625, -0.019062042236328125, -0.0115966796875, -0.004131317138671875, 0.00333404541015625, 0.010799407958984375, 0.0182647705078125, 0.025730133056640625, 0.03319549560546875, 0.040660858154296875, 0.048126220703125, 0.055591583251953125, 0.06305694580078125, 0.07052230834960938, 0.0779876708984375, 0.08545303344726562, 0.09291839599609375, 0.10038375854492188, 0.10784912109375, 0.11531448364257812, 0.12277984619140625, 0.13024520874023438, 0.1377105712890625, 0.14517593383789062, 0.15264129638671875, 0.16010665893554688, 0.167572021484375, 0.17503738403320312, 0.18250274658203125, 0.18996810913085938, 0.1974334716796875, 0.20489883422851562, 0.21236419677734375, 0.21982955932617188, 0.227294921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 12.0, 22.0, 19.0, 36.0, 64.0, 104.0, 171.0, 242.0, 386.0, 699.0, 1212.0, 2289.0, 6570.0, 96157.0, 893616.0, 37822.0, 4626.0, 1842.0, 1047.0, 643.0, 376.0, 246.0, 132.0, 82.0, 53.0, 21.0, 18.0, 12.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96142578125, -0.936370849609375, -0.91131591796875, -0.886260986328125, -0.8612060546875, -0.836151123046875, -0.81109619140625, -0.786041259765625, -0.760986328125, -0.735931396484375, -0.71087646484375, -0.685821533203125, -0.6607666015625, -0.635711669921875, -0.61065673828125, -0.585601806640625, -0.560546875, -0.535491943359375, -0.51043701171875, -0.485382080078125, -0.4603271484375, -0.435272216796875, -0.41021728515625, -0.385162353515625, -0.360107421875, -0.335052490234375, -0.30999755859375, -0.284942626953125, -0.2598876953125, -0.234832763671875, -0.20977783203125, -0.184722900390625, -0.15966796875, -0.134613037109375, -0.10955810546875, -0.084503173828125, -0.0594482421875, -0.034393310546875, -0.00933837890625, 0.015716552734375, 0.040771484375, 0.065826416015625, 0.09088134765625, 0.115936279296875, 0.1409912109375, 0.166046142578125, 0.19110107421875, 0.216156005859375, 0.2412109375, 0.266265869140625, 0.29132080078125, 0.316375732421875, 0.3414306640625, 0.366485595703125, 0.39154052734375, 0.416595458984375, 0.441650390625, 0.466705322265625, 0.49176025390625, 0.516815185546875, 0.5418701171875, 0.566925048828125, 0.59197998046875, 0.617034912109375, 0.64208984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 8.0, 12.0, 22.0, 100.0, 454.0, 313.0, 48.0, 19.0, 4.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001448923721909523, -0.00014124996960163116, -0.00013760756701231003, -0.0001339651644229889, -0.00013032276183366776, -0.00012668035924434662, -0.00012303795665502548, -0.00011939555406570435, -0.00011575315147638321, -0.00011211074888706207, -0.00010846834629774094, -0.0001048259437084198, -0.00010118354111909866, -9.754113852977753e-05, -9.389873594045639e-05, -9.025633335113525e-05, -8.661393076181412e-05, -8.297152817249298e-05, -7.932912558317184e-05, -7.568672299385071e-05, -7.204432040452957e-05, -6.840191781520844e-05, -6.47595152258873e-05, -6.111711263656616e-05, -5.7474710047245026e-05, -5.383230745792389e-05, -5.018990486860275e-05, -4.6547502279281616e-05, -4.290509968996048e-05, -3.926269710063934e-05, -3.562029451131821e-05, -3.197789192199707e-05, -2.8335489332675934e-05, -2.4693086743354797e-05, -2.105068415403366e-05, -1.7408281564712524e-05, -1.3765878975391388e-05, -1.0123476386070251e-05, -6.481073796749115e-06, -2.8386712074279785e-06, 8.03731381893158e-07, 4.4461339712142944e-06, 8.088536560535431e-06, 1.1730939149856567e-05, 1.5373341739177704e-05, 1.901574432849884e-05, 2.2658146917819977e-05, 2.6300549507141113e-05, 2.994295209646225e-05, 3.3585354685783386e-05, 3.722775727510452e-05, 4.087015986442566e-05, 4.4512562453746796e-05, 4.815496504306793e-05, 5.179736763238907e-05, 5.5439770221710205e-05, 5.908217281103134e-05, 6.272457540035248e-05, 6.636697798967361e-05, 7.000938057899475e-05, 7.365178316831589e-05, 7.729418575763702e-05, 8.093658834695816e-05, 8.45789909362793e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 13.0, 14.0, 13.0, 21.0, 28.0, 42.0, 54.0, 85.0, 101.0, 177.0, 260.0, 377.0, 744.0, 1211.0, 2143.0, 4044.0, 7678.0, 15528.0, 33179.0, 77820.0, 181143.0, 294902.0, 232895.0, 108498.0, 45631.0, 20426.0, 9811.0, 5201.0, 2779.0, 1426.0, 871.0, 490.0, 302.0, 192.0, 138.0, 81.0, 69.0, 49.0, 38.0, 26.0, 18.0, 8.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.127197265625, -0.1233062744140625, -0.119415283203125, -0.1155242919921875, -0.11163330078125, -0.1077423095703125, -0.103851318359375, -0.0999603271484375, -0.0960693359375, -0.0921783447265625, -0.088287353515625, -0.0843963623046875, -0.08050537109375, -0.0766143798828125, -0.072723388671875, -0.0688323974609375, -0.06494140625, -0.0610504150390625, -0.057159423828125, -0.0532684326171875, -0.04937744140625, -0.0454864501953125, -0.041595458984375, -0.0377044677734375, -0.0338134765625, -0.0299224853515625, -0.026031494140625, -0.0221405029296875, -0.01824951171875, -0.0143585205078125, -0.010467529296875, -0.0065765380859375, -0.002685546875, 0.0012054443359375, 0.005096435546875, 0.0089874267578125, 0.01287841796875, 0.0167694091796875, 0.020660400390625, 0.0245513916015625, 0.0284423828125, 0.0323333740234375, 0.036224365234375, 0.0401153564453125, 0.04400634765625, 0.0478973388671875, 0.051788330078125, 0.0556793212890625, 0.0595703125, 0.0634613037109375, 0.067352294921875, 0.0712432861328125, 0.07513427734375, 0.0790252685546875, 0.082916259765625, 0.0868072509765625, 0.0906982421875, 0.0945892333984375, 0.098480224609375, 0.1023712158203125, 0.10626220703125, 0.1101531982421875, 0.114044189453125, 0.1179351806640625, 0.121826171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 3.0, 10.0, 13.0, 12.0, 14.0, 20.0, 37.0, 33.0, 37.0, 39.0, 39.0, 41.0, 64.0, 52.0, 63.0, 58.0, 62.0, 59.0, 47.0, 43.0, 30.0, 34.0, 28.0, 18.0, 19.0, 22.0, 18.0, 15.0, 10.0, 9.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07611083984375, -0.07369804382324219, -0.07128524780273438, -0.06887245178222656, -0.06645965576171875, -0.06404685974121094, -0.061634063720703125, -0.05922126770019531, -0.0568084716796875, -0.05439567565917969, -0.051982879638671875, -0.04957008361816406, -0.04715728759765625, -0.04474449157714844, -0.042331695556640625, -0.03991889953613281, -0.037506103515625, -0.03509330749511719, -0.032680511474609375, -0.030267715454101562, -0.02785491943359375, -0.025442123413085938, -0.023029327392578125, -0.020616531372070312, -0.0182037353515625, -0.015790939331054688, -0.013378143310546875, -0.010965347290039062, -0.00855255126953125, -0.0061397552490234375, -0.003726959228515625, -0.0013141632080078125, 0.0010986328125, 0.0035114288330078125, 0.005924224853515625, 0.008337020874023438, 0.01074981689453125, 0.013162612915039062, 0.015575408935546875, 0.017988204956054688, 0.0204010009765625, 0.022813796997070312, 0.025226593017578125, 0.027639389038085938, 0.03005218505859375, 0.03246498107910156, 0.034877777099609375, 0.03729057312011719, 0.039703369140625, 0.04211616516113281, 0.044528961181640625, 0.04694175720214844, 0.04935455322265625, 0.05176734924316406, 0.054180145263671875, 0.05659294128417969, 0.0590057373046875, 0.06141853332519531, 0.06383132934570312, 0.06624412536621094, 0.06865692138671875, 0.07106971740722656, 0.07348251342773438, 0.07589530944824219, 0.07830810546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 84.0, 318.0, 424.0, 136.0, 32.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7269718647003174, -2.6042118072509766, -2.4814517498016357, -2.358691692352295, -2.235931634902954, -2.1131715774536133, -1.990411400794983, -1.867651343345642, -1.7448912858963013, -1.6221312284469604, -1.4993711709976196, -1.3766109943389893, -1.2538509368896484, -1.1310908794403076, -1.0083308219909668, -0.885570764541626, -0.7628107070922852, -0.6400506496429443, -0.5172905921936035, -0.3945304751396179, -0.2717704176902771, -0.14901036024093628, -0.026250243186950684, 0.09650981426239014, 0.21926987171173096, 0.3420299291610718, 0.464790016412735, 0.5875501036643982, 0.710310161113739, 0.8330702185630798, 0.9558303356170654, 1.0785903930664062, 1.201350212097168, 1.3241102695465088, 1.4468703269958496, 1.5696303844451904, 1.6923904418945312, 1.815150499343872, 1.9379106760025024, 2.060670852661133, 2.1834306716918945, 2.3061907291412354, 2.428950786590576, 2.551710844039917, 2.674470901489258, 2.7972309589385986, 2.9199910163879395, 3.0427513122558594, 3.1655113697052, 3.288271427154541, 3.411031484603882, 3.5337915420532227, 3.6565515995025635, 3.7793116569519043, 3.902071952819824, 4.024831771850586, 4.147592067718506, 4.270352363586426, 4.3931121826171875, 4.515872478485107, 4.638632297515869, 4.761392593383789, 4.884152412414551, 5.006912708282471, 5.129672527313232]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 2.0, 8.0, 13.0, 14.0, 17.0, 20.0, 22.0, 21.0, 26.0, 38.0, 30.0, 40.0, 53.0, 40.0, 58.0, 45.0, 59.0, 39.0, 60.0, 50.0, 46.0, 42.0, 34.0, 35.0, 21.0, 28.0, 22.0, 23.0, 11.0, 19.0, 8.0, 8.0, 8.0, 7.0, 6.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7051905393600464, -0.6822935938835144, -0.6593967080116272, -0.6364997625350952, -0.6136028170585632, -0.5907058715820312, -0.567808985710144, -0.5449120402336121, -0.5220150947570801, -0.4991181790828705, -0.4762212336063385, -0.4533243179321289, -0.4304273724555969, -0.40753045678138733, -0.38463354110717773, -0.36173659563064575, -0.33883970975875854, -0.31594279408454895, -0.29304584860801697, -0.2701489329338074, -0.24725200235843658, -0.2243550717830658, -0.2014581561088562, -0.1785612255334854, -0.15566429495811462, -0.13276736438274384, -0.10987044125795364, -0.08697351813316345, -0.06407658755779266, -0.041179656982421875, -0.01828274130821228, 0.004614189267158508, 0.027511179447174072, 0.05040810629725456, 0.07330503314733505, 0.09620195627212524, 0.11909888684749603, 0.14199581742286682, 0.16489273309707642, 0.1877896636724472, 0.210686594247818, 0.23358352482318878, 0.25648045539855957, 0.27937737107276917, 0.30227428674697876, 0.32517123222351074, 0.34806814789772034, 0.37096506357192993, 0.3938620090484619, 0.4167589247226715, 0.4396558701992035, 0.4625527858734131, 0.48544973134994507, 0.508346676826477, 0.5312435626983643, 0.5541405081748962, 0.5770374536514282, 0.5999343991279602, 0.6228312849998474, 0.6457282304763794, 0.6686251759529114, 0.6915221214294434, 0.7144190073013306, 0.7373159527778625, 0.7602128386497498]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 10.0, 8.0, 18.0, 18.0, 25.0, 36.0, 47.0, 90.0, 146.0, 280.0, 498.0, 1025.0, 2078.0, 4805.0, 12358.0, 35259.0, 117980.0, 517597.0, 1873977.0, 1245810.0, 273136.0, 71451.0, 23032.0, 8316.0, 3313.0, 1469.0, 697.0, 345.0, 173.0, 101.0, 56.0, 46.0, 29.0, 16.0, 10.0, 8.0, 2.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.224365234375, -0.2177257537841797, -0.21108627319335938, -0.20444679260253906, -0.19780731201171875, -0.19116783142089844, -0.18452835083007812, -0.1778888702392578, -0.1712493896484375, -0.1646099090576172, -0.15797042846679688, -0.15133094787597656, -0.14469146728515625, -0.13805198669433594, -0.13141250610351562, -0.12477302551269531, -0.118133544921875, -0.11149406433105469, -0.10485458374023438, -0.09821510314941406, -0.09157562255859375, -0.08493614196777344, -0.07829666137695312, -0.07165718078613281, -0.0650177001953125, -0.05837821960449219, -0.051738739013671875, -0.04509925842285156, -0.03845977783203125, -0.03182029724121094, -0.025180816650390625, -0.018541336059570312, -0.01190185546875, -0.0052623748779296875, 0.001377105712890625, 0.008016586303710938, 0.01465606689453125, 0.021295547485351562, 0.027935028076171875, 0.03457450866699219, 0.0412139892578125, 0.04785346984863281, 0.054492950439453125, 0.06113243103027344, 0.06777191162109375, 0.07441139221191406, 0.08105087280273438, 0.08769035339355469, 0.094329833984375, 0.10096931457519531, 0.10760879516601562, 0.11424827575683594, 0.12088775634765625, 0.12752723693847656, 0.13416671752929688, 0.1408061981201172, 0.1474456787109375, 0.1540851593017578, 0.16072463989257812, 0.16736412048339844, 0.17400360107421875, 0.18064308166503906, 0.18728256225585938, 0.1939220428466797, 0.2005615234375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 16.0, 9.0, 18.0, 17.0, 19.0, 24.0, 33.0, 37.0, 28.0, 48.0, 42.0, 39.0, 52.0, 52.0, 40.0, 50.0, 56.0, 53.0, 56.0, 52.0, 28.0, 24.0, 29.0, 17.0, 30.0, 31.0, 11.0, 14.0, 7.0, 17.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.124755859375, -0.1212615966796875, -0.117767333984375, -0.1142730712890625, -0.11077880859375, -0.1072845458984375, -0.103790283203125, -0.1002960205078125, -0.0968017578125, -0.0933074951171875, -0.089813232421875, -0.0863189697265625, -0.08282470703125, -0.0793304443359375, -0.075836181640625, -0.0723419189453125, -0.06884765625, -0.0653533935546875, -0.061859130859375, -0.0583648681640625, -0.05487060546875, -0.0513763427734375, -0.047882080078125, -0.0443878173828125, -0.0408935546875, -0.0373992919921875, -0.033905029296875, -0.0304107666015625, -0.02691650390625, -0.0234222412109375, -0.019927978515625, -0.0164337158203125, -0.012939453125, -0.0094451904296875, -0.005950927734375, -0.0024566650390625, 0.00103759765625, 0.0045318603515625, 0.008026123046875, 0.0115203857421875, 0.0150146484375, 0.0185089111328125, 0.022003173828125, 0.0254974365234375, 0.02899169921875, 0.0324859619140625, 0.035980224609375, 0.0394744873046875, 0.04296875, 0.0464630126953125, 0.049957275390625, 0.0534515380859375, 0.05694580078125, 0.0604400634765625, 0.063934326171875, 0.0674285888671875, 0.0709228515625, 0.0744171142578125, 0.077911376953125, 0.0814056396484375, 0.08489990234375, 0.0883941650390625, 0.091888427734375, 0.0953826904296875, 0.098876953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 9.0, 15.0, 30.0, 46.0, 54.0, 72.0, 143.0, 302.0, 502.0, 1108.0, 3134.0, 9742.0, 35409.0, 141724.0, 565812.0, 1678470.0, 1276766.0, 358589.0, 89195.0, 22532.0, 6590.0, 2183.0, 899.0, 373.0, 219.0, 114.0, 84.0, 53.0, 36.0, 27.0, 16.0, 8.0, 8.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.314453125, -0.30591583251953125, -0.2973785400390625, -0.28884124755859375, -0.280303955078125, -0.27176666259765625, -0.2632293701171875, -0.25469207763671875, -0.24615478515625, -0.23761749267578125, -0.2290802001953125, -0.22054290771484375, -0.212005615234375, -0.20346832275390625, -0.1949310302734375, -0.18639373779296875, -0.1778564453125, -0.16931915283203125, -0.1607818603515625, -0.15224456787109375, -0.143707275390625, -0.13516998291015625, -0.1266326904296875, -0.11809539794921875, -0.10955810546875, -0.10102081298828125, -0.0924835205078125, -0.08394622802734375, -0.075408935546875, -0.06687164306640625, -0.0583343505859375, -0.04979705810546875, -0.041259765625, -0.03272247314453125, -0.0241851806640625, -0.01564788818359375, -0.007110595703125, 0.00142669677734375, 0.0099639892578125, 0.01850128173828125, 0.02703857421875, 0.03557586669921875, 0.0441131591796875, 0.05265045166015625, 0.061187744140625, 0.06972503662109375, 0.0782623291015625, 0.08679962158203125, 0.0953369140625, 0.10387420654296875, 0.1124114990234375, 0.12094879150390625, 0.129486083984375, 0.13802337646484375, 0.1465606689453125, 0.15509796142578125, 0.16363525390625, 0.17217254638671875, 0.1807098388671875, 0.18924713134765625, 0.197784423828125, 0.20632171630859375, 0.2148590087890625, 0.22339630126953125, 0.23193359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 3.0, 11.0, 18.0, 26.0, 31.0, 45.0, 41.0, 65.0, 85.0, 106.0, 137.0, 185.0, 210.0, 272.0, 345.0, 353.0, 384.0, 370.0, 318.0, 244.0, 224.0, 158.0, 109.0, 87.0, 66.0, 54.0, 26.0, 24.0, 19.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.13652992248535156, -0.13011550903320312, -0.12370109558105469, -0.11728668212890625, -0.11087226867675781, -0.10445785522460938, -0.09804344177246094, -0.0916290283203125, -0.08521461486816406, -0.07880020141601562, -0.07238578796386719, -0.06597137451171875, -0.05955696105957031, -0.053142547607421875, -0.04672813415527344, -0.040313720703125, -0.03389930725097656, -0.027484893798828125, -0.021070480346679688, -0.01465606689453125, -0.008241653442382812, -0.001827239990234375, 0.0045871734619140625, 0.0110015869140625, 0.017416000366210938, 0.023830413818359375, 0.030244827270507812, 0.03665924072265625, 0.04307365417480469, 0.049488067626953125, 0.05590248107910156, 0.06231689453125, 0.06873130798339844, 0.07514572143554688, 0.08156013488769531, 0.08797454833984375, 0.09438896179199219, 0.10080337524414062, 0.10721778869628906, 0.1136322021484375, 0.12004661560058594, 0.12646102905273438, 0.1328754425048828, 0.13928985595703125, 0.1457042694091797, 0.15211868286132812, 0.15853309631347656, 0.164947509765625, 0.17136192321777344, 0.17777633666992188, 0.1841907501220703, 0.19060516357421875, 0.1970195770263672, 0.20343399047851562, 0.20984840393066406, 0.2162628173828125, 0.22267723083496094, 0.22909164428710938, 0.2355060577392578, 0.24192047119140625, 0.2483348846435547, 0.2547492980957031, 0.26116371154785156, 0.267578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 17.0, 32.0, 79.0, 137.0, 183.0, 211.0, 161.0, 118.0, 41.0, 19.0, 8.0, 2.0, 3.0], "bins": [-4.22857666015625, -4.153481960296631, -4.07838773727417, -4.003293037414551, -3.9281985759735107, -3.8531041145324707, -3.7780096530914307, -3.7029151916503906, -3.6278207302093506, -3.5527262687683105, -3.4776318073272705, -3.4025373458862305, -3.3274426460266113, -3.2523481845855713, -3.1772537231445312, -3.102159261703491, -3.027064800262451, -2.951970338821411, -2.876875877380371, -2.801781177520752, -2.726686716079712, -2.651592254638672, -2.576497793197632, -2.501403331756592, -2.4263086318969727, -2.3512141704559326, -2.2761197090148926, -2.2010250091552734, -2.1259305477142334, -2.0508360862731934, -1.9757416248321533, -1.9006471633911133, -1.8255524635314941, -1.750458002090454, -1.6753634214401245, -1.6002689599990845, -1.5251744985580444, -1.4500799179077148, -1.3749854564666748, -1.2998909950256348, -1.2247965335845947, -1.1497020721435547, -1.074607491493225, -0.9995130300521851, -0.924418568611145, -0.8493240475654602, -0.7742295265197754, -0.6991350650787354, -0.6240405440330505, -0.5489460229873657, -0.4738515615463257, -0.39875704050064087, -0.32366254925727844, -0.24856805801391602, -0.1734735369682312, -0.09837907552719116, -0.023284554481506348, 0.051809944212436676, 0.1269044429063797, 0.20199894905090332, 0.27709344029426575, 0.3521879315376282, 0.427282452583313, 0.502376914024353, 0.5774714350700378]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 11.0, 11.0, 4.0, 11.0, 14.0, 22.0, 16.0, 21.0, 18.0, 32.0, 34.0, 40.0, 22.0, 32.0, 48.0, 39.0, 36.0, 47.0, 44.0, 35.0, 30.0, 39.0, 34.0, 41.0, 35.0, 29.0, 35.0, 24.0, 33.0, 23.0, 20.0, 18.0, 18.0, 11.0, 10.0, 3.0, 9.0, 12.0, 8.0, 1.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6475735306739807, -0.6264436841011047, -0.6053138971328735, -0.5841840505599976, -0.5630542039871216, -0.5419243574142456, -0.5207945704460144, -0.4996647238731384, -0.47853490710258484, -0.45740509033203125, -0.4362752437591553, -0.4151454269886017, -0.3940156102180481, -0.3728857636451721, -0.35175594687461853, -0.33062613010406494, -0.30949628353118896, -0.2883664667606354, -0.2672366201877594, -0.2461068034172058, -0.22497697174549103, -0.20384714007377625, -0.18271732330322266, -0.16158749163150787, -0.1404576599597931, -0.11932782828807831, -0.09819800406694412, -0.07706817984580994, -0.055938348174095154, -0.03480851650238037, -0.013678699731826782, 0.0074511319398880005, 0.028580963611602783, 0.04971079155802727, 0.07084061950445175, 0.09197044372558594, 0.11310027539730072, 0.1342301070690155, 0.1553599238395691, 0.17648975551128387, 0.19761958718299866, 0.21874941885471344, 0.23987925052642822, 0.2610090672969818, 0.2821388840675354, 0.3032687306404114, 0.32439854741096497, 0.34552836418151855, 0.36665821075439453, 0.3877880275249481, 0.4089178740978241, 0.4300476908683777, 0.45117753744125366, 0.47230735421180725, 0.49343717098236084, 0.5145670175552368, 0.5356968641281128, 0.5568267107009888, 0.57795649766922, 0.599086344242096, 0.6202161908149719, 0.6413459777832031, 0.6624758243560791, 0.6836056709289551, 0.7047354578971863]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 12.0, 14.0, 26.0, 30.0, 42.0, 106.0, 147.0, 258.0, 489.0, 1034.0, 1969.0, 4029.0, 8044.0, 16986.0, 34438.0, 68905.0, 131793.0, 212771.0, 232435.0, 160243.0, 87771.0, 44317.0, 21705.0, 10552.0, 5144.0, 2572.0, 1192.0, 631.0, 348.0, 209.0, 129.0, 69.0, 45.0, 34.0, 14.0, 11.0, 13.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21263504028320312, -0.20481109619140625, -0.19698715209960938, -0.1891632080078125, -0.18133926391601562, -0.17351531982421875, -0.16569137573242188, -0.157867431640625, -0.15004348754882812, -0.14221954345703125, -0.13439559936523438, -0.1265716552734375, -0.11874771118164062, -0.11092376708984375, -0.10309982299804688, -0.09527587890625, -0.08745193481445312, -0.07962799072265625, -0.07180404663085938, -0.0639801025390625, -0.056156158447265625, -0.04833221435546875, -0.040508270263671875, -0.032684326171875, -0.024860382080078125, -0.01703643798828125, -0.009212493896484375, -0.0013885498046875, 0.006435394287109375, 0.01425933837890625, 0.022083282470703125, 0.0299072265625, 0.037731170654296875, 0.04555511474609375, 0.053379058837890625, 0.0612030029296875, 0.06902694702148438, 0.07685089111328125, 0.08467483520507812, 0.092498779296875, 0.10032272338867188, 0.10814666748046875, 0.11597061157226562, 0.1237945556640625, 0.13161849975585938, 0.13944244384765625, 0.14726638793945312, 0.15509033203125, 0.16291427612304688, 0.17073822021484375, 0.17856216430664062, 0.1863861083984375, 0.19421005249023438, 0.20203399658203125, 0.20985794067382812, 0.217681884765625, 0.22550582885742188, 0.23332977294921875, 0.24115371704101562, 0.2489776611328125, 0.2568016052246094, 0.26462554931640625, 0.2724494934082031, 0.2802734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 10.0, 5.0, 21.0, 14.0, 16.0, 19.0, 22.0, 26.0, 34.0, 23.0, 49.0, 41.0, 62.0, 58.0, 60.0, 64.0, 54.0, 40.0, 55.0, 45.0, 44.0, 28.0, 35.0, 35.0, 22.0, 23.0, 25.0, 15.0, 12.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.133544921875, -0.12995338439941406, -0.12636184692382812, -0.12277030944824219, -0.11917877197265625, -0.11558723449707031, -0.11199569702148438, -0.10840415954589844, -0.1048126220703125, -0.10122108459472656, -0.09762954711914062, -0.09403800964355469, -0.09044647216796875, -0.08685493469238281, -0.08326339721679688, -0.07967185974121094, -0.076080322265625, -0.07248878479003906, -0.06889724731445312, -0.06530570983886719, -0.06171417236328125, -0.05812263488769531, -0.054531097412109375, -0.05093955993652344, -0.0473480224609375, -0.04375648498535156, -0.040164947509765625, -0.03657341003417969, -0.03298187255859375, -0.029390335083007812, -0.025798797607421875, -0.022207260131835938, -0.01861572265625, -0.015024185180664062, -0.011432647705078125, -0.007841110229492188, -0.00424957275390625, -0.0006580352783203125, 0.002933502197265625, 0.0065250396728515625, 0.0101165771484375, 0.013708114624023438, 0.017299652099609375, 0.020891189575195312, 0.02448272705078125, 0.028074264526367188, 0.031665802001953125, 0.03525733947753906, 0.038848876953125, 0.04244041442871094, 0.046031951904296875, 0.04962348937988281, 0.05321502685546875, 0.05680656433105469, 0.060398101806640625, 0.06398963928222656, 0.0675811767578125, 0.07117271423339844, 0.07476425170898438, 0.07835578918457031, 0.08194732666015625, 0.08553886413574219, 0.08913040161132812, 0.09272193908691406, 0.0963134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 23.0, 45.0, 65.0, 101.0, 175.0, 308.0, 519.0, 1000.0, 1974.0, 4355.0, 10259.0, 23958.0, 54793.0, 120487.0, 231894.0, 277755.0, 172822.0, 82286.0, 36552.0, 16124.0, 6877.0, 2991.0, 1451.0, 664.0, 399.0, 228.0, 155.0, 92.0, 66.0, 29.0, 26.0, 11.0, 10.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341796875, -0.33119964599609375, -0.3206024169921875, -0.31000518798828125, -0.299407958984375, -0.28881072998046875, -0.2782135009765625, -0.26761627197265625, -0.25701904296875, -0.24642181396484375, -0.2358245849609375, -0.22522735595703125, -0.214630126953125, -0.20403289794921875, -0.1934356689453125, -0.18283843994140625, -0.1722412109375, -0.16164398193359375, -0.1510467529296875, -0.14044952392578125, -0.129852294921875, -0.11925506591796875, -0.1086578369140625, -0.09806060791015625, -0.08746337890625, -0.07686614990234375, -0.0662689208984375, -0.05567169189453125, -0.045074462890625, -0.03447723388671875, -0.0238800048828125, -0.01328277587890625, -0.002685546875, 0.00791168212890625, 0.0185089111328125, 0.02910614013671875, 0.039703369140625, 0.05030059814453125, 0.0608978271484375, 0.07149505615234375, 0.08209228515625, 0.09268951416015625, 0.1032867431640625, 0.11388397216796875, 0.124481201171875, 0.13507843017578125, 0.1456756591796875, 0.15627288818359375, 0.1668701171875, 0.17746734619140625, 0.1880645751953125, 0.19866180419921875, 0.209259033203125, 0.21985626220703125, 0.2304534912109375, 0.24105072021484375, 0.25164794921875, 0.26224517822265625, 0.2728424072265625, 0.28343963623046875, 0.294036865234375, 0.30463409423828125, 0.3152313232421875, 0.32582855224609375, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 12.0, 5.0, 13.0, 9.0, 14.0, 24.0, 18.0, 16.0, 28.0, 37.0, 38.0, 33.0, 35.0, 55.0, 52.0, 48.0, 50.0, 57.0, 49.0, 42.0, 51.0, 43.0, 33.0, 29.0, 31.0, 21.0, 27.0, 28.0, 14.0, 18.0, 12.0, 9.0, 8.0, 13.0, 5.0, 6.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.364990234375, -0.35565757751464844, -0.3463249206542969, -0.3369922637939453, -0.32765960693359375, -0.3183269500732422, -0.3089942932128906, -0.29966163635253906, -0.2903289794921875, -0.28099632263183594, -0.2716636657714844, -0.2623310089111328, -0.25299835205078125, -0.2436656951904297, -0.23433303833007812, -0.22500038146972656, -0.215667724609375, -0.20633506774902344, -0.19700241088867188, -0.1876697540283203, -0.17833709716796875, -0.1690044403076172, -0.15967178344726562, -0.15033912658691406, -0.1410064697265625, -0.13167381286621094, -0.12234115600585938, -0.11300849914550781, -0.10367584228515625, -0.09434318542480469, -0.08501052856445312, -0.07567787170410156, -0.06634521484375, -0.05701255798339844, -0.047679901123046875, -0.03834724426269531, -0.02901458740234375, -0.019681930541992188, -0.010349273681640625, -0.0010166168212890625, 0.0083160400390625, 0.017648696899414062, 0.026981353759765625, 0.03631401062011719, 0.04564666748046875, 0.05497932434082031, 0.06431198120117188, 0.07364463806152344, 0.082977294921875, 0.09230995178222656, 0.10164260864257812, 0.11097526550292969, 0.12030792236328125, 0.1296405792236328, 0.13897323608398438, 0.14830589294433594, 0.1576385498046875, 0.16697120666503906, 0.17630386352539062, 0.1856365203857422, 0.19496917724609375, 0.2043018341064453, 0.21363449096679688, 0.22296714782714844, 0.2322998046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 10.0, 7.0, 21.0, 26.0, 29.0, 35.0, 47.0, 71.0, 106.0, 123.0, 195.0, 309.0, 590.0, 917.0, 1513.0, 2746.0, 5894.0, 76542.0, 918515.0, 29938.0, 4911.0, 2412.0, 1408.0, 788.0, 467.0, 319.0, 167.0, 146.0, 77.0, 69.0, 47.0, 32.0, 27.0, 19.0, 13.0, 12.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72705078125, -0.7038955688476562, -0.6807403564453125, -0.6575851440429688, -0.634429931640625, -0.6112747192382812, -0.5881195068359375, -0.5649642944335938, -0.54180908203125, -0.5186538696289062, -0.4954986572265625, -0.47234344482421875, -0.449188232421875, -0.42603302001953125, -0.4028778076171875, -0.37972259521484375, -0.3565673828125, -0.33341217041015625, -0.3102569580078125, -0.28710174560546875, -0.263946533203125, -0.24079132080078125, -0.2176361083984375, -0.19448089599609375, -0.17132568359375, -0.14817047119140625, -0.1250152587890625, -0.10186004638671875, -0.078704833984375, -0.05554962158203125, -0.0323944091796875, -0.00923919677734375, 0.013916015625, 0.03707122802734375, 0.0602264404296875, 0.08338165283203125, 0.106536865234375, 0.12969207763671875, 0.1528472900390625, 0.17600250244140625, 0.19915771484375, 0.22231292724609375, 0.2454681396484375, 0.26862335205078125, 0.291778564453125, 0.31493377685546875, 0.3380889892578125, 0.36124420166015625, 0.3843994140625, 0.40755462646484375, 0.4307098388671875, 0.45386505126953125, 0.477020263671875, 0.5001754760742188, 0.5233306884765625, 0.5464859008789062, 0.56964111328125, 0.5927963256835938, 0.6159515380859375, 0.6391067504882812, 0.662261962890625, 0.6854171752929688, 0.7085723876953125, 0.7317276000976562, 0.7548828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 14.0, 23.0, 51.0, 138.0, 262.0, 271.0, 118.0, 65.0, 28.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.173154830932617e-05, -8.886680006980896e-05, -8.600205183029175e-05, -8.313730359077454e-05, -8.027255535125732e-05, -7.740780711174011e-05, -7.45430588722229e-05, -7.167831063270569e-05, -6.881356239318848e-05, -6.594881415367126e-05, -6.308406591415405e-05, -6.021931767463684e-05, -5.735456943511963e-05, -5.448982119560242e-05, -5.1625072956085205e-05, -4.876032471656799e-05, -4.589557647705078e-05, -4.303082823753357e-05, -4.016607999801636e-05, -3.7301331758499146e-05, -3.4436583518981934e-05, -3.157183527946472e-05, -2.870708703994751e-05, -2.5842338800430298e-05, -2.2977590560913086e-05, -2.0112842321395874e-05, -1.7248094081878662e-05, -1.438334584236145e-05, -1.1518597602844238e-05, -8.653849363327026e-06, -5.7891011238098145e-06, -2.9243528842926025e-06, -5.960464477539063e-08, 2.8051435947418213e-06, 5.669891834259033e-06, 8.534640073776245e-06, 1.1399388313293457e-05, 1.4264136552810669e-05, 1.712888479232788e-05, 1.9993633031845093e-05, 2.2858381271362305e-05, 2.5723129510879517e-05, 2.858787775039673e-05, 3.145262598991394e-05, 3.431737422943115e-05, 3.7182122468948364e-05, 4.0046870708465576e-05, 4.291161894798279e-05, 4.57763671875e-05, 4.864111542701721e-05, 5.1505863666534424e-05, 5.4370611906051636e-05, 5.723536014556885e-05, 6.010010838508606e-05, 6.296485662460327e-05, 6.582960486412048e-05, 6.86943531036377e-05, 7.155910134315491e-05, 7.442384958267212e-05, 7.728859782218933e-05, 8.015334606170654e-05, 8.301809430122375e-05, 8.588284254074097e-05, 8.874759078025818e-05, 9.161233901977539e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 12.0, 19.0, 22.0, 50.0, 63.0, 130.0, 200.0, 337.0, 614.0, 1212.0, 2558.0, 5701.0, 13944.0, 33770.0, 80170.0, 164366.0, 246464.0, 235764.0, 144817.0, 68515.0, 28551.0, 11723.0, 4950.0, 2217.0, 1018.0, 586.0, 299.0, 202.0, 111.0, 55.0, 41.0, 20.0, 21.0, 10.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10781192779541016, -0.10472297668457031, -0.10163402557373047, -0.09854507446289062, -0.09545612335205078, -0.09236717224121094, -0.0892782211303711, -0.08618927001953125, -0.0831003189086914, -0.08001136779785156, -0.07692241668701172, -0.07383346557617188, -0.07074451446533203, -0.06765556335449219, -0.06456661224365234, -0.0614776611328125, -0.058388710021972656, -0.05529975891113281, -0.05221080780029297, -0.049121856689453125, -0.04603290557861328, -0.04294395446777344, -0.039855003356933594, -0.03676605224609375, -0.033677101135253906, -0.030588150024414062, -0.02749919891357422, -0.024410247802734375, -0.02132129669189453, -0.018232345581054688, -0.015143394470214844, -0.012054443359375, -0.008965492248535156, -0.0058765411376953125, -0.0027875900268554688, 0.000301361083984375, 0.0033903121948242188, 0.0064792633056640625, 0.009568214416503906, 0.01265716552734375, 0.015746116638183594, 0.018835067749023438, 0.02192401885986328, 0.025012969970703125, 0.02810192108154297, 0.031190872192382812, 0.034279823303222656, 0.0373687744140625, 0.040457725524902344, 0.04354667663574219, 0.04663562774658203, 0.049724578857421875, 0.05281352996826172, 0.05590248107910156, 0.058991432189941406, 0.06208038330078125, 0.0651693344116211, 0.06825828552246094, 0.07134723663330078, 0.07443618774414062, 0.07752513885498047, 0.08061408996582031, 0.08370304107666016, 0.0867919921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 12.0, 12.0, 16.0, 10.0, 20.0, 20.0, 31.0, 29.0, 32.0, 39.0, 45.0, 51.0, 49.0, 70.0, 67.0, 53.0, 53.0, 52.0, 54.0, 46.0, 29.0, 36.0, 25.0, 29.0, 21.0, 20.0, 15.0, 17.0, 11.0, 1.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.060814857482910156, -0.05882453918457031, -0.05683422088623047, -0.054843902587890625, -0.05285358428955078, -0.05086326599121094, -0.048872947692871094, -0.04688262939453125, -0.044892311096191406, -0.04290199279785156, -0.04091167449951172, -0.038921356201171875, -0.03693103790283203, -0.03494071960449219, -0.032950401306152344, -0.0309600830078125, -0.028969764709472656, -0.026979446411132812, -0.02498912811279297, -0.022998809814453125, -0.02100849151611328, -0.019018173217773438, -0.017027854919433594, -0.01503753662109375, -0.013047218322753906, -0.011056900024414062, -0.009066581726074219, -0.007076263427734375, -0.005085945129394531, -0.0030956268310546875, -0.0011053085327148438, 0.000885009765625, 0.0028753280639648438, 0.0048656463623046875, 0.006855964660644531, 0.008846282958984375, 0.010836601257324219, 0.012826919555664062, 0.014817237854003906, 0.01680755615234375, 0.018797874450683594, 0.020788192749023438, 0.02277851104736328, 0.024768829345703125, 0.02675914764404297, 0.028749465942382812, 0.030739784240722656, 0.0327301025390625, 0.034720420837402344, 0.03671073913574219, 0.03870105743408203, 0.040691375732421875, 0.04268169403076172, 0.04467201232910156, 0.046662330627441406, 0.04865264892578125, 0.050642967224121094, 0.05263328552246094, 0.05462360382080078, 0.056613922119140625, 0.05860424041748047, 0.06059455871582031, 0.06258487701416016, 0.0645751953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 13.0, 30.0, 64.0, 80.0, 143.0, 182.0, 134.0, 142.0, 91.0, 49.0, 26.0, 18.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9887200593948364, -0.9365886449813843, -0.8844572901725769, -0.8323259353637695, -0.7801945209503174, -0.7280631065368652, -0.6759317517280579, -0.6238003969192505, -0.5716689825057983, -0.5195375680923462, -0.4674062132835388, -0.41527482867240906, -0.3631434440612793, -0.31101205945014954, -0.2588806748390198, -0.20674929022789001, -0.15461790561676025, -0.1024865210056305, -0.05035513639450073, 0.0017762482166290283, 0.05390763282775879, 0.10603901743888855, 0.1581704020500183, 0.21030178666114807, 0.26243317127227783, 0.3145645558834076, 0.36669594049453735, 0.4188273251056671, 0.4709587097167969, 0.523090124130249, 0.5752214789390564, 0.6273528337478638, 0.6794843673706055, 0.7316157817840576, 0.783747136592865, 0.8358784914016724, 0.8880099058151245, 0.9401413202285767, 0.992272675037384, 1.0444040298461914, 1.0965354442596436, 1.1486668586730957, 1.2007982730865479, 1.2529295682907104, 1.3050609827041626, 1.3571923971176147, 1.4093236923217773, 1.4614551067352295, 1.5135865211486816, 1.5657179355621338, 1.617849349975586, 1.6699806451797485, 1.7221120595932007, 1.7742434740066528, 1.8263747692108154, 1.8785061836242676, 1.9306375980377197, 1.9827690124511719, 2.034900426864624, 2.087031841278076, 2.139163017272949, 2.1912944316864014, 2.2434258460998535, 2.2955572605133057, 2.347688674926758]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 10.0, 12.0, 12.0, 11.0, 33.0, 23.0, 27.0, 39.0, 45.0, 37.0, 50.0, 48.0, 57.0, 47.0, 38.0, 49.0, 36.0, 45.0, 50.0, 51.0, 38.0, 32.0, 33.0, 26.0, 28.0, 23.0, 18.0, 13.0, 13.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9896751046180725, -0.9601157903671265, -0.9305564761161804, -0.9009971618652344, -0.8714378476142883, -0.8418785333633423, -0.8123192191123962, -0.7827599048614502, -0.7532005906105042, -0.7236412763595581, -0.6940819621086121, -0.664522647857666, -0.63496333360672, -0.6054040193557739, -0.5758447051048279, -0.5462853908538818, -0.5167261362075806, -0.4871668219566345, -0.4576075077056885, -0.42804819345474243, -0.3984888792037964, -0.36892956495285034, -0.3393702507019043, -0.30981093645095825, -0.2802516222000122, -0.25069230794906616, -0.22113299369812012, -0.19157367944717407, -0.16201436519622803, -0.13245506584644318, -0.10289575159549713, -0.07333643734455109, -0.04377710819244385, -0.014217795804142952, 0.015341516584157944, 0.04490082710981369, 0.07446014136075974, 0.10401944816112518, 0.13357876241207123, 0.16313807666301727, 0.19269739091396332, 0.22225670516490936, 0.2518160045146942, 0.28137531876564026, 0.3109346330165863, 0.34049394726753235, 0.3700532615184784, 0.39961257576942444, 0.4291718900203705, 0.45873120427131653, 0.4882905185222626, 0.5178498029708862, 0.5474091172218323, 0.5769684314727783, 0.6065277457237244, 0.6360870599746704, 0.6656463742256165, 0.6952056884765625, 0.7247650027275085, 0.7543243169784546, 0.7838836312294006, 0.8134429454803467, 0.8430022597312927, 0.8725615739822388, 0.9021208882331848]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 10.0, 12.0, 13.0, 16.0, 22.0, 37.0, 47.0, 79.0, 127.0, 206.0, 405.0, 800.0, 1784.0, 4461.0, 13277.0, 46535.0, 221525.0, 1513383.0, 1977421.0, 326618.0, 61454.0, 16755.0, 5442.0, 2052.0, 841.0, 413.0, 184.0, 115.0, 54.0, 58.0, 39.0, 22.0, 12.0, 12.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.246337890625, -0.2386646270751953, -0.23099136352539062, -0.22331809997558594, -0.21564483642578125, -0.20797157287597656, -0.20029830932617188, -0.1926250457763672, -0.1849517822265625, -0.1772785186767578, -0.16960525512695312, -0.16193199157714844, -0.15425872802734375, -0.14658546447753906, -0.13891220092773438, -0.1312389373779297, -0.123565673828125, -0.11589241027832031, -0.10821914672851562, -0.10054588317871094, -0.09287261962890625, -0.08519935607910156, -0.07752609252929688, -0.06985282897949219, -0.0621795654296875, -0.05450630187988281, -0.046833038330078125, -0.03915977478027344, -0.03148651123046875, -0.023813247680664062, -0.016139984130859375, -0.008466720581054688, -0.00079345703125, 0.0068798065185546875, 0.014553070068359375, 0.022226333618164062, 0.02989959716796875, 0.03757286071777344, 0.045246124267578125, 0.05291938781738281, 0.0605926513671875, 0.06826591491699219, 0.07593917846679688, 0.08361244201660156, 0.09128570556640625, 0.09895896911621094, 0.10663223266601562, 0.11430549621582031, 0.121978759765625, 0.1296520233154297, 0.13732528686523438, 0.14499855041503906, 0.15267181396484375, 0.16034507751464844, 0.16801834106445312, 0.1756916046142578, 0.1833648681640625, 0.1910381317138672, 0.19871139526367188, 0.20638465881347656, 0.21405792236328125, 0.22173118591308594, 0.22940444946289062, 0.2370777130126953, 0.2447509765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 10.0, 9.0, 29.0, 25.0, 32.0, 26.0, 33.0, 31.0, 51.0, 44.0, 39.0, 58.0, 43.0, 44.0, 44.0, 45.0, 50.0, 42.0, 33.0, 41.0, 36.0, 28.0, 31.0, 25.0, 22.0, 15.0, 22.0, 10.0, 9.0, 8.0, 5.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10982418060302734, -0.10636711120605469, -0.10291004180908203, -0.09945297241210938, -0.09599590301513672, -0.09253883361816406, -0.0890817642211914, -0.08562469482421875, -0.0821676254272461, -0.07871055603027344, -0.07525348663330078, -0.07179641723632812, -0.06833934783935547, -0.06488227844238281, -0.061425209045410156, -0.0579681396484375, -0.054511070251464844, -0.05105400085449219, -0.04759693145751953, -0.044139862060546875, -0.04068279266357422, -0.03722572326660156, -0.033768653869628906, -0.03031158447265625, -0.026854515075683594, -0.023397445678710938, -0.01994037628173828, -0.016483306884765625, -0.013026237487792969, -0.009569168090820312, -0.006112098693847656, -0.002655029296875, 0.0008020401000976562, 0.0042591094970703125, 0.007716178894042969, 0.011173248291015625, 0.014630317687988281, 0.018087387084960938, 0.021544456481933594, 0.02500152587890625, 0.028458595275878906, 0.03191566467285156, 0.03537273406982422, 0.038829803466796875, 0.04228687286376953, 0.04574394226074219, 0.049201011657714844, 0.0526580810546875, 0.056115150451660156, 0.05957221984863281, 0.06302928924560547, 0.06648635864257812, 0.06994342803955078, 0.07340049743652344, 0.0768575668334961, 0.08031463623046875, 0.0837717056274414, 0.08722877502441406, 0.09068584442138672, 0.09414291381835938, 0.09759998321533203, 0.10105705261230469, 0.10451412200927734, 0.10797119140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 10.0, 12.0, 22.0, 32.0, 42.0, 60.0, 107.0, 195.0, 319.0, 610.0, 1433.0, 3457.0, 9621.0, 29531.0, 97856.0, 337826.0, 1153466.0, 1690901.0, 615839.0, 175092.0, 51876.0, 16221.0, 5600.0, 2167.0, 967.0, 445.0, 214.0, 120.0, 78.0, 49.0, 36.0, 28.0, 12.0, 9.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24266815185546875, -0.2355804443359375, -0.22849273681640625, -0.221405029296875, -0.21431732177734375, -0.2072296142578125, -0.20014190673828125, -0.19305419921875, -0.18596649169921875, -0.1788787841796875, -0.17179107666015625, -0.164703369140625, -0.15761566162109375, -0.1505279541015625, -0.14344024658203125, -0.1363525390625, -0.12926483154296875, -0.1221771240234375, -0.11508941650390625, -0.108001708984375, -0.10091400146484375, -0.0938262939453125, -0.08673858642578125, -0.07965087890625, -0.07256317138671875, -0.0654754638671875, -0.05838775634765625, -0.051300048828125, -0.04421234130859375, -0.0371246337890625, -0.03003692626953125, -0.02294921875, -0.01586151123046875, -0.0087738037109375, -0.00168609619140625, 0.005401611328125, 0.01248931884765625, 0.0195770263671875, 0.02666473388671875, 0.03375244140625, 0.04084014892578125, 0.0479278564453125, 0.05501556396484375, 0.062103271484375, 0.06919097900390625, 0.0762786865234375, 0.08336639404296875, 0.0904541015625, 0.09754180908203125, 0.1046295166015625, 0.11171722412109375, 0.118804931640625, 0.12589263916015625, 0.1329803466796875, 0.14006805419921875, 0.14715576171875, 0.15424346923828125, 0.1613311767578125, 0.16841888427734375, 0.175506591796875, 0.18259429931640625, 0.1896820068359375, 0.19676971435546875, 0.203857421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 11.0, 7.0, 12.0, 14.0, 18.0, 25.0, 36.0, 51.0, 48.0, 76.0, 114.0, 124.0, 165.0, 217.0, 270.0, 370.0, 393.0, 402.0, 349.0, 313.0, 257.0, 181.0, 170.0, 137.0, 72.0, 63.0, 44.0, 47.0, 29.0, 19.0, 11.0, 9.0, 7.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18651390075683594, -0.18052291870117188, -0.1745319366455078, -0.16854095458984375, -0.1625499725341797, -0.15655899047851562, -0.15056800842285156, -0.1445770263671875, -0.13858604431152344, -0.13259506225585938, -0.1266040802001953, -0.12061309814453125, -0.11462211608886719, -0.10863113403320312, -0.10264015197753906, -0.096649169921875, -0.09065818786621094, -0.08466720581054688, -0.07867622375488281, -0.07268524169921875, -0.06669425964355469, -0.060703277587890625, -0.05471229553222656, -0.0487213134765625, -0.04273033142089844, -0.036739349365234375, -0.030748367309570312, -0.02475738525390625, -0.018766403198242188, -0.012775421142578125, -0.0067844390869140625, -0.00079345703125, 0.0051975250244140625, 0.011188507080078125, 0.017179489135742188, 0.02317047119140625, 0.029161453247070312, 0.035152435302734375, 0.04114341735839844, 0.0471343994140625, 0.05312538146972656, 0.059116363525390625, 0.06510734558105469, 0.07109832763671875, 0.07708930969238281, 0.08308029174804688, 0.08907127380371094, 0.095062255859375, 0.10105323791503906, 0.10704421997070312, 0.11303520202636719, 0.11902618408203125, 0.1250171661376953, 0.13100814819335938, 0.13699913024902344, 0.1429901123046875, 0.14898109436035156, 0.15497207641601562, 0.1609630584716797, 0.16695404052734375, 0.1729450225830078, 0.17893600463867188, 0.18492698669433594, 0.19091796875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 15.0, 52.0, 106.0, 192.0, 223.0, 189.0, 125.0, 61.0, 26.0, 11.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.874919891357422, -3.801196575164795, -3.727473258972168, -3.65375018119812, -3.580026865005493, -3.506303548812866, -3.4325804710388184, -3.3588571548461914, -3.2851338386535645, -3.2114105224609375, -3.1376872062683105, -3.0639641284942627, -2.9902408123016357, -2.916517496109009, -2.842794418334961, -2.769071102142334, -2.695347785949707, -2.62162446975708, -2.547901153564453, -2.4741780757904053, -2.4004547595977783, -2.3267314434051514, -2.2530083656311035, -2.1792850494384766, -2.1055617332458496, -2.0318384170532227, -1.9581152200698853, -1.8843920230865479, -1.810668706893921, -1.736945390701294, -1.6632221937179565, -1.5894989967346191, -1.5157756805419922, -1.4420523643493652, -1.3683291673660278, -1.2946059703826904, -1.2208826541900635, -1.1471593379974365, -1.0734361410140991, -0.9997128844261169, -0.9259896874427795, -0.8522664308547974, -0.7785431742668152, -0.704819917678833, -0.6310966610908508, -0.5573734045028687, -0.4836501479148865, -0.4099268913269043, -0.3362036347389221, -0.26248037815093994, -0.18875712156295776, -0.11503386497497559, -0.04131060838699341, 0.03241264820098877, 0.10613590478897095, 0.17985916137695312, 0.2535824179649353, 0.3273056745529175, 0.40102893114089966, 0.47475218772888184, 0.548475444316864, 0.6221987009048462, 0.6959219574928284, 0.7696452140808105, 0.8433684706687927]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 4.0, 4.0, 8.0, 7.0, 8.0, 13.0, 12.0, 12.0, 19.0, 12.0, 24.0, 33.0, 35.0, 36.0, 33.0, 47.0, 39.0, 39.0, 43.0, 36.0, 52.0, 37.0, 30.0, 48.0, 33.0, 29.0, 51.0, 38.0, 38.0, 35.0, 24.0, 19.0, 15.0, 19.0, 7.0, 18.0, 11.0, 5.0, 6.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.661861002445221, -0.6409622430801392, -0.6200634837150574, -0.5991647243499756, -0.5782659649848938, -0.557367205619812, -0.5364683866500854, -0.5155696272850037, -0.4946708679199219, -0.4737721085548401, -0.4528733491897583, -0.4319745898246765, -0.41107580065727234, -0.39017704129219055, -0.36927828192710876, -0.3483794927597046, -0.3274807631969452, -0.3065820038318634, -0.2856832444667816, -0.26478445529937744, -0.24388569593429565, -0.22298693656921387, -0.20208817720413208, -0.1811894029378891, -0.1602906435728073, -0.13939188420772552, -0.11849310994148254, -0.09759435057640076, -0.07669558376073837, -0.05579681694507599, -0.0348980575799942, -0.01399928331375122, 0.006899476051330566, 0.0277982410043478, 0.048697005957365036, 0.06959576904773712, 0.0904945358633995, 0.11139330267906189, 0.13229206204414368, 0.15319083631038666, 0.17408959567546844, 0.19498835504055023, 0.2158871293067932, 0.236785888671875, 0.2576846480369568, 0.2785834074020386, 0.29948216676712036, 0.32038095593452454, 0.3412797152996063, 0.3621784746646881, 0.3830772340297699, 0.4039760231971741, 0.42487478256225586, 0.44577354192733765, 0.46667230129241943, 0.4875710606575012, 0.508469820022583, 0.5293685793876648, 0.5502673387527466, 0.5711660981178284, 0.5920648574829102, 0.6129636764526367, 0.6338623762130737, 0.6547611951828003, 0.6756599545478821]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 12.0, 25.0, 30.0, 61.0, 91.0, 181.0, 317.0, 561.0, 959.0, 1781.0, 3366.0, 6408.0, 12381.0, 24849.0, 50923.0, 103512.0, 183665.0, 241774.0, 194216.0, 111886.0, 56277.0, 26977.0, 13496.0, 6747.0, 3598.0, 2017.0, 1091.0, 553.0, 302.0, 196.0, 100.0, 65.0, 35.0, 28.0, 21.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2724609375, -0.2638282775878906, -0.25519561767578125, -0.24656295776367188, -0.2379302978515625, -0.22929763793945312, -0.22066497802734375, -0.21203231811523438, -0.203399658203125, -0.19476699829101562, -0.18613433837890625, -0.17750167846679688, -0.1688690185546875, -0.16023635864257812, -0.15160369873046875, -0.14297103881835938, -0.13433837890625, -0.12570571899414062, -0.11707305908203125, -0.10844039916992188, -0.0998077392578125, -0.09117507934570312, -0.08254241943359375, -0.07390975952148438, -0.065277099609375, -0.056644439697265625, -0.04801177978515625, -0.039379119873046875, -0.0307464599609375, -0.022113800048828125, -0.01348114013671875, -0.004848480224609375, 0.0037841796875, 0.012416839599609375, 0.02104949951171875, 0.029682159423828125, 0.0383148193359375, 0.046947479248046875, 0.05558013916015625, 0.06421279907226562, 0.072845458984375, 0.08147811889648438, 0.09011077880859375, 0.09874343872070312, 0.1073760986328125, 0.11600875854492188, 0.12464141845703125, 0.13327407836914062, 0.14190673828125, 0.15053939819335938, 0.15917205810546875, 0.16780471801757812, 0.1764373779296875, 0.18507003784179688, 0.19370269775390625, 0.20233535766601562, 0.210968017578125, 0.21960067749023438, 0.22823333740234375, 0.23686599731445312, 0.2454986572265625, 0.2541313171386719, 0.26276397705078125, 0.2713966369628906, 0.280029296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 1.0, 4.0, 6.0, 12.0, 7.0, 12.0, 25.0, 18.0, 37.0, 42.0, 29.0, 35.0, 39.0, 51.0, 49.0, 50.0, 51.0, 50.0, 47.0, 41.0, 43.0, 35.0, 55.0, 46.0, 38.0, 28.0, 22.0, 36.0, 22.0, 10.0, 15.0, 16.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.133056640625, -0.12950992584228516, -0.1259632110595703, -0.12241649627685547, -0.11886978149414062, -0.11532306671142578, -0.11177635192871094, -0.1082296371459961, -0.10468292236328125, -0.1011362075805664, -0.09758949279785156, -0.09404277801513672, -0.09049606323242188, -0.08694934844970703, -0.08340263366699219, -0.07985591888427734, -0.0763092041015625, -0.07276248931884766, -0.06921577453613281, -0.06566905975341797, -0.062122344970703125, -0.05857563018798828, -0.05502891540527344, -0.051482200622558594, -0.04793548583984375, -0.044388771057128906, -0.04084205627441406, -0.03729534149169922, -0.033748626708984375, -0.03020191192626953, -0.026655197143554688, -0.023108482360839844, -0.019561767578125, -0.016015052795410156, -0.012468338012695312, -0.008921623229980469, -0.005374908447265625, -0.0018281936645507812, 0.0017185211181640625, 0.005265235900878906, 0.00881195068359375, 0.012358665466308594, 0.015905380249023438, 0.01945209503173828, 0.022998809814453125, 0.02654552459716797, 0.030092239379882812, 0.033638954162597656, 0.0371856689453125, 0.040732383728027344, 0.04427909851074219, 0.04782581329345703, 0.051372528076171875, 0.05491924285888672, 0.05846595764160156, 0.062012672424316406, 0.06555938720703125, 0.0691061019897461, 0.07265281677246094, 0.07619953155517578, 0.07974624633789062, 0.08329296112060547, 0.08683967590332031, 0.09038639068603516, 0.09393310546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 6.0, 13.0, 15.0, 40.0, 41.0, 50.0, 66.0, 114.0, 138.0, 202.0, 317.0, 533.0, 920.0, 1659.0, 3438.0, 7167.0, 15560.0, 34657.0, 74910.0, 145387.0, 226879.0, 233116.0, 152508.0, 80570.0, 37772.0, 16770.0, 7591.0, 3632.0, 1805.0, 918.0, 585.0, 326.0, 264.0, 158.0, 116.0, 85.0, 63.0, 53.0, 35.0, 22.0, 17.0, 11.0, 10.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262939453125, -0.2544708251953125, -0.246002197265625, -0.2375335693359375, -0.22906494140625, -0.2205963134765625, -0.212127685546875, -0.2036590576171875, -0.1951904296875, -0.1867218017578125, -0.178253173828125, -0.1697845458984375, -0.16131591796875, -0.1528472900390625, -0.144378662109375, -0.1359100341796875, -0.12744140625, -0.1189727783203125, -0.110504150390625, -0.1020355224609375, -0.09356689453125, -0.0850982666015625, -0.076629638671875, -0.0681610107421875, -0.0596923828125, -0.0512237548828125, -0.042755126953125, -0.0342864990234375, -0.02581787109375, -0.0173492431640625, -0.008880615234375, -0.0004119873046875, 0.008056640625, 0.0165252685546875, 0.024993896484375, 0.0334625244140625, 0.04193115234375, 0.0503997802734375, 0.058868408203125, 0.0673370361328125, 0.0758056640625, 0.0842742919921875, 0.092742919921875, 0.1012115478515625, 0.10968017578125, 0.1181488037109375, 0.126617431640625, 0.1350860595703125, 0.1435546875, 0.1520233154296875, 0.160491943359375, 0.1689605712890625, 0.17742919921875, 0.1858978271484375, 0.194366455078125, 0.2028350830078125, 0.2113037109375, 0.2197723388671875, 0.228240966796875, 0.2367095947265625, 0.24517822265625, 0.2536468505859375, 0.262115478515625, 0.2705841064453125, 0.279052734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 6.0, 1.0, 7.0, 10.0, 10.0, 9.0, 10.0, 12.0, 8.0, 11.0, 18.0, 33.0, 23.0, 28.0, 22.0, 34.0, 48.0, 40.0, 25.0, 36.0, 24.0, 26.0, 46.0, 32.0, 40.0, 33.0, 35.0, 46.0, 33.0, 30.0, 27.0, 37.0, 36.0, 21.0, 17.0, 20.0, 23.0, 10.0, 11.0, 4.0, 9.0, 12.0, 6.0, 11.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.26171875, -0.25424766540527344, -0.24677658081054688, -0.2393054962158203, -0.23183441162109375, -0.2243633270263672, -0.21689224243164062, -0.20942115783691406, -0.2019500732421875, -0.19447898864746094, -0.18700790405273438, -0.1795368194580078, -0.17206573486328125, -0.1645946502685547, -0.15712356567382812, -0.14965248107910156, -0.142181396484375, -0.13471031188964844, -0.12723922729492188, -0.11976814270019531, -0.11229705810546875, -0.10482597351074219, -0.09735488891601562, -0.08988380432128906, -0.0824127197265625, -0.07494163513183594, -0.06747055053710938, -0.05999946594238281, -0.05252838134765625, -0.04505729675292969, -0.037586212158203125, -0.030115127563476562, -0.02264404296875, -0.015172958374023438, -0.007701873779296875, -0.0002307891845703125, 0.00724029541015625, 0.014711380004882812, 0.022182464599609375, 0.029653549194335938, 0.0371246337890625, 0.04459571838378906, 0.052066802978515625, 0.05953788757324219, 0.06700897216796875, 0.07448005676269531, 0.08195114135742188, 0.08942222595214844, 0.096893310546875, 0.10436439514160156, 0.11183547973632812, 0.11930656433105469, 0.12677764892578125, 0.1342487335205078, 0.14171981811523438, 0.14919090270996094, 0.1566619873046875, 0.16413307189941406, 0.17160415649414062, 0.1790752410888672, 0.18654632568359375, 0.1940174102783203, 0.20148849487304688, 0.20895957946777344, 0.2164306640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 16.0, 18.0, 34.0, 68.0, 112.0, 271.0, 700.0, 1880.0, 6061.0, 22966.0, 99122.0, 343345.0, 397231.0, 134111.0, 30716.0, 7995.0, 2377.0, 882.0, 314.0, 162.0, 74.0, 38.0, 25.0, 11.0, 5.0, 2.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.150634765625, -0.14594268798828125, -0.1412506103515625, -0.13655853271484375, -0.131866455078125, -0.12717437744140625, -0.1224822998046875, -0.11779022216796875, -0.11309814453125, -0.10840606689453125, -0.1037139892578125, -0.09902191162109375, -0.094329833984375, -0.08963775634765625, -0.0849456787109375, -0.08025360107421875, -0.0755615234375, -0.07086944580078125, -0.0661773681640625, -0.06148529052734375, -0.056793212890625, -0.05210113525390625, -0.0474090576171875, -0.04271697998046875, -0.03802490234375, -0.03333282470703125, -0.0286407470703125, -0.02394866943359375, -0.019256591796875, -0.01456451416015625, -0.0098724365234375, -0.00518035888671875, -0.00048828125, 0.00420379638671875, 0.0088958740234375, 0.01358795166015625, 0.018280029296875, 0.02297210693359375, 0.0276641845703125, 0.03235626220703125, 0.03704833984375, 0.04174041748046875, 0.0464324951171875, 0.05112457275390625, 0.055816650390625, 0.06050872802734375, 0.0652008056640625, 0.06989288330078125, 0.0745849609375, 0.07927703857421875, 0.0839691162109375, 0.08866119384765625, 0.093353271484375, 0.09804534912109375, 0.1027374267578125, 0.10742950439453125, 0.11212158203125, 0.11681365966796875, 0.1215057373046875, 0.12619781494140625, 0.130889892578125, 0.13558197021484375, 0.1402740478515625, 0.14496612548828125, 0.149658203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 2.0, 7.0, 6.0, 10.0, 8.0, 15.0, 15.0, 23.0, 37.0, 28.0, 49.0, 51.0, 70.0, 78.0, 86.0, 84.0, 69.0, 77.0, 62.0, 48.0, 39.0, 35.0, 18.0, 20.0, 16.0, 7.0, 7.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.288818359375e-05, -2.215523272752762e-05, -2.1422281861305237e-05, -2.0689330995082855e-05, -1.9956380128860474e-05, -1.9223429262638092e-05, -1.849047839641571e-05, -1.775752753019333e-05, -1.7024576663970947e-05, -1.6291625797748566e-05, -1.5558674931526184e-05, -1.4825724065303802e-05, -1.4092773199081421e-05, -1.335982233285904e-05, -1.2626871466636658e-05, -1.1893920600414276e-05, -1.1160969734191895e-05, -1.0428018867969513e-05, -9.695068001747131e-06, -8.96211713552475e-06, -8.229166269302368e-06, -7.4962154030799866e-06, -6.763264536857605e-06, -6.030313670635223e-06, -5.297362804412842e-06, -4.56441193819046e-06, -3.831461071968079e-06, -3.098510205745697e-06, -2.3655593395233154e-06, -1.6326084733009338e-06, -8.996576070785522e-07, -1.6670674085617065e-07, 5.662441253662109e-07, 1.2991949915885925e-06, 2.032145857810974e-06, 2.7650967240333557e-06, 3.4980475902557373e-06, 4.230998456478119e-06, 4.9639493227005005e-06, 5.696900188922882e-06, 6.429851055145264e-06, 7.162801921367645e-06, 7.895752787590027e-06, 8.628703653812408e-06, 9.36165452003479e-06, 1.0094605386257172e-05, 1.0827556252479553e-05, 1.1560507118701935e-05, 1.2293457984924316e-05, 1.3026408851146698e-05, 1.375935971736908e-05, 1.4492310583591461e-05, 1.5225261449813843e-05, 1.5958212316036224e-05, 1.6691163182258606e-05, 1.7424114048480988e-05, 1.815706491470337e-05, 1.889001578092575e-05, 1.9622966647148132e-05, 2.0355917513370514e-05, 2.1088868379592896e-05, 2.1821819245815277e-05, 2.255477011203766e-05, 2.328772097826004e-05, 2.4020671844482422e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 14.0, 23.0, 35.0, 50.0, 98.0, 189.0, 312.0, 668.0, 1405.0, 3967.0, 13224.0, 47966.0, 179690.0, 402722.0, 281803.0, 83804.0, 22093.0, 6460.0, 2189.0, 860.0, 419.0, 197.0, 134.0, 79.0, 55.0, 25.0, 17.0, 13.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.14937305450439453, -0.14530372619628906, -0.1412343978881836, -0.13716506958007812, -0.13309574127197266, -0.1290264129638672, -0.12495708465576172, -0.12088775634765625, -0.11681842803955078, -0.11274909973144531, -0.10867977142333984, -0.10461044311523438, -0.1005411148071289, -0.09647178649902344, -0.09240245819091797, -0.0883331298828125, -0.08426380157470703, -0.08019447326660156, -0.0761251449584961, -0.07205581665039062, -0.06798648834228516, -0.06391716003417969, -0.05984783172607422, -0.05577850341796875, -0.05170917510986328, -0.04763984680175781, -0.043570518493652344, -0.039501190185546875, -0.035431861877441406, -0.03136253356933594, -0.02729320526123047, -0.023223876953125, -0.01915454864501953, -0.015085220336914062, -0.011015892028808594, -0.006946563720703125, -0.0028772354125976562, 0.0011920928955078125, 0.005261421203613281, 0.00933074951171875, 0.013400077819824219, 0.017469406127929688, 0.021538734436035156, 0.025608062744140625, 0.029677391052246094, 0.03374671936035156, 0.03781604766845703, 0.0418853759765625, 0.04595470428466797, 0.05002403259277344, 0.054093360900878906, 0.058162689208984375, 0.062232017517089844, 0.06630134582519531, 0.07037067413330078, 0.07444000244140625, 0.07850933074951172, 0.08257865905761719, 0.08664798736572266, 0.09071731567382812, 0.0947866439819336, 0.09885597229003906, 0.10292530059814453, 0.10699462890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 8.0, 3.0, 13.0, 10.0, 13.0, 14.0, 13.0, 25.0, 34.0, 39.0, 43.0, 53.0, 60.0, 61.0, 62.0, 60.0, 74.0, 63.0, 68.0, 32.0, 46.0, 49.0, 43.0, 25.0, 14.0, 24.0, 4.0, 8.0, 9.0, 9.0, 5.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06589603424072266, -0.06367683410644531, -0.06145763397216797, -0.059238433837890625, -0.05701923370361328, -0.05480003356933594, -0.052580833435058594, -0.05036163330078125, -0.048142433166503906, -0.04592323303222656, -0.04370403289794922, -0.041484832763671875, -0.03926563262939453, -0.03704643249511719, -0.034827232360839844, -0.0326080322265625, -0.030388832092285156, -0.028169631958007812, -0.02595043182373047, -0.023731231689453125, -0.02151203155517578, -0.019292831420898438, -0.017073631286621094, -0.01485443115234375, -0.012635231018066406, -0.010416030883789062, -0.008196830749511719, -0.005977630615234375, -0.0037584304809570312, -0.0015392303466796875, 0.0006799697875976562, 0.002899169921875, 0.005118370056152344, 0.0073375701904296875, 0.009556770324707031, 0.011775970458984375, 0.013995170593261719, 0.016214370727539062, 0.018433570861816406, 0.02065277099609375, 0.022871971130371094, 0.025091171264648438, 0.02731037139892578, 0.029529571533203125, 0.03174877166748047, 0.03396797180175781, 0.036187171936035156, 0.0384063720703125, 0.040625572204589844, 0.04284477233886719, 0.04506397247314453, 0.047283172607421875, 0.04950237274169922, 0.05172157287597656, 0.053940773010253906, 0.05615997314453125, 0.058379173278808594, 0.06059837341308594, 0.06281757354736328, 0.06503677368164062, 0.06725597381591797, 0.06947517395019531, 0.07169437408447266, 0.07391357421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 30.0, 111.0, 261.0, 327.0, 181.0, 78.0, 11.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.086669445037842, -2.9812710285186768, -2.875872850418091, -2.770474433898926, -2.6650760173797607, -2.5596776008605957, -2.4542794227600098, -2.3488810062408447, -2.2434825897216797, -2.1380841732025146, -2.0326859951019287, -1.9272875785827637, -1.8218891620635986, -1.7164908647537231, -1.6110925674438477, -1.5056941509246826, -1.4002959728240967, -1.2948976755142212, -1.1894992589950562, -1.0841009616851807, -0.9787026047706604, -0.8733042478561401, -0.7679059505462646, -0.6625075936317444, -0.5571092367172241, -0.45171087980270386, -0.346312552690506, -0.2409142255783081, -0.13551586866378784, -0.030117511749267578, 0.07528078556060791, 0.18067914247512817, 0.28607726097106934, 0.3914756178855896, 0.4968739449977875, 0.6022722721099854, 0.7076706290245056, 0.8130689859390259, 0.9184672832489014, 1.0238656997680664, 1.129263997077942, 1.2346622943878174, 1.3400607109069824, 1.445459008216858, 1.5508573055267334, 1.6562557220458984, 1.761654019355774, 1.8670523166656494, 1.9724507331848145, 2.0778491497039795, 2.1832473278045654, 2.2886457443237305, 2.3940441608428955, 2.4994425773620605, 2.6048407554626465, 2.7102391719818115, 2.8156375885009766, 2.9210360050201416, 3.0264341831207275, 3.1318325996398926, 3.2372310161590576, 3.3426294326782227, 3.4480276107788086, 3.5534260272979736, 3.6588242053985596]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 6.0, 3.0, 9.0, 12.0, 12.0, 23.0, 28.0, 28.0, 25.0, 27.0, 47.0, 33.0, 42.0, 49.0, 52.0, 49.0, 40.0, 49.0, 65.0, 41.0, 53.0, 35.0, 39.0, 39.0, 38.0, 28.0, 28.0, 22.0, 15.0, 18.0, 15.0, 6.0, 10.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7350797057151794, -0.7062202095985413, -0.6773606538772583, -0.6485011577606201, -0.6196416616439819, -0.5907821655273438, -0.5619226694107056, -0.5330631136894226, -0.5042036175727844, -0.47534412145614624, -0.44648459553718567, -0.4176250696182251, -0.3887655735015869, -0.35990607738494873, -0.33104655146598816, -0.3021870255470276, -0.2733275294303894, -0.24446801841259003, -0.21560850739479065, -0.18674899637699127, -0.1578894853591919, -0.12902997434139252, -0.10017046332359314, -0.07131095230579376, -0.042451441287994385, -0.013591930270195007, 0.01526758074760437, 0.04412709176540375, 0.07298660278320312, 0.1018461138010025, 0.13070562481880188, 0.15956513583660126, 0.18842458724975586, 0.21728409826755524, 0.24614360928535461, 0.2750031352043152, 0.30386263132095337, 0.33272212743759155, 0.3615816533565521, 0.3904411792755127, 0.4193006753921509, 0.44816017150878906, 0.47701969742774963, 0.5058792233467102, 0.5347387194633484, 0.5635982155799866, 0.5924577713012695, 0.6213172674179077, 0.6501767635345459, 0.6790362596511841, 0.7078957557678223, 0.7367553114891052, 0.7656148076057434, 0.7944743037223816, 0.8233338594436646, 0.8521933555603027, 0.8810528516769409, 0.9099123477935791, 0.9387718439102173, 0.9676313996315002, 0.9964908957481384, 1.0253504514694214, 1.0542099475860596, 1.0830694437026978, 1.111928939819336]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 14.0, 7.0, 12.0, 29.0, 35.0, 40.0, 65.0, 78.0, 107.0, 187.0, 233.0, 415.0, 639.0, 993.0, 1567.0, 2776.0, 4446.0, 8431.0, 15537.0, 31299.0, 67415.0, 166003.0, 501450.0, 1272089.0, 1301510.0, 510362.0, 171747.0, 69329.0, 32166.0, 15719.0, 8500.0, 4453.0, 2635.0, 1490.0, 940.0, 568.0, 373.0, 234.0, 154.0, 99.0, 44.0, 27.0, 18.0, 18.0, 9.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1473388671875, -0.14313030242919922, -0.13892173767089844, -0.13471317291259766, -0.13050460815429688, -0.1262960433959961, -0.12208747863769531, -0.11787891387939453, -0.11367034912109375, -0.10946178436279297, -0.10525321960449219, -0.1010446548461914, -0.09683609008789062, -0.09262752532958984, -0.08841896057128906, -0.08421039581298828, -0.0800018310546875, -0.07579326629638672, -0.07158470153808594, -0.06737613677978516, -0.06316757202148438, -0.058959007263183594, -0.05475044250488281, -0.05054187774658203, -0.04633331298828125, -0.04212474822998047, -0.03791618347167969, -0.033707618713378906, -0.029499053955078125, -0.025290489196777344, -0.021081924438476562, -0.01687335968017578, -0.012664794921875, -0.008456230163574219, -0.0042476654052734375, -3.910064697265625e-05, 0.004169464111328125, 0.008378028869628906, 0.012586593627929688, 0.01679515838623047, 0.02100372314453125, 0.02521228790283203, 0.029420852661132812, 0.033629417419433594, 0.037837982177734375, 0.042046546936035156, 0.04625511169433594, 0.05046367645263672, 0.0546722412109375, 0.05888080596923828, 0.06308937072753906, 0.06729793548583984, 0.07150650024414062, 0.0757150650024414, 0.07992362976074219, 0.08413219451904297, 0.08834075927734375, 0.09254932403564453, 0.09675788879394531, 0.1009664535522461, 0.10517501831054688, 0.10938358306884766, 0.11359214782714844, 0.11780071258544922, 0.12200927734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 9.0, 6.0, 14.0, 13.0, 13.0, 21.0, 13.0, 21.0, 32.0, 30.0, 35.0, 31.0, 41.0, 47.0, 50.0, 52.0, 47.0, 37.0, 44.0, 49.0, 38.0, 40.0, 35.0, 24.0, 35.0, 32.0, 28.0, 30.0, 19.0, 20.0, 11.0, 21.0, 15.0, 14.0, 6.0, 7.0, 2.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.104736328125, -0.10153865814208984, -0.09834098815917969, -0.09514331817626953, -0.09194564819335938, -0.08874797821044922, -0.08555030822753906, -0.0823526382446289, -0.07915496826171875, -0.0759572982788086, -0.07275962829589844, -0.06956195831298828, -0.06636428833007812, -0.06316661834716797, -0.05996894836425781, -0.056771278381347656, -0.0535736083984375, -0.050375938415527344, -0.04717826843261719, -0.04398059844970703, -0.040782928466796875, -0.03758525848388672, -0.03438758850097656, -0.031189918518066406, -0.02799224853515625, -0.024794578552246094, -0.021596908569335938, -0.01839923858642578, -0.015201568603515625, -0.012003898620605469, -0.008806228637695312, -0.005608558654785156, -0.002410888671875, 0.0007867813110351562, 0.0039844512939453125, 0.007182121276855469, 0.010379791259765625, 0.013577461242675781, 0.016775131225585938, 0.019972801208496094, 0.02317047119140625, 0.026368141174316406, 0.029565811157226562, 0.03276348114013672, 0.035961151123046875, 0.03915882110595703, 0.04235649108886719, 0.045554161071777344, 0.0487518310546875, 0.051949501037597656, 0.05514717102050781, 0.05834484100341797, 0.061542510986328125, 0.06474018096923828, 0.06793785095214844, 0.0711355209350586, 0.07433319091796875, 0.0775308609008789, 0.08072853088378906, 0.08392620086669922, 0.08712387084960938, 0.09032154083251953, 0.09351921081542969, 0.09671688079833984, 0.09991455078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 8.0, 22.0, 24.0, 43.0, 40.0, 103.0, 168.0, 286.0, 667.0, 1836.0, 5293.0, 18770.0, 71141.0, 309187.0, 1385003.0, 1814398.0, 449506.0, 101490.0, 25072.0, 7238.0, 2289.0, 841.0, 377.0, 190.0, 117.0, 45.0, 38.0, 24.0, 10.0, 14.0, 11.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24860382080078125, -0.2406158447265625, -0.23262786865234375, -0.224639892578125, -0.21665191650390625, -0.2086639404296875, -0.20067596435546875, -0.19268798828125, -0.18470001220703125, -0.1767120361328125, -0.16872406005859375, -0.160736083984375, -0.15274810791015625, -0.1447601318359375, -0.13677215576171875, -0.1287841796875, -0.12079620361328125, -0.1128082275390625, -0.10482025146484375, -0.096832275390625, -0.08884429931640625, -0.0808563232421875, -0.07286834716796875, -0.06488037109375, -0.05689239501953125, -0.0489044189453125, -0.04091644287109375, -0.032928466796875, -0.02494049072265625, -0.0169525146484375, -0.00896453857421875, -0.0009765625, 0.00701141357421875, 0.0149993896484375, 0.02298736572265625, 0.030975341796875, 0.03896331787109375, 0.0469512939453125, 0.05493927001953125, 0.06292724609375, 0.07091522216796875, 0.0789031982421875, 0.08689117431640625, 0.094879150390625, 0.10286712646484375, 0.1108551025390625, 0.11884307861328125, 0.1268310546875, 0.13481903076171875, 0.1428070068359375, 0.15079498291015625, 0.158782958984375, 0.16677093505859375, 0.1747589111328125, 0.18274688720703125, 0.19073486328125, 0.19872283935546875, 0.2067108154296875, 0.21469879150390625, 0.222686767578125, 0.23067474365234375, 0.2386627197265625, 0.24665069580078125, 0.254638671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 15.0, 15.0, 19.0, 21.0, 33.0, 49.0, 63.0, 76.0, 127.0, 138.0, 157.0, 230.0, 276.0, 331.0, 410.0, 410.0, 351.0, 281.0, 229.0, 187.0, 155.0, 134.0, 88.0, 59.0, 43.0, 38.0, 31.0, 27.0, 21.0, 16.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1898193359375, -0.1842632293701172, -0.17870712280273438, -0.17315101623535156, -0.16759490966796875, -0.16203880310058594, -0.15648269653320312, -0.1509265899658203, -0.1453704833984375, -0.1398143768310547, -0.13425827026367188, -0.12870216369628906, -0.12314605712890625, -0.11758995056152344, -0.11203384399414062, -0.10647773742675781, -0.100921630859375, -0.09536552429199219, -0.08980941772460938, -0.08425331115722656, -0.07869720458984375, -0.07314109802246094, -0.06758499145507812, -0.06202888488769531, -0.0564727783203125, -0.05091667175292969, -0.045360565185546875, -0.03980445861816406, -0.03424835205078125, -0.028692245483398438, -0.023136138916015625, -0.017580032348632812, -0.01202392578125, -0.0064678192138671875, -0.000911712646484375, 0.0046443939208984375, 0.01020050048828125, 0.015756607055664062, 0.021312713623046875, 0.026868820190429688, 0.0324249267578125, 0.03798103332519531, 0.043537139892578125, 0.04909324645996094, 0.05464935302734375, 0.06020545959472656, 0.06576156616210938, 0.07131767272949219, 0.076873779296875, 0.08242988586425781, 0.08798599243164062, 0.09354209899902344, 0.09909820556640625, 0.10465431213378906, 0.11021041870117188, 0.11576652526855469, 0.1213226318359375, 0.1268787384033203, 0.13243484497070312, 0.13799095153808594, 0.14354705810546875, 0.14910316467285156, 0.15465927124023438, 0.1602153778076172, 0.165771484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 16.0, 20.0, 25.0, 38.0, 61.0, 96.0, 111.0, 115.0, 115.0, 120.0, 95.0, 60.0, 46.0, 30.0, 20.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8820130825042725, -0.841962456703186, -0.8019118309020996, -0.7618612051010132, -0.7218105792999268, -0.6817599534988403, -0.6417093276977539, -0.6016587018966675, -0.561608076095581, -0.5215574502944946, -0.4815068244934082, -0.4414561986923218, -0.40140557289123535, -0.3613549470901489, -0.3213043212890625, -0.2812536954879761, -0.24120306968688965, -0.20115244388580322, -0.1611018180847168, -0.12105119228363037, -0.08100056648254395, -0.04094994068145752, -0.0008993148803710938, 0.03915131092071533, 0.07920193672180176, 0.11925256252288818, 0.1593031883239746, 0.19935381412506104, 0.23940443992614746, 0.2794550657272339, 0.3195056915283203, 0.35955631732940674, 0.3996068239212036, 0.43965744972229004, 0.47970807552337646, 0.5197587013244629, 0.5598093271255493, 0.5998599529266357, 0.6399105787277222, 0.6799612045288086, 0.720011830329895, 0.7600624561309814, 0.8001130819320679, 0.8401637077331543, 0.8802143335342407, 0.9202649593353271, 0.9603155851364136, 1.0003662109375, 1.0404168367385864, 1.0804674625396729, 1.1205180883407593, 1.1605687141418457, 1.2006193399429321, 1.2406699657440186, 1.280720591545105, 1.3207712173461914, 1.3608218431472778, 1.4008724689483643, 1.4409230947494507, 1.480973720550537, 1.5210243463516235, 1.56107497215271, 1.6011255979537964, 1.6411762237548828, 1.6812268495559692]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 5.0, 12.0, 17.0, 11.0, 15.0, 17.0, 10.0, 21.0, 23.0, 28.0, 22.0, 29.0, 30.0, 43.0, 34.0, 37.0, 37.0, 41.0, 44.0, 39.0, 34.0, 35.0, 33.0, 38.0, 38.0, 33.0, 31.0, 26.0, 25.0, 24.0, 17.0, 21.0, 35.0, 10.0, 10.0, 10.0, 11.0, 9.0, 6.0, 4.0, 10.0, 0.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.6030954718589783, -0.5853657126426697, -0.5676358938217163, -0.5499061346054077, -0.5321763157844543, -0.5144465565681458, -0.4967167377471924, -0.4789869785308838, -0.4612571597099304, -0.44352737069129944, -0.42579758167266846, -0.4080677926540375, -0.3903380036354065, -0.3726082146167755, -0.35487842559814453, -0.33714866638183594, -0.31941887736320496, -0.301689088344574, -0.283959299325943, -0.266229510307312, -0.24849972128868103, -0.23076993227005005, -0.21304015815258026, -0.19531036913394928, -0.1775805801153183, -0.15985079109668732, -0.14212100207805634, -0.12439122051000595, -0.10666143149137497, -0.08893164247274399, -0.0712018609046936, -0.05347207188606262, -0.03574228286743164, -0.01801249571144581, -0.0002827085554599762, 0.017447076737880707, 0.03517686575651169, 0.05290665477514267, 0.07063643634319305, 0.08836622536182404, 0.10609601438045502, 0.123825803399086, 0.14155559241771698, 0.15928536653518677, 0.17701515555381775, 0.19474494457244873, 0.2124747335910797, 0.2302045226097107, 0.24793431162834167, 0.26566410064697266, 0.28339388966560364, 0.3011236786842346, 0.3188534677028656, 0.3365832567214966, 0.3543130159378052, 0.37204283475875854, 0.38977259397506714, 0.4075023829936981, 0.4252321720123291, 0.4429619610309601, 0.46069175004959106, 0.47842153906822205, 0.496151328086853, 0.5138810873031616, 0.531610906124115]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 3.0, 7.0, 10.0, 12.0, 19.0, 16.0, 27.0, 41.0, 71.0, 102.0, 173.0, 253.0, 418.0, 708.0, 1254.0, 2132.0, 4076.0, 7234.0, 13056.0, 23778.0, 43876.0, 77518.0, 130588.0, 188748.0, 199790.0, 148343.0, 91025.0, 51599.0, 28677.0, 15411.0, 8616.0, 4700.0, 2537.0, 1511.0, 866.0, 497.0, 301.0, 190.0, 118.0, 85.0, 50.0, 41.0, 27.0, 17.0, 12.0, 8.0, 9.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.22900390625, -0.22266769409179688, -0.21633148193359375, -0.20999526977539062, -0.2036590576171875, -0.19732284545898438, -0.19098663330078125, -0.18465042114257812, -0.178314208984375, -0.17197799682617188, -0.16564178466796875, -0.15930557250976562, -0.1529693603515625, -0.14663314819335938, -0.14029693603515625, -0.13396072387695312, -0.12762451171875, -0.12128829956054688, -0.11495208740234375, -0.10861587524414062, -0.1022796630859375, -0.09594345092773438, -0.08960723876953125, -0.08327102661132812, -0.076934814453125, -0.07059860229492188, -0.06426239013671875, -0.057926177978515625, -0.0515899658203125, -0.045253753662109375, -0.03891754150390625, -0.032581329345703125, -0.0262451171875, -0.019908905029296875, -0.01357269287109375, -0.007236480712890625, -0.0009002685546875, 0.005435943603515625, 0.01177215576171875, 0.018108367919921875, 0.024444580078125, 0.030780792236328125, 0.03711700439453125, 0.043453216552734375, 0.0497894287109375, 0.056125640869140625, 0.06246185302734375, 0.06879806518554688, 0.07513427734375, 0.08147048950195312, 0.08780670166015625, 0.09414291381835938, 0.1004791259765625, 0.10681533813476562, 0.11315155029296875, 0.11948776245117188, 0.125823974609375, 0.13216018676757812, 0.13849639892578125, 0.14483261108398438, 0.1511688232421875, 0.15750503540039062, 0.16384124755859375, 0.17017745971679688, 0.176513671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 15.0, 12.0, 12.0, 30.0, 23.0, 25.0, 29.0, 28.0, 47.0, 37.0, 38.0, 52.0, 46.0, 49.0, 39.0, 57.0, 45.0, 36.0, 39.0, 46.0, 26.0, 22.0, 33.0, 35.0, 27.0, 30.0, 26.0, 18.0, 10.0, 16.0, 8.0, 9.0, 12.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.12005615234375, -0.11682987213134766, -0.11360359191894531, -0.11037731170654297, -0.10715103149414062, -0.10392475128173828, -0.10069847106933594, -0.0974721908569336, -0.09424591064453125, -0.0910196304321289, -0.08779335021972656, -0.08456707000732422, -0.08134078979492188, -0.07811450958251953, -0.07488822937011719, -0.07166194915771484, -0.0684356689453125, -0.06520938873291016, -0.06198310852050781, -0.05875682830810547, -0.055530548095703125, -0.05230426788330078, -0.04907798767089844, -0.045851707458496094, -0.04262542724609375, -0.039399147033691406, -0.03617286682128906, -0.03294658660888672, -0.029720306396484375, -0.02649402618408203, -0.023267745971679688, -0.020041465759277344, -0.016815185546875, -0.013588905334472656, -0.010362625122070312, -0.007136344909667969, -0.003910064697265625, -0.0006837844848632812, 0.0025424957275390625, 0.005768775939941406, 0.00899505615234375, 0.012221336364746094, 0.015447616577148438, 0.01867389678955078, 0.021900177001953125, 0.02512645721435547, 0.028352737426757812, 0.031579017639160156, 0.0348052978515625, 0.038031578063964844, 0.04125785827636719, 0.04448413848876953, 0.047710418701171875, 0.05093669891357422, 0.05416297912597656, 0.057389259338378906, 0.06061553955078125, 0.0638418197631836, 0.06706809997558594, 0.07029438018798828, 0.07352066040039062, 0.07674694061279297, 0.07997322082519531, 0.08319950103759766, 0.08642578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 15.0, 22.0, 28.0, 47.0, 63.0, 97.0, 126.0, 204.0, 342.0, 603.0, 1140.0, 2084.0, 3740.0, 7098.0, 12961.0, 23252.0, 41111.0, 69668.0, 112072.0, 161170.0, 185944.0, 158832.0, 109612.0, 67615.0, 40227.0, 22842.0, 12487.0, 6865.0, 3633.0, 1974.0, 1049.0, 602.0, 341.0, 232.0, 135.0, 102.0, 72.0, 37.0, 25.0, 22.0, 16.0, 10.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.1905994415283203, -0.18454360961914062, -0.17848777770996094, -0.17243194580078125, -0.16637611389160156, -0.16032028198242188, -0.1542644500732422, -0.1482086181640625, -0.1421527862548828, -0.13609695434570312, -0.13004112243652344, -0.12398529052734375, -0.11792945861816406, -0.11187362670898438, -0.10581779479980469, -0.099761962890625, -0.09370613098144531, -0.08765029907226562, -0.08159446716308594, -0.07553863525390625, -0.06948280334472656, -0.06342697143554688, -0.05737113952636719, -0.0513153076171875, -0.04525947570800781, -0.039203643798828125, -0.03314781188964844, -0.02709197998046875, -0.021036148071289062, -0.014980316162109375, -0.008924484252929688, -0.00286865234375, 0.0031871795654296875, 0.009243011474609375, 0.015298843383789062, 0.02135467529296875, 0.027410507202148438, 0.033466339111328125, 0.03952217102050781, 0.0455780029296875, 0.05163383483886719, 0.057689666748046875, 0.06374549865722656, 0.06980133056640625, 0.07585716247558594, 0.08191299438476562, 0.08796882629394531, 0.094024658203125, 0.10008049011230469, 0.10613632202148438, 0.11219215393066406, 0.11824798583984375, 0.12430381774902344, 0.13035964965820312, 0.1364154815673828, 0.1424713134765625, 0.1485271453857422, 0.15458297729492188, 0.16063880920410156, 0.16669464111328125, 0.17275047302246094, 0.17880630493164062, 0.1848621368408203, 0.19091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 7.0, 15.0, 17.0, 19.0, 25.0, 30.0, 23.0, 36.0, 31.0, 42.0, 45.0, 38.0, 47.0, 36.0, 38.0, 37.0, 37.0, 41.0, 57.0, 45.0, 38.0, 31.0, 26.0, 34.0, 30.0, 16.0, 18.0, 22.0, 15.0, 19.0, 16.0, 9.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2529869079589844, -0.24474334716796875, -0.23649978637695312, -0.2282562255859375, -0.22001266479492188, -0.21176910400390625, -0.20352554321289062, -0.195281982421875, -0.18703842163085938, -0.17879486083984375, -0.17055130004882812, -0.1623077392578125, -0.15406417846679688, -0.14582061767578125, -0.13757705688476562, -0.12933349609375, -0.12108993530273438, -0.11284637451171875, -0.10460281372070312, -0.0963592529296875, -0.08811569213867188, -0.07987213134765625, -0.07162857055664062, -0.063385009765625, -0.055141448974609375, -0.04689788818359375, -0.038654327392578125, -0.0304107666015625, -0.022167205810546875, -0.01392364501953125, -0.005680084228515625, 0.0025634765625, 0.010807037353515625, 0.01905059814453125, 0.027294158935546875, 0.0355377197265625, 0.043781280517578125, 0.05202484130859375, 0.060268402099609375, 0.068511962890625, 0.07675552368164062, 0.08499908447265625, 0.09324264526367188, 0.1014862060546875, 0.10972976684570312, 0.11797332763671875, 0.12621688842773438, 0.13446044921875, 0.14270401000976562, 0.15094757080078125, 0.15919113159179688, 0.1674346923828125, 0.17567825317382812, 0.18392181396484375, 0.19216537475585938, 0.200408935546875, 0.20865249633789062, 0.21689605712890625, 0.22513961791992188, 0.2333831787109375, 0.24162673950195312, 0.24987030029296875, 0.2581138610839844, 0.266357421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 5.0, 9.0, 13.0, 36.0, 61.0, 85.0, 190.0, 342.0, 711.0, 1883.0, 5156.0, 15195.0, 48061.0, 138654.0, 290525.0, 307345.0, 156813.0, 55826.0, 18020.0, 5860.0, 2111.0, 881.0, 385.0, 165.0, 93.0, 56.0, 31.0, 9.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.0940542221069336, -0.09081840515136719, -0.08758258819580078, -0.08434677124023438, -0.08111095428466797, -0.07787513732910156, -0.07463932037353516, -0.07140350341796875, -0.06816768646240234, -0.06493186950683594, -0.06169605255126953, -0.058460235595703125, -0.05522441864013672, -0.05198860168457031, -0.048752784729003906, -0.0455169677734375, -0.042281150817871094, -0.03904533386230469, -0.03580951690673828, -0.032573699951171875, -0.02933788299560547, -0.026102066040039062, -0.022866249084472656, -0.01963043212890625, -0.016394615173339844, -0.013158798217773438, -0.009922981262207031, -0.006687164306640625, -0.0034513473510742188, -0.0002155303955078125, 0.0030202865600585938, 0.006256103515625, 0.009491920471191406, 0.012727737426757812, 0.01596355438232422, 0.019199371337890625, 0.02243518829345703, 0.025671005249023438, 0.028906822204589844, 0.03214263916015625, 0.035378456115722656, 0.03861427307128906, 0.04185009002685547, 0.045085906982421875, 0.04832172393798828, 0.05155754089355469, 0.054793357849121094, 0.0580291748046875, 0.061264991760253906, 0.06450080871582031, 0.06773662567138672, 0.07097244262695312, 0.07420825958251953, 0.07744407653808594, 0.08067989349365234, 0.08391571044921875, 0.08715152740478516, 0.09038734436035156, 0.09362316131591797, 0.09685897827148438, 0.10009479522705078, 0.10333061218261719, 0.1065664291381836, 0.10980224609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 12.0, 13.0, 23.0, 28.0, 29.0, 57.0, 45.0, 59.0, 73.0, 69.0, 87.0, 94.0, 85.0, 58.0, 42.0, 40.0, 35.0, 26.0, 27.0, 7.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193450927734375e-05, -2.1209940314292908e-05, -2.0485371351242065e-05, -1.9760802388191223e-05, -1.903623342514038e-05, -1.831166446208954e-05, -1.7587095499038696e-05, -1.6862526535987854e-05, -1.6137957572937012e-05, -1.541338860988617e-05, -1.4688819646835327e-05, -1.3964250683784485e-05, -1.3239681720733643e-05, -1.25151127576828e-05, -1.1790543794631958e-05, -1.1065974831581116e-05, -1.0341405868530273e-05, -9.616836905479431e-06, -8.892267942428589e-06, -8.167698979377747e-06, -7.443130016326904e-06, -6.718561053276062e-06, -5.99399209022522e-06, -5.2694231271743774e-06, -4.544854164123535e-06, -3.820285201072693e-06, -3.0957162380218506e-06, -2.3711472749710083e-06, -1.646578311920166e-06, -9.220093488693237e-07, -1.9744038581848145e-07, 5.271285772323608e-07, 1.2516975402832031e-06, 1.9762665033340454e-06, 2.7008354663848877e-06, 3.42540442943573e-06, 4.149973392486572e-06, 4.8745423555374146e-06, 5.599111318588257e-06, 6.323680281639099e-06, 7.048249244689941e-06, 7.772818207740784e-06, 8.497387170791626e-06, 9.221956133842468e-06, 9.94652509689331e-06, 1.0671094059944153e-05, 1.1395663022994995e-05, 1.2120231986045837e-05, 1.284480094909668e-05, 1.3569369912147522e-05, 1.4293938875198364e-05, 1.5018507838249207e-05, 1.574307680130005e-05, 1.646764576435089e-05, 1.7192214727401733e-05, 1.7916783690452576e-05, 1.8641352653503418e-05, 1.936592161655426e-05, 2.0090490579605103e-05, 2.0815059542655945e-05, 2.1539628505706787e-05, 2.226419746875763e-05, 2.298876643180847e-05, 2.3713335394859314e-05, 2.4437904357910156e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 19.0, 19.0, 28.0, 59.0, 95.0, 205.0, 347.0, 632.0, 1182.0, 2652.0, 5883.0, 13263.0, 29954.0, 65498.0, 128343.0, 205318.0, 231091.0, 176303.0, 100217.0, 48284.0, 21298.0, 9488.0, 4198.0, 2036.0, 1018.0, 492.0, 290.0, 141.0, 73.0, 47.0, 25.0, 11.0, 11.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.05937480926513672, -0.05734825134277344, -0.055321693420410156, -0.053295135498046875, -0.051268577575683594, -0.04924201965332031, -0.04721546173095703, -0.04518890380859375, -0.04316234588623047, -0.04113578796386719, -0.039109230041503906, -0.037082672119140625, -0.035056114196777344, -0.03302955627441406, -0.03100299835205078, -0.0289764404296875, -0.02694988250732422, -0.024923324584960938, -0.022896766662597656, -0.020870208740234375, -0.018843650817871094, -0.016817092895507812, -0.014790534973144531, -0.01276397705078125, -0.010737419128417969, -0.008710861206054688, -0.006684303283691406, -0.004657745361328125, -0.0026311874389648438, -0.0006046295166015625, 0.0014219284057617188, 0.003448486328125, 0.005475044250488281, 0.0075016021728515625, 0.009528160095214844, 0.011554718017578125, 0.013581275939941406, 0.015607833862304688, 0.01763439178466797, 0.01966094970703125, 0.02168750762939453, 0.023714065551757812, 0.025740623474121094, 0.027767181396484375, 0.029793739318847656, 0.03182029724121094, 0.03384685516357422, 0.0358734130859375, 0.03789997100830078, 0.03992652893066406, 0.041953086853027344, 0.043979644775390625, 0.046006202697753906, 0.04803276062011719, 0.05005931854248047, 0.05208587646484375, 0.05411243438720703, 0.05613899230957031, 0.058165550231933594, 0.060192108154296875, 0.062218666076660156, 0.06424522399902344, 0.06627178192138672, 0.06829833984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 12.0, 8.0, 11.0, 29.0, 33.0, 42.0, 42.0, 59.0, 52.0, 57.0, 57.0, 75.0, 69.0, 72.0, 60.0, 51.0, 48.0, 46.0, 32.0, 35.0, 32.0, 19.0, 20.0, 7.0, 9.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06175518035888672, -0.05966758728027344, -0.057579994201660156, -0.055492401123046875, -0.053404808044433594, -0.05131721496582031, -0.04922962188720703, -0.04714202880859375, -0.04505443572998047, -0.04296684265136719, -0.040879249572753906, -0.038791656494140625, -0.036704063415527344, -0.03461647033691406, -0.03252887725830078, -0.0304412841796875, -0.02835369110107422, -0.026266098022460938, -0.024178504943847656, -0.022090911865234375, -0.020003318786621094, -0.017915725708007812, -0.01582813262939453, -0.01374053955078125, -0.011652946472167969, -0.009565353393554688, -0.007477760314941406, -0.005390167236328125, -0.0033025741577148438, -0.0012149810791015625, 0.0008726119995117188, 0.002960205078125, 0.005047798156738281, 0.0071353912353515625, 0.009222984313964844, 0.011310577392578125, 0.013398170471191406, 0.015485763549804688, 0.01757335662841797, 0.01966094970703125, 0.02174854278564453, 0.023836135864257812, 0.025923728942871094, 0.028011322021484375, 0.030098915100097656, 0.03218650817871094, 0.03427410125732422, 0.0363616943359375, 0.03844928741455078, 0.04053688049316406, 0.042624473571777344, 0.044712066650390625, 0.046799659729003906, 0.04888725280761719, 0.05097484588623047, 0.05306243896484375, 0.05515003204345703, 0.05723762512207031, 0.059325218200683594, 0.061412811279296875, 0.06350040435791016, 0.06558799743652344, 0.06767559051513672, 0.06976318359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 8.0, 16.0, 29.0, 57.0, 112.0, 126.0, 192.0, 174.0, 140.0, 60.0, 37.0, 34.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8707690238952637, -0.8124346733093262, -0.7541002631187439, -0.6957659125328064, -0.6374315023422241, -0.5790971517562866, -0.5207628011703491, -0.46242842078208923, -0.40409404039382935, -0.34575966000556946, -0.28742527961730957, -0.22909092903137207, -0.17075654864311218, -0.1124221682548523, -0.054087817668914795, 0.004246562719345093, 0.06258094310760498, 0.12091531604528427, 0.17924968898296356, 0.23758405447006226, 0.29591843485832214, 0.35425281524658203, 0.41258716583251953, 0.4709215462207794, 0.5292559266090393, 0.5875902771949768, 0.6459246873855591, 0.7042590379714966, 0.7625933885574341, 0.8209277987480164, 0.8792621493339539, 0.9375965595245361, 0.9959309101104736, 1.0542652606964111, 1.1125996112823486, 1.1709339618682861, 1.2292684316635132, 1.2876027822494507, 1.3459371328353882, 1.4042714834213257, 1.4626059532165527, 1.5209403038024902, 1.5792746543884277, 1.6376090049743652, 1.6959434747695923, 1.7542778253555298, 1.8126121759414673, 1.8709465265274048, 1.9292808771133423, 1.9876152276992798, 2.045949697494507, 2.1042840480804443, 2.162618398666382, 2.2209527492523193, 2.279287099838257, 2.3376214504241943, 2.395955801010132, 2.4542901515960693, 2.512624502182007, 2.5709588527679443, 2.629293203353882, 2.6876277923583984, 2.745962142944336, 2.8042964935302734, 2.862630844116211]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 1.0, 9.0, 12.0, 8.0, 7.0, 18.0, 12.0, 26.0, 23.0, 35.0, 43.0, 38.0, 36.0, 44.0, 54.0, 53.0, 44.0, 52.0, 58.0, 46.0, 41.0, 43.0, 46.0, 45.0, 16.0, 30.0, 28.0, 18.0, 18.0, 19.0, 13.0, 10.0, 17.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.791124165058136, -0.7636244893074036, -0.7361248135566711, -0.7086251378059387, -0.6811254620552063, -0.6536257863044739, -0.6261261105537415, -0.598626434803009, -0.5711267590522766, -0.5436270833015442, -0.5161274075508118, -0.48862773180007935, -0.4611280560493469, -0.4336283802986145, -0.4061287045478821, -0.37862902879714966, -0.35112935304641724, -0.3236296772956848, -0.2961300015449524, -0.26863032579421997, -0.24113065004348755, -0.21363097429275513, -0.1861312985420227, -0.15863162279129028, -0.13113194704055786, -0.10363227128982544, -0.07613259553909302, -0.048632919788360596, -0.021133244037628174, 0.006366431713104248, 0.03386610746383667, 0.06136578321456909, 0.08886545896530151, 0.11636513471603394, 0.14386481046676636, 0.17136448621749878, 0.1988641619682312, 0.22636383771896362, 0.25386351346969604, 0.28136318922042847, 0.3088628649711609, 0.3363625407218933, 0.36386221647262573, 0.39136189222335815, 0.4188615679740906, 0.446361243724823, 0.4738609194755554, 0.5013605952262878, 0.5288602709770203, 0.5563599467277527, 0.5838596224784851, 0.6113592982292175, 0.63885897397995, 0.6663586497306824, 0.6938583254814148, 0.7213580012321472, 0.7488576769828796, 0.7763573527336121, 0.8038570284843445, 0.8313567042350769, 0.8588563799858093, 0.8863560557365417, 0.9138557314872742, 0.9413554072380066, 0.968855082988739]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 7.0, 12.0, 9.0, 12.0, 15.0, 31.0, 44.0, 50.0, 88.0, 120.0, 223.0, 358.0, 706.0, 1343.0, 2673.0, 5980.0, 15207.0, 43388.0, 154964.0, 817244.0, 2199277.0, 738848.0, 146830.0, 42023.0, 14449.0, 5591.0, 2407.0, 1100.0, 563.0, 289.0, 166.0, 101.0, 48.0, 39.0, 22.0, 15.0, 19.0, 6.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.21142196655273438, -0.20470428466796875, -0.19798660278320312, -0.1912689208984375, -0.18455123901367188, -0.17783355712890625, -0.17111587524414062, -0.164398193359375, -0.15768051147460938, -0.15096282958984375, -0.14424514770507812, -0.1375274658203125, -0.13080978393554688, -0.12409210205078125, -0.11737442016601562, -0.11065673828125, -0.10393905639648438, -0.09722137451171875, -0.09050369262695312, -0.0837860107421875, -0.07706832885742188, -0.07035064697265625, -0.06363296508789062, -0.056915283203125, -0.050197601318359375, -0.04347991943359375, -0.036762237548828125, -0.0300445556640625, -0.023326873779296875, -0.01660919189453125, -0.009891510009765625, -0.003173828125, 0.003543853759765625, 0.01026153564453125, 0.016979217529296875, 0.0236968994140625, 0.030414581298828125, 0.03713226318359375, 0.043849945068359375, 0.050567626953125, 0.057285308837890625, 0.06400299072265625, 0.07072067260742188, 0.0774383544921875, 0.08415603637695312, 0.09087371826171875, 0.09759140014648438, 0.10430908203125, 0.11102676391601562, 0.11774444580078125, 0.12446212768554688, 0.1311798095703125, 0.13789749145507812, 0.14461517333984375, 0.15133285522460938, 0.158050537109375, 0.16476821899414062, 0.17148590087890625, 0.17820358276367188, 0.1849212646484375, 0.19163894653320312, 0.19835662841796875, 0.20507431030273438, 0.2117919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 7.0, 8.0, 12.0, 15.0, 20.0, 26.0, 16.0, 41.0, 39.0, 49.0, 41.0, 44.0, 57.0, 42.0, 49.0, 45.0, 54.0, 53.0, 50.0, 46.0, 39.0, 32.0, 34.0, 44.0, 21.0, 17.0, 23.0, 21.0, 8.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117919921875, -0.11414623260498047, -0.11037254333496094, -0.1065988540649414, -0.10282516479492188, -0.09905147552490234, -0.09527778625488281, -0.09150409698486328, -0.08773040771484375, -0.08395671844482422, -0.08018302917480469, -0.07640933990478516, -0.07263565063476562, -0.0688619613647461, -0.06508827209472656, -0.06131458282470703, -0.0575408935546875, -0.05376720428466797, -0.04999351501464844, -0.046219825744628906, -0.042446136474609375, -0.038672447204589844, -0.03489875793457031, -0.03112506866455078, -0.02735137939453125, -0.02357769012451172, -0.019804000854492188, -0.016030311584472656, -0.012256622314453125, -0.008482933044433594, -0.0047092437744140625, -0.0009355545043945312, 0.002838134765625, 0.006611824035644531, 0.010385513305664062, 0.014159202575683594, 0.017932891845703125, 0.021706581115722656, 0.025480270385742188, 0.02925395965576172, 0.03302764892578125, 0.03680133819580078, 0.04057502746582031, 0.044348716735839844, 0.048122406005859375, 0.051896095275878906, 0.05566978454589844, 0.05944347381591797, 0.0632171630859375, 0.06699085235595703, 0.07076454162597656, 0.0745382308959961, 0.07831192016601562, 0.08208560943603516, 0.08585929870605469, 0.08963298797607422, 0.09340667724609375, 0.09718036651611328, 0.10095405578613281, 0.10472774505615234, 0.10850143432617188, 0.1122751235961914, 0.11604881286621094, 0.11982250213623047, 0.12359619140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 20.0, 27.0, 37.0, 70.0, 193.0, 351.0, 1009.0, 3348.0, 13052.0, 59775.0, 319367.0, 1815096.0, 1632465.0, 280557.0, 52796.0, 11550.0, 3037.0, 919.0, 334.0, 135.0, 65.0, 27.0, 15.0, 15.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2619514465332031, -0.25290679931640625, -0.24386215209960938, -0.2348175048828125, -0.22577285766601562, -0.21672821044921875, -0.20768356323242188, -0.198638916015625, -0.18959426879882812, -0.18054962158203125, -0.17150497436523438, -0.1624603271484375, -0.15341567993164062, -0.14437103271484375, -0.13532638549804688, -0.12628173828125, -0.11723709106445312, -0.10819244384765625, -0.09914779663085938, -0.0901031494140625, -0.08105850219726562, -0.07201385498046875, -0.06296920776367188, -0.053924560546875, -0.044879913330078125, -0.03583526611328125, -0.026790618896484375, -0.0177459716796875, -0.008701324462890625, 0.00034332275390625, 0.009387969970703125, 0.0184326171875, 0.027477264404296875, 0.03652191162109375, 0.045566558837890625, 0.0546112060546875, 0.06365585327148438, 0.07270050048828125, 0.08174514770507812, 0.090789794921875, 0.09983444213867188, 0.10887908935546875, 0.11792373657226562, 0.1269683837890625, 0.13601303100585938, 0.14505767822265625, 0.15410232543945312, 0.16314697265625, 0.17219161987304688, 0.18123626708984375, 0.19028091430664062, 0.1993255615234375, 0.20837020874023438, 0.21741485595703125, 0.22645950317382812, 0.235504150390625, 0.24454879760742188, 0.25359344482421875, 0.2626380920410156, 0.2716827392578125, 0.2807273864746094, 0.28977203369140625, 0.2988166809082031, 0.307861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 1.0, 7.0, 18.0, 21.0, 19.0, 37.0, 49.0, 45.0, 57.0, 85.0, 109.0, 130.0, 145.0, 232.0, 279.0, 343.0, 417.0, 427.0, 344.0, 282.0, 219.0, 172.0, 118.0, 119.0, 93.0, 65.0, 55.0, 41.0, 28.0, 23.0, 14.0, 15.0, 11.0, 10.0, 9.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1552734375, -0.15009307861328125, -0.1449127197265625, -0.13973236083984375, -0.134552001953125, -0.12937164306640625, -0.1241912841796875, -0.11901092529296875, -0.11383056640625, -0.10865020751953125, -0.1034698486328125, -0.09828948974609375, -0.093109130859375, -0.08792877197265625, -0.0827484130859375, -0.07756805419921875, -0.0723876953125, -0.06720733642578125, -0.0620269775390625, -0.05684661865234375, -0.051666259765625, -0.04648590087890625, -0.0413055419921875, -0.03612518310546875, -0.03094482421875, -0.02576446533203125, -0.0205841064453125, -0.01540374755859375, -0.010223388671875, -0.00504302978515625, 0.0001373291015625, 0.00531768798828125, 0.010498046875, 0.01567840576171875, 0.0208587646484375, 0.02603912353515625, 0.031219482421875, 0.03639984130859375, 0.0415802001953125, 0.04676055908203125, 0.05194091796875, 0.05712127685546875, 0.0623016357421875, 0.06748199462890625, 0.072662353515625, 0.07784271240234375, 0.0830230712890625, 0.08820343017578125, 0.0933837890625, 0.09856414794921875, 0.1037445068359375, 0.10892486572265625, 0.114105224609375, 0.11928558349609375, 0.1244659423828125, 0.12964630126953125, 0.13482666015625, 0.14000701904296875, 0.1451873779296875, 0.15036773681640625, 0.155548095703125, 0.16072845458984375, 0.1659088134765625, 0.17108917236328125, 0.17626953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 11.0, 14.0, 27.0, 42.0, 35.0, 67.0, 94.0, 94.0, 107.0, 111.0, 89.0, 91.0, 69.0, 56.0, 29.0, 23.0, 13.0, 17.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5622539520263672, -1.5258125066757202, -1.4893710613250732, -1.4529296159744263, -1.4164881706237793, -1.3800467252731323, -1.3436052799224854, -1.307163953781128, -1.2707223892211914, -1.2342809438705444, -1.1978394985198975, -1.1613980531692505, -1.1249566078186035, -1.0885151624679565, -1.0520737171173096, -1.0156323909759521, -0.9791909456253052, -0.9427495002746582, -0.9063080549240112, -0.8698666095733643, -0.8334251642227173, -0.7969837188720703, -0.7605423331260681, -0.7241008877754211, -0.6876594424247742, -0.6512179970741272, -0.6147765517234802, -0.5783351063728333, -0.541893720626831, -0.5054522752761841, -0.4690108299255371, -0.43256938457489014, -0.3961278796195984, -0.3596864342689514, -0.32324498891830444, -0.28680357336997986, -0.2503621280193329, -0.2139206826686859, -0.17747925221920013, -0.14103782176971436, -0.10459637641906738, -0.06815493851900101, -0.03171350061893463, 0.004727937281131744, 0.04116937518119812, 0.07761082053184509, 0.11405225098133087, 0.15049368143081665, 0.18693512678146362, 0.2233765721321106, 0.25981801748275757, 0.29625943303108215, 0.3327008783817291, 0.3691423237323761, 0.4055837392807007, 0.44202518463134766, 0.47846662998199463, 0.5149080753326416, 0.5513495206832886, 0.5877909660339355, 0.6242324113845825, 0.6606738567352295, 0.6971152424812317, 0.7335566878318787, 0.7699981331825256]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 9.0, 9.0, 3.0, 7.0, 10.0, 10.0, 13.0, 15.0, 10.0, 19.0, 20.0, 16.0, 35.0, 23.0, 29.0, 25.0, 22.0, 34.0, 36.0, 28.0, 44.0, 41.0, 46.0, 35.0, 41.0, 36.0, 25.0, 46.0, 30.0, 32.0, 30.0, 33.0, 31.0, 26.0, 17.0, 17.0, 16.0, 18.0, 16.0, 8.0, 16.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.5353688597679138, -0.5183150768280029, -0.5012613534927368, -0.4842075705528259, -0.46715378761291504, -0.45010003447532654, -0.43304628133773804, -0.41599249839782715, -0.39893874526023865, -0.38188499212265015, -0.36483120918273926, -0.34777745604515076, -0.33072370290756226, -0.31366991996765137, -0.29661616683006287, -0.27956241369247437, -0.2625086307525635, -0.24545486271381378, -0.2284010946750641, -0.21134734153747559, -0.1942935734987259, -0.1772398054599762, -0.1601860523223877, -0.143132284283638, -0.1260785162448883, -0.10902474820613861, -0.09197098761796951, -0.07491722702980042, -0.05786345899105072, -0.040809690952301025, -0.023755930364131927, -0.00670216977596283, 0.010351598262786865, 0.02740536257624626, 0.04445912688970566, 0.061512891203165054, 0.07856665551662445, 0.09562042355537415, 0.11267418414354324, 0.12972794473171234, 0.14678171277046204, 0.16383548080921173, 0.18088924884796143, 0.19794300198554993, 0.21499677002429962, 0.23205053806304932, 0.24910429120063782, 0.2661580443382263, 0.2832118272781372, 0.3002655804157257, 0.3173193633556366, 0.3343731164932251, 0.351426899433136, 0.3684806525707245, 0.385534405708313, 0.4025881886482239, 0.4196419417858124, 0.4366956949234009, 0.45374947786331177, 0.47080323100090027, 0.48785698413848877, 0.5049107670783997, 0.5219645500183105, 0.5390182733535767, 0.5560720562934875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 5.0, 11.0, 16.0, 17.0, 33.0, 42.0, 74.0, 112.0, 178.0, 377.0, 677.0, 1266.0, 2352.0, 4756.0, 9494.0, 19492.0, 40917.0, 84172.0, 157854.0, 230392.0, 217913.0, 138613.0, 72362.0, 34570.0, 16501.0, 7977.0, 3951.0, 1964.0, 1104.0, 564.0, 316.0, 192.0, 93.0, 71.0, 48.0, 23.0, 25.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3212890625, -0.3108863830566406, -0.30048370361328125, -0.2900810241699219, -0.2796783447265625, -0.2692756652832031, -0.25887298583984375, -0.24847030639648438, -0.238067626953125, -0.22766494750976562, -0.21726226806640625, -0.20685958862304688, -0.1964569091796875, -0.18605422973632812, -0.17565155029296875, -0.16524887084960938, -0.15484619140625, -0.14444351196289062, -0.13404083251953125, -0.12363815307617188, -0.1132354736328125, -0.10283279418945312, -0.09243011474609375, -0.08202743530273438, -0.071624755859375, -0.061222076416015625, -0.05081939697265625, -0.040416717529296875, -0.0300140380859375, -0.019611358642578125, -0.00920867919921875, 0.001194000244140625, 0.0115966796875, 0.021999359130859375, 0.03240203857421875, 0.042804718017578125, 0.0532073974609375, 0.06361007690429688, 0.07401275634765625, 0.08441543579101562, 0.094818115234375, 0.10522079467773438, 0.11562347412109375, 0.12602615356445312, 0.1364288330078125, 0.14683151245117188, 0.15723419189453125, 0.16763687133789062, 0.17803955078125, 0.18844223022460938, 0.19884490966796875, 0.20924758911132812, 0.2196502685546875, 0.23005294799804688, 0.24045562744140625, 0.2508583068847656, 0.261260986328125, 0.2716636657714844, 0.28206634521484375, 0.2924690246582031, 0.3028717041015625, 0.3132743835449219, 0.32367706298828125, 0.3340797424316406, 0.344482421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 17.0, 6.0, 16.0, 20.0, 30.0, 29.0, 22.0, 33.0, 29.0, 40.0, 48.0, 35.0, 50.0, 51.0, 48.0, 54.0, 41.0, 48.0, 38.0, 53.0, 51.0, 27.0, 30.0, 32.0, 26.0, 16.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.1078042984008789, -0.10434150695800781, -0.10087871551513672, -0.09741592407226562, -0.09395313262939453, -0.09049034118652344, -0.08702754974365234, -0.08356475830078125, -0.08010196685791016, -0.07663917541503906, -0.07317638397216797, -0.06971359252929688, -0.06625080108642578, -0.06278800964355469, -0.059325218200683594, -0.0558624267578125, -0.052399635314941406, -0.04893684387207031, -0.04547405242919922, -0.042011260986328125, -0.03854846954345703, -0.03508567810058594, -0.031622886657714844, -0.02816009521484375, -0.024697303771972656, -0.021234512329101562, -0.01777172088623047, -0.014308929443359375, -0.010846138000488281, -0.0073833465576171875, -0.003920555114746094, -0.000457763671875, 0.0030050277709960938, 0.0064678192138671875, 0.009930610656738281, 0.013393402099609375, 0.01685619354248047, 0.020318984985351562, 0.023781776428222656, 0.02724456787109375, 0.030707359313964844, 0.03417015075683594, 0.03763294219970703, 0.041095733642578125, 0.04455852508544922, 0.04802131652832031, 0.051484107971191406, 0.0549468994140625, 0.058409690856933594, 0.06187248229980469, 0.06533527374267578, 0.06879806518554688, 0.07226085662841797, 0.07572364807128906, 0.07918643951416016, 0.08264923095703125, 0.08611202239990234, 0.08957481384277344, 0.09303760528564453, 0.09650039672851562, 0.09996318817138672, 0.10342597961425781, 0.1068887710571289, 0.1103515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 10.0, 12.0, 17.0, 10.0, 27.0, 47.0, 59.0, 80.0, 126.0, 153.0, 226.0, 388.0, 642.0, 1130.0, 1988.0, 3761.0, 7152.0, 14022.0, 27596.0, 52949.0, 93032.0, 144365.0, 185561.0, 183647.0, 140104.0, 87959.0, 49505.0, 25959.0, 12968.0, 6828.0, 3458.0, 1885.0, 1099.0, 637.0, 366.0, 231.0, 166.0, 129.0, 81.0, 47.0, 52.0, 24.0, 11.0, 14.0, 10.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2362060546875, -0.2285747528076172, -0.22094345092773438, -0.21331214904785156, -0.20568084716796875, -0.19804954528808594, -0.19041824340820312, -0.1827869415283203, -0.1751556396484375, -0.1675243377685547, -0.15989303588867188, -0.15226173400878906, -0.14463043212890625, -0.13699913024902344, -0.12936782836914062, -0.12173652648925781, -0.114105224609375, -0.10647392272949219, -0.09884262084960938, -0.09121131896972656, -0.08358001708984375, -0.07594871520996094, -0.06831741333007812, -0.06068611145019531, -0.0530548095703125, -0.04542350769042969, -0.037792205810546875, -0.030160903930664062, -0.02252960205078125, -0.014898300170898438, -0.007266998291015625, 0.0003643035888671875, 0.00799560546875, 0.015626907348632812, 0.023258209228515625, 0.030889511108398438, 0.03852081298828125, 0.04615211486816406, 0.053783416748046875, 0.06141471862792969, 0.0690460205078125, 0.07667732238769531, 0.08430862426757812, 0.09193992614746094, 0.09957122802734375, 0.10720252990722656, 0.11483383178710938, 0.12246513366699219, 0.130096435546875, 0.1377277374267578, 0.14535903930664062, 0.15299034118652344, 0.16062164306640625, 0.16825294494628906, 0.17588424682617188, 0.1835155487060547, 0.1911468505859375, 0.1987781524658203, 0.20640945434570312, 0.21404075622558594, 0.22167205810546875, 0.22930335998535156, 0.23693466186523438, 0.2445659637451172, 0.252197265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 7.0, 4.0, 6.0, 5.0, 4.0, 8.0, 9.0, 12.0, 14.0, 14.0, 29.0, 18.0, 31.0, 33.0, 35.0, 36.0, 32.0, 33.0, 39.0, 40.0, 25.0, 40.0, 55.0, 44.0, 42.0, 52.0, 45.0, 35.0, 30.0, 30.0, 32.0, 23.0, 29.0, 24.0, 15.0, 14.0, 15.0, 4.0, 10.0, 10.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2958984375, -0.28714752197265625, -0.2783966064453125, -0.26964569091796875, -0.260894775390625, -0.25214385986328125, -0.2433929443359375, -0.23464202880859375, -0.22589111328125, -0.21714019775390625, -0.2083892822265625, -0.19963836669921875, -0.190887451171875, -0.18213653564453125, -0.1733856201171875, -0.16463470458984375, -0.1558837890625, -0.14713287353515625, -0.1383819580078125, -0.12963104248046875, -0.120880126953125, -0.11212921142578125, -0.1033782958984375, -0.09462738037109375, -0.08587646484375, -0.07712554931640625, -0.0683746337890625, -0.05962371826171875, -0.050872802734375, -0.04212188720703125, -0.0333709716796875, -0.02462005615234375, -0.015869140625, -0.00711822509765625, 0.0016326904296875, 0.01038360595703125, 0.019134521484375, 0.02788543701171875, 0.0366363525390625, 0.04538726806640625, 0.05413818359375, 0.06288909912109375, 0.0716400146484375, 0.08039093017578125, 0.089141845703125, 0.09789276123046875, 0.1066436767578125, 0.11539459228515625, 0.1241455078125, 0.13289642333984375, 0.1416473388671875, 0.15039825439453125, 0.159149169921875, 0.16790008544921875, 0.1766510009765625, 0.18540191650390625, 0.19415283203125, 0.20290374755859375, 0.2116546630859375, 0.22040557861328125, 0.229156494140625, 0.23790740966796875, 0.2466583251953125, 0.25540924072265625, 0.26416015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 15.0, 12.0, 29.0, 38.0, 57.0, 109.0, 161.0, 305.0, 510.0, 869.0, 1671.0, 3116.0, 5958.0, 11731.0, 23691.0, 50187.0, 105027.0, 192436.0, 248800.0, 195280.0, 107635.0, 51300.0, 24393.0, 11939.0, 6090.0, 3222.0, 1717.0, 925.0, 522.0, 298.0, 206.0, 114.0, 71.0, 45.0, 30.0, 12.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09979248046875, -0.09672355651855469, -0.09365463256835938, -0.09058570861816406, -0.08751678466796875, -0.08444786071777344, -0.08137893676757812, -0.07831001281738281, -0.0752410888671875, -0.07217216491699219, -0.06910324096679688, -0.06603431701660156, -0.06296539306640625, -0.05989646911621094, -0.056827545166015625, -0.05375862121582031, -0.050689697265625, -0.04762077331542969, -0.044551849365234375, -0.04148292541503906, -0.03841400146484375, -0.03534507751464844, -0.032276153564453125, -0.029207229614257812, -0.0261383056640625, -0.023069381713867188, -0.020000457763671875, -0.016931533813476562, -0.01386260986328125, -0.010793685913085938, -0.007724761962890625, -0.0046558380126953125, -0.0015869140625, 0.0014820098876953125, 0.004550933837890625, 0.0076198577880859375, 0.01068878173828125, 0.013757705688476562, 0.016826629638671875, 0.019895553588867188, 0.0229644775390625, 0.026033401489257812, 0.029102325439453125, 0.03217124938964844, 0.03524017333984375, 0.03830909729003906, 0.041378021240234375, 0.04444694519042969, 0.047515869140625, 0.05058479309082031, 0.053653717041015625, 0.05672264099121094, 0.05979156494140625, 0.06286048889160156, 0.06592941284179688, 0.06899833679199219, 0.0720672607421875, 0.07513618469238281, 0.07820510864257812, 0.08127403259277344, 0.08434295654296875, 0.08741188049316406, 0.09048080444335938, 0.09354972839355469, 0.09661865234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 11.0, 2.0, 9.0, 12.0, 16.0, 16.0, 20.0, 37.0, 37.0, 49.0, 50.0, 66.0, 69.0, 87.0, 87.0, 70.0, 64.0, 63.0, 49.0, 32.0, 34.0, 32.0, 26.0, 13.0, 10.0, 7.0, 11.0, 3.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.17692756652832e-05, -3.0782073736190796e-05, -2.979487180709839e-05, -2.880766987800598e-05, -2.7820467948913574e-05, -2.6833266019821167e-05, -2.584606409072876e-05, -2.4858862161636353e-05, -2.3871660232543945e-05, -2.2884458303451538e-05, -2.189725637435913e-05, -2.0910054445266724e-05, -1.9922852516174316e-05, -1.893565058708191e-05, -1.7948448657989502e-05, -1.6961246728897095e-05, -1.5974044799804688e-05, -1.498684287071228e-05, -1.3999640941619873e-05, -1.3012439012527466e-05, -1.2025237083435059e-05, -1.1038035154342651e-05, -1.0050833225250244e-05, -9.063631296157837e-06, -8.07642936706543e-06, -7.0892274379730225e-06, -6.102025508880615e-06, -5.114823579788208e-06, -4.127621650695801e-06, -3.1404197216033936e-06, -2.1532177925109863e-06, -1.166015863418579e-06, -1.7881393432617188e-07, 8.083879947662354e-07, 1.7955899238586426e-06, 2.78279185295105e-06, 3.769993782043457e-06, 4.757195711135864e-06, 5.7443976402282715e-06, 6.731599569320679e-06, 7.718801498413086e-06, 8.706003427505493e-06, 9.6932053565979e-06, 1.0680407285690308e-05, 1.1667609214782715e-05, 1.2654811143875122e-05, 1.364201307296753e-05, 1.4629215002059937e-05, 1.5616416931152344e-05, 1.660361886024475e-05, 1.7590820789337158e-05, 1.8578022718429565e-05, 1.9565224647521973e-05, 2.055242657661438e-05, 2.1539628505706787e-05, 2.2526830434799194e-05, 2.35140323638916e-05, 2.450123429298401e-05, 2.5488436222076416e-05, 2.6475638151168823e-05, 2.746284008026123e-05, 2.8450042009353638e-05, 2.9437243938446045e-05, 3.0424445867538452e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 12.0, 15.0, 14.0, 24.0, 32.0, 66.0, 97.0, 158.0, 237.0, 382.0, 732.0, 1250.0, 2413.0, 4740.0, 10606.0, 28131.0, 83558.0, 228165.0, 350553.0, 214649.0, 77145.0, 25787.0, 10041.0, 4559.0, 2194.0, 1277.0, 676.0, 370.0, 253.0, 130.0, 87.0, 57.0, 42.0, 32.0, 23.0, 13.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11920166015625, -0.11528873443603516, -0.11137580871582031, -0.10746288299560547, -0.10354995727539062, -0.09963703155517578, -0.09572410583496094, -0.0918111801147461, -0.08789825439453125, -0.0839853286743164, -0.08007240295410156, -0.07615947723388672, -0.07224655151367188, -0.06833362579345703, -0.06442070007324219, -0.060507774353027344, -0.0565948486328125, -0.052681922912597656, -0.04876899719238281, -0.04485607147216797, -0.040943145751953125, -0.03703022003173828, -0.03311729431152344, -0.029204368591308594, -0.02529144287109375, -0.021378517150878906, -0.017465591430664062, -0.013552665710449219, -0.009639739990234375, -0.005726814270019531, -0.0018138885498046875, 0.0020990371704101562, 0.006011962890625, 0.009924888610839844, 0.013837814331054688, 0.01775074005126953, 0.021663665771484375, 0.02557659149169922, 0.029489517211914062, 0.033402442932128906, 0.03731536865234375, 0.041228294372558594, 0.04514122009277344, 0.04905414581298828, 0.052967071533203125, 0.05687999725341797, 0.06079292297363281, 0.06470584869384766, 0.0686187744140625, 0.07253170013427734, 0.07644462585449219, 0.08035755157470703, 0.08427047729492188, 0.08818340301513672, 0.09209632873535156, 0.0960092544555664, 0.09992218017578125, 0.1038351058959961, 0.10774803161621094, 0.11166095733642578, 0.11557388305664062, 0.11948680877685547, 0.12339973449707031, 0.12731266021728516, 0.1312255859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 9.0, 13.0, 11.0, 22.0, 22.0, 31.0, 32.0, 42.0, 56.0, 70.0, 85.0, 69.0, 84.0, 80.0, 61.0, 59.0, 53.0, 36.0, 32.0, 31.0, 17.0, 18.0, 14.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09039306640625, -0.08748340606689453, -0.08457374572753906, -0.0816640853881836, -0.07875442504882812, -0.07584476470947266, -0.07293510437011719, -0.07002544403076172, -0.06711578369140625, -0.06420612335205078, -0.06129646301269531, -0.058386802673339844, -0.055477142333984375, -0.052567481994628906, -0.04965782165527344, -0.04674816131591797, -0.0438385009765625, -0.04092884063720703, -0.03801918029785156, -0.035109519958496094, -0.032199859619140625, -0.029290199279785156, -0.026380538940429688, -0.02347087860107422, -0.02056121826171875, -0.01765155792236328, -0.014741897583007812, -0.011832237243652344, -0.008922576904296875, -0.006012916564941406, -0.0031032562255859375, -0.00019359588623046875, 0.002716064453125, 0.005625724792480469, 0.008535385131835938, 0.011445045471191406, 0.014354705810546875, 0.017264366149902344, 0.020174026489257812, 0.02308368682861328, 0.02599334716796875, 0.02890300750732422, 0.03181266784667969, 0.034722328186035156, 0.037631988525390625, 0.040541648864746094, 0.04345130920410156, 0.04636096954345703, 0.0492706298828125, 0.05218029022216797, 0.05508995056152344, 0.057999610900878906, 0.060909271240234375, 0.06381893157958984, 0.06672859191894531, 0.06963825225830078, 0.07254791259765625, 0.07545757293701172, 0.07836723327636719, 0.08127689361572266, 0.08418655395507812, 0.0870962142944336, 0.09000587463378906, 0.09291553497314453, 0.0958251953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 18.0, 19.0, 31.0, 46.0, 59.0, 85.0, 113.0, 116.0, 116.0, 101.0, 95.0, 59.0, 56.0, 28.0, 19.0, 8.0, 8.0, 9.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1217647790908813, -1.0725327730178833, -1.0233006477355957, -0.9740686416625977, -0.9248365759849548, -0.875604510307312, -0.826372504234314, -0.7771404385566711, -0.7279083728790283, -0.6786763072013855, -0.6294442415237427, -0.5802122354507446, -0.5309801697731018, -0.481748104095459, -0.43251606822013855, -0.3832840323448181, -0.3340519666671753, -0.28481990098953247, -0.23558786511421204, -0.1863558143377304, -0.13712376356124878, -0.08789171278476715, -0.03865966200828552, 0.010572373867034912, 0.059804439544677734, 0.10903649032115936, 0.158268541097641, 0.20750059187412262, 0.25673264265060425, 0.30596470832824707, 0.3551967442035675, 0.40442878007888794, 0.4536607265472412, 0.502892792224884, 0.5521248579025269, 0.6013568639755249, 0.6505889296531677, 0.6998209953308105, 0.7490530014038086, 0.7982850670814514, 0.8475171327590942, 0.8967491984367371, 0.9459812641143799, 0.9952132701873779, 1.044445276260376, 1.0936774015426636, 1.1429094076156616, 1.1921415328979492, 1.2413735389709473, 1.2906055450439453, 1.339837670326233, 1.389069676399231, 1.4383018016815186, 1.4875338077545166, 1.5367658138275146, 1.5859978199005127, 1.6352299451828003, 1.6844619512557983, 1.733694076538086, 1.782926082611084, 1.832158088684082, 1.8813902139663696, 1.9306222200393677, 1.9798543453216553, 2.0290863513946533]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 8.0, 6.0, 15.0, 23.0, 12.0, 23.0, 23.0, 37.0, 27.0, 27.0, 40.0, 38.0, 47.0, 47.0, 46.0, 55.0, 51.0, 46.0, 41.0, 38.0, 47.0, 43.0, 36.0, 26.0, 29.0, 23.0, 32.0, 24.0, 18.0, 16.0, 13.0, 13.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1989262104034424, -1.166624903678894, -1.1343235969543457, -1.102022409439087, -1.0697211027145386, -1.0374197959899902, -1.0051186084747314, -0.9728173017501831, -0.9405159950256348, -0.9082146883010864, -0.8759134411811829, -0.8436121940612793, -0.811310887336731, -0.7790095806121826, -0.746708333492279, -0.7144070863723755, -0.6821057796478271, -0.6498044729232788, -0.6175032258033752, -0.5852019786834717, -0.5529006719589233, -0.520599365234375, -0.48829811811447144, -0.4559968411922455, -0.42369556427001953, -0.3913942873477936, -0.3590930104255676, -0.3267917335033417, -0.2944904565811157, -0.26218917965888977, -0.22988790273666382, -0.19758662581443787, -0.16528522968292236, -0.1329839527606964, -0.10068267583847046, -0.0683813989162445, -0.036080121994018555, -0.0037788450717926025, 0.02852243185043335, 0.0608237087726593, 0.09312498569488525, 0.1254262626171112, 0.15772753953933716, 0.1900288164615631, 0.22233009338378906, 0.254631370306015, 0.28693264722824097, 0.3192339241504669, 0.35153520107269287, 0.3838364779949188, 0.4161377549171448, 0.4484390318393707, 0.4807403087615967, 0.513041615486145, 0.5453428626060486, 0.5776441097259521, 0.6099454164505005, 0.6422467231750488, 0.6745479702949524, 0.706849217414856, 0.7391505241394043, 0.7714518308639526, 0.8037530779838562, 0.8360543251037598, 0.8683556318283081]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 9.0, 16.0, 22.0, 23.0, 46.0, 57.0, 94.0, 133.0, 198.0, 295.0, 439.0, 756.0, 1152.0, 1984.0, 3547.0, 6527.0, 13102.0, 27169.0, 62468.0, 170870.0, 574417.0, 1488432.0, 1223699.0, 395118.0, 127072.0, 49615.0, 22674.0, 11126.0, 5780.0, 3086.0, 1754.0, 976.0, 609.0, 356.0, 242.0, 153.0, 98.0, 53.0, 36.0, 24.0, 15.0, 9.0, 3.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.1669921875, -0.16205978393554688, -0.15712738037109375, -0.15219497680664062, -0.1472625732421875, -0.14233016967773438, -0.13739776611328125, -0.13246536254882812, -0.127532958984375, -0.12260055541992188, -0.11766815185546875, -0.11273574829101562, -0.1078033447265625, -0.10287094116210938, -0.09793853759765625, -0.09300613403320312, -0.08807373046875, -0.08314132690429688, -0.07820892333984375, -0.07327651977539062, -0.0683441162109375, -0.06341171264648438, -0.05847930908203125, -0.053546905517578125, -0.048614501953125, -0.043682098388671875, -0.03874969482421875, -0.033817291259765625, -0.0288848876953125, -0.023952484130859375, -0.01902008056640625, -0.014087677001953125, -0.0091552734375, -0.004222869873046875, 0.00070953369140625, 0.005641937255859375, 0.0105743408203125, 0.015506744384765625, 0.02043914794921875, 0.025371551513671875, 0.030303955078125, 0.035236358642578125, 0.04016876220703125, 0.045101165771484375, 0.0500335693359375, 0.054965972900390625, 0.05989837646484375, 0.06483078002929688, 0.06976318359375, 0.07469558715820312, 0.07962799072265625, 0.08456039428710938, 0.0894927978515625, 0.09442520141601562, 0.09935760498046875, 0.10429000854492188, 0.109222412109375, 0.11415481567382812, 0.11908721923828125, 0.12401962280273438, 0.1289520263671875, 0.13388442993164062, 0.13881683349609375, 0.14374923706054688, 0.148681640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 9.0, 10.0, 14.0, 13.0, 13.0, 18.0, 25.0, 26.0, 27.0, 42.0, 37.0, 32.0, 40.0, 41.0, 44.0, 37.0, 51.0, 39.0, 44.0, 40.0, 42.0, 38.0, 32.0, 39.0, 36.0, 32.0, 17.0, 27.0, 16.0, 15.0, 23.0, 12.0, 14.0, 9.0, 12.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1258544921875, -0.12205219268798828, -0.11824989318847656, -0.11444759368896484, -0.11064529418945312, -0.1068429946899414, -0.10304069519042969, -0.09923839569091797, -0.09543609619140625, -0.09163379669189453, -0.08783149719238281, -0.0840291976928711, -0.08022689819335938, -0.07642459869384766, -0.07262229919433594, -0.06881999969482422, -0.0650177001953125, -0.06121540069580078, -0.05741310119628906, -0.053610801696777344, -0.049808502197265625, -0.046006202697753906, -0.04220390319824219, -0.03840160369873047, -0.03459930419921875, -0.03079700469970703, -0.026994705200195312, -0.023192405700683594, -0.019390106201171875, -0.015587806701660156, -0.011785507202148438, -0.007983207702636719, -0.004180908203125, -0.00037860870361328125, 0.0034236907958984375, 0.007225990295410156, 0.011028289794921875, 0.014830589294433594, 0.018632888793945312, 0.02243518829345703, 0.02623748779296875, 0.03003978729248047, 0.03384208679199219, 0.037644386291503906, 0.041446685791015625, 0.045248985290527344, 0.04905128479003906, 0.05285358428955078, 0.0566558837890625, 0.06045818328857422, 0.06426048278808594, 0.06806278228759766, 0.07186508178710938, 0.0756673812866211, 0.07946968078613281, 0.08327198028564453, 0.08707427978515625, 0.09087657928466797, 0.09467887878417969, 0.0984811782836914, 0.10228347778320312, 0.10608577728271484, 0.10988807678222656, 0.11369037628173828, 0.11749267578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 16.0, 11.0, 29.0, 36.0, 53.0, 87.0, 139.0, 248.0, 488.0, 900.0, 1858.0, 3793.0, 8889.0, 21211.0, 56031.0, 159324.0, 483393.0, 1481617.0, 1333008.0, 420411.0, 139335.0, 49470.0, 18872.0, 7896.0, 3555.0, 1738.0, 809.0, 455.0, 241.0, 142.0, 83.0, 49.0, 32.0, 17.0, 16.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.22216796875, -0.2159862518310547, -0.20980453491210938, -0.20362281799316406, -0.19744110107421875, -0.19125938415527344, -0.18507766723632812, -0.1788959503173828, -0.1727142333984375, -0.1665325164794922, -0.16035079956054688, -0.15416908264160156, -0.14798736572265625, -0.14180564880371094, -0.13562393188476562, -0.1294422149658203, -0.123260498046875, -0.11707878112792969, -0.11089706420898438, -0.10471534729003906, -0.09853363037109375, -0.09235191345214844, -0.08617019653320312, -0.07998847961425781, -0.0738067626953125, -0.06762504577636719, -0.061443328857421875, -0.05526161193847656, -0.04907989501953125, -0.04289817810058594, -0.036716461181640625, -0.030534744262695312, -0.02435302734375, -0.018171310424804688, -0.011989593505859375, -0.0058078765869140625, 0.00037384033203125, 0.0065555572509765625, 0.012737274169921875, 0.018918991088867188, 0.0251007080078125, 0.03128242492675781, 0.037464141845703125, 0.04364585876464844, 0.04982757568359375, 0.05600929260253906, 0.062191009521484375, 0.06837272644042969, 0.074554443359375, 0.08073616027832031, 0.08691787719726562, 0.09309959411621094, 0.09928131103515625, 0.10546302795410156, 0.11164474487304688, 0.11782646179199219, 0.1240081787109375, 0.1301898956298828, 0.13637161254882812, 0.14255332946777344, 0.14873504638671875, 0.15491676330566406, 0.16109848022460938, 0.1672801971435547, 0.1734619140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 6.0, 11.0, 13.0, 9.0, 19.0, 31.0, 23.0, 45.0, 49.0, 61.0, 93.0, 112.0, 129.0, 162.0, 231.0, 276.0, 400.0, 399.0, 404.0, 350.0, 276.0, 198.0, 174.0, 124.0, 101.0, 90.0, 61.0, 51.0, 21.0, 30.0, 23.0, 15.0, 17.0, 14.0, 6.0, 9.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.199951171875, -0.19408416748046875, -0.1882171630859375, -0.18235015869140625, -0.176483154296875, -0.17061614990234375, -0.1647491455078125, -0.15888214111328125, -0.15301513671875, -0.14714813232421875, -0.1412811279296875, -0.13541412353515625, -0.129547119140625, -0.12368011474609375, -0.1178131103515625, -0.11194610595703125, -0.1060791015625, -0.10021209716796875, -0.0943450927734375, -0.08847808837890625, -0.082611083984375, -0.07674407958984375, -0.0708770751953125, -0.06501007080078125, -0.05914306640625, -0.05327606201171875, -0.0474090576171875, -0.04154205322265625, -0.035675048828125, -0.02980804443359375, -0.0239410400390625, -0.01807403564453125, -0.01220703125, -0.00634002685546875, -0.0004730224609375, 0.00539398193359375, 0.011260986328125, 0.01712799072265625, 0.0229949951171875, 0.02886199951171875, 0.03472900390625, 0.04059600830078125, 0.0464630126953125, 0.05233001708984375, 0.058197021484375, 0.06406402587890625, 0.0699310302734375, 0.07579803466796875, 0.0816650390625, 0.08753204345703125, 0.0933990478515625, 0.09926605224609375, 0.105133056640625, 0.11100006103515625, 0.1168670654296875, 0.12273406982421875, 0.12860107421875, 0.13446807861328125, 0.1403350830078125, 0.14620208740234375, 0.152069091796875, 0.15793609619140625, 0.1638031005859375, 0.16967010498046875, 0.175537109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 22.0, 26.0, 35.0, 49.0, 61.0, 76.0, 75.0, 115.0, 111.0, 95.0, 74.0, 63.0, 45.0, 45.0, 34.0, 14.0, 15.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4031206369400024, -1.3667858839035034, -1.330451250076294, -1.294116497039795, -1.2577818632125854, -1.2214471101760864, -1.185112476348877, -1.148777723312378, -1.112442970275879, -1.0761082172393799, -1.0397735834121704, -1.0034388303756714, -0.9671041965484619, -0.9307694435119629, -0.8944347500801086, -0.8581000566482544, -0.8217654228210449, -0.7854307293891907, -0.7490960359573364, -0.7127613425254822, -0.6764266490936279, -0.6400918960571289, -0.6037572026252747, -0.5674225091934204, -0.5310878157615662, -0.4947531223297119, -0.45841842889785767, -0.42208370566368103, -0.3857490122318268, -0.34941431879997253, -0.3130795955657959, -0.27674490213394165, -0.2404102087020874, -0.20407551527023315, -0.1677408069372177, -0.13140609860420227, -0.09507140517234802, -0.058736711740493774, -0.022402003407478333, 0.01393270492553711, 0.05026739835739136, 0.0866020992398262, 0.12293680012226105, 0.1592715084552765, 0.19560620188713074, 0.23194089531898499, 0.2682756185531616, 0.30461031198501587, 0.3409450054168701, 0.37727969884872437, 0.4136143922805786, 0.44994911551475525, 0.4862838089466095, 0.5226185321807861, 0.5589532256126404, 0.5952879190444946, 0.6316226124763489, 0.6679573059082031, 0.7042919993400574, 0.7406266927719116, 0.7769614458084106, 0.8132960796356201, 0.8496308326721191, 0.8859655261039734, 0.9223002195358276]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 3.0, 4.0, 7.0, 10.0, 10.0, 9.0, 10.0, 8.0, 14.0, 19.0, 17.0, 15.0, 30.0, 22.0, 38.0, 30.0, 27.0, 35.0, 26.0, 39.0, 35.0, 53.0, 45.0, 40.0, 40.0, 45.0, 24.0, 42.0, 37.0, 23.0, 30.0, 26.0, 17.0, 29.0, 21.0, 18.0, 16.0, 14.0, 12.0, 11.0, 7.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.6756497621536255, -0.6547505855560303, -0.6338513493537903, -0.6129521727561951, -0.5920529365539551, -0.5711537599563599, -0.5502545833587646, -0.5293553471565247, -0.5084561109542847, -0.48755690455436707, -0.46665769815444946, -0.44575852155685425, -0.42485928535461426, -0.40396010875701904, -0.38306090235710144, -0.36216169595718384, -0.3412625193595886, -0.320363312959671, -0.2994641065597534, -0.2785649299621582, -0.2576656937599182, -0.2367665022611618, -0.2158673107624054, -0.1949681043624878, -0.1740688979625702, -0.1531696915626526, -0.13227048516273499, -0.11137129366397858, -0.09047208726406097, -0.06957288086414337, -0.04867368936538696, -0.02777448296546936, -0.006875216960906982, 0.014023985713720322, 0.034923188388347626, 0.05582238733768463, 0.07672159373760223, 0.09762080013751984, 0.11851999163627625, 0.13941919803619385, 0.16031840443611145, 0.18121761083602905, 0.20211681723594666, 0.22301600873470306, 0.24391521513462067, 0.26481443643569946, 0.2857136130332947, 0.3066128194332123, 0.3275120258331299, 0.3484112322330475, 0.3693104386329651, 0.3902096152305603, 0.4111088514328003, 0.4320080280303955, 0.4529072344303131, 0.4738064408302307, 0.4947056472301483, 0.5156048536300659, 0.5365040302276611, 0.5574032664299011, 0.5783024430274963, 0.5992016792297363, 0.6201008558273315, 0.6410000324249268, 0.6618992686271667]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 17.0, 9.0, 20.0, 43.0, 46.0, 64.0, 112.0, 157.0, 233.0, 382.0, 605.0, 1075.0, 1659.0, 3090.0, 5297.0, 9340.0, 16183.0, 28120.0, 47789.0, 82249.0, 137493.0, 200356.0, 196614.0, 131657.0, 77457.0, 45329.0, 26534.0, 15529.0, 8808.0, 5208.0, 2855.0, 1661.0, 977.0, 569.0, 349.0, 220.0, 139.0, 75.0, 64.0, 39.0, 22.0, 23.0, 18.0, 21.0, 4.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.2235107421875, -0.21628952026367188, -0.20906829833984375, -0.20184707641601562, -0.1946258544921875, -0.18740463256835938, -0.18018341064453125, -0.17296218872070312, -0.165740966796875, -0.15851974487304688, -0.15129852294921875, -0.14407730102539062, -0.1368560791015625, -0.12963485717773438, -0.12241363525390625, -0.11519241333007812, -0.10797119140625, -0.10074996948242188, -0.09352874755859375, -0.08630752563476562, -0.0790863037109375, -0.07186508178710938, -0.06464385986328125, -0.057422637939453125, -0.050201416015625, -0.042980194091796875, -0.03575897216796875, -0.028537750244140625, -0.0213165283203125, -0.014095306396484375, -0.00687408447265625, 0.000347137451171875, 0.007568359375, 0.014789581298828125, 0.02201080322265625, 0.029232025146484375, 0.0364532470703125, 0.043674468994140625, 0.05089569091796875, 0.058116912841796875, 0.065338134765625, 0.07255935668945312, 0.07978057861328125, 0.08700180053710938, 0.0942230224609375, 0.10144424438476562, 0.10866546630859375, 0.11588668823242188, 0.12310791015625, 0.13032913208007812, 0.13755035400390625, 0.14477157592773438, 0.1519927978515625, 0.15921401977539062, 0.16643524169921875, 0.17365646362304688, 0.180877685546875, 0.18809890747070312, 0.19532012939453125, 0.20254135131835938, 0.2097625732421875, 0.21698379516601562, 0.22420501708984375, 0.23142623901367188, 0.2386474609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 5.0, 8.0, 22.0, 11.0, 13.0, 19.0, 30.0, 22.0, 27.0, 29.0, 35.0, 37.0, 37.0, 47.0, 38.0, 56.0, 46.0, 48.0, 38.0, 44.0, 43.0, 41.0, 32.0, 26.0, 29.0, 31.0, 26.0, 27.0, 15.0, 15.0, 19.0, 16.0, 9.0, 9.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.124267578125, -0.12069225311279297, -0.11711692810058594, -0.1135416030883789, -0.10996627807617188, -0.10639095306396484, -0.10281562805175781, -0.09924030303955078, -0.09566497802734375, -0.09208965301513672, -0.08851432800292969, -0.08493900299072266, -0.08136367797851562, -0.0777883529663086, -0.07421302795410156, -0.07063770294189453, -0.0670623779296875, -0.06348705291748047, -0.05991172790527344, -0.056336402893066406, -0.052761077880859375, -0.049185752868652344, -0.04561042785644531, -0.04203510284423828, -0.03845977783203125, -0.03488445281982422, -0.03130912780761719, -0.027733802795410156, -0.024158477783203125, -0.020583152770996094, -0.017007827758789062, -0.013432502746582031, -0.009857177734375, -0.006281852722167969, -0.0027065277099609375, 0.0008687973022460938, 0.004444122314453125, 0.008019447326660156, 0.011594772338867188, 0.015170097351074219, 0.01874542236328125, 0.02232074737548828, 0.025896072387695312, 0.029471397399902344, 0.033046722412109375, 0.036622047424316406, 0.04019737243652344, 0.04377269744873047, 0.0473480224609375, 0.05092334747314453, 0.05449867248535156, 0.058073997497558594, 0.061649322509765625, 0.06522464752197266, 0.06879997253417969, 0.07237529754638672, 0.07595062255859375, 0.07952594757080078, 0.08310127258300781, 0.08667659759521484, 0.09025192260742188, 0.0938272476196289, 0.09740257263183594, 0.10097789764404297, 0.10455322265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 9.0, 10.0, 19.0, 35.0, 50.0, 82.0, 105.0, 177.0, 310.0, 700.0, 1718.0, 5153.0, 16969.0, 56681.0, 168839.0, 356665.0, 282997.0, 107798.0, 34140.0, 10468.0, 3244.0, 1170.0, 504.0, 276.0, 159.0, 104.0, 57.0, 43.0, 26.0, 12.0, 12.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.38391876220703125, -0.3718414306640625, -0.35976409912109375, -0.347686767578125, -0.33560943603515625, -0.3235321044921875, -0.31145477294921875, -0.29937744140625, -0.28730010986328125, -0.2752227783203125, -0.26314544677734375, -0.251068115234375, -0.23899078369140625, -0.2269134521484375, -0.21483612060546875, -0.2027587890625, -0.19068145751953125, -0.1786041259765625, -0.16652679443359375, -0.154449462890625, -0.14237213134765625, -0.1302947998046875, -0.11821746826171875, -0.10614013671875, -0.09406280517578125, -0.0819854736328125, -0.06990814208984375, -0.057830810546875, -0.04575347900390625, -0.0336761474609375, -0.02159881591796875, -0.009521484375, 0.00255584716796875, 0.0146331787109375, 0.02671051025390625, 0.038787841796875, 0.05086517333984375, 0.0629425048828125, 0.07501983642578125, 0.08709716796875, 0.09917449951171875, 0.1112518310546875, 0.12332916259765625, 0.135406494140625, 0.14748382568359375, 0.1595611572265625, 0.17163848876953125, 0.1837158203125, 0.19579315185546875, 0.2078704833984375, 0.21994781494140625, 0.232025146484375, 0.24410247802734375, 0.2561798095703125, 0.26825714111328125, 0.28033447265625, 0.29241180419921875, 0.3044891357421875, 0.31656646728515625, 0.328643798828125, 0.34072113037109375, 0.3527984619140625, 0.36487579345703125, 0.376953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 9.0, 6.0, 11.0, 13.0, 18.0, 16.0, 16.0, 22.0, 19.0, 36.0, 32.0, 30.0, 37.0, 34.0, 45.0, 56.0, 37.0, 52.0, 38.0, 44.0, 53.0, 52.0, 37.0, 42.0, 41.0, 41.0, 23.0, 20.0, 17.0, 22.0, 17.0, 11.0, 12.0, 13.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27014923095703125, -0.2597808837890625, -0.24941253662109375, -0.239044189453125, -0.22867584228515625, -0.2183074951171875, -0.20793914794921875, -0.19757080078125, -0.18720245361328125, -0.1768341064453125, -0.16646575927734375, -0.156097412109375, -0.14572906494140625, -0.1353607177734375, -0.12499237060546875, -0.1146240234375, -0.10425567626953125, -0.0938873291015625, -0.08351898193359375, -0.073150634765625, -0.06278228759765625, -0.0524139404296875, -0.04204559326171875, -0.03167724609375, -0.02130889892578125, -0.0109405517578125, -0.00057220458984375, 0.009796142578125, 0.02016448974609375, 0.0305328369140625, 0.04090118408203125, 0.05126953125, 0.06163787841796875, 0.0720062255859375, 0.08237457275390625, 0.092742919921875, 0.10311126708984375, 0.1134796142578125, 0.12384796142578125, 0.13421630859375, 0.14458465576171875, 0.1549530029296875, 0.16532135009765625, 0.175689697265625, 0.18605804443359375, 0.1964263916015625, 0.20679473876953125, 0.2171630859375, 0.22753143310546875, 0.2378997802734375, 0.24826812744140625, 0.258636474609375, 0.26900482177734375, 0.2793731689453125, 0.28974151611328125, 0.30010986328125, 0.31047821044921875, 0.3208465576171875, 0.33121490478515625, 0.341583251953125, 0.35195159912109375, 0.3623199462890625, 0.37268829345703125, 0.383056640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 4.0, 4.0, 14.0, 27.0, 39.0, 68.0, 115.0, 216.0, 454.0, 815.0, 1660.0, 3428.0, 7411.0, 15822.0, 33211.0, 75328.0, 186174.0, 324384.0, 228208.0, 94229.0, 40803.0, 18978.0, 8971.0, 4160.0, 1896.0, 984.0, 523.0, 249.0, 144.0, 81.0, 59.0, 26.0, 22.0, 13.0, 10.0, 8.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1277914047241211, -0.12399101257324219, -0.12019062042236328, -0.11639022827148438, -0.11258983612060547, -0.10878944396972656, -0.10498905181884766, -0.10118865966796875, -0.09738826751708984, -0.09358787536621094, -0.08978748321533203, -0.08598709106445312, -0.08218669891357422, -0.07838630676269531, -0.0745859146118164, -0.0707855224609375, -0.0669851303100586, -0.06318473815917969, -0.05938434600830078, -0.055583953857421875, -0.05178356170654297, -0.04798316955566406, -0.044182777404785156, -0.04038238525390625, -0.036581993103027344, -0.03278160095214844, -0.02898120880126953, -0.025180816650390625, -0.02138042449951172, -0.017580032348632812, -0.013779640197753906, -0.009979248046875, -0.006178855895996094, -0.0023784637451171875, 0.0014219284057617188, 0.005222320556640625, 0.009022712707519531, 0.012823104858398438, 0.016623497009277344, 0.02042388916015625, 0.024224281311035156, 0.028024673461914062, 0.03182506561279297, 0.035625457763671875, 0.03942584991455078, 0.04322624206542969, 0.047026634216308594, 0.0508270263671875, 0.054627418518066406, 0.05842781066894531, 0.06222820281982422, 0.06602859497070312, 0.06982898712158203, 0.07362937927246094, 0.07742977142333984, 0.08123016357421875, 0.08503055572509766, 0.08883094787597656, 0.09263134002685547, 0.09643173217773438, 0.10023212432861328, 0.10403251647949219, 0.1078329086303711, 0.11163330078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 13.0, 12.0, 15.0, 15.0, 18.0, 17.0, 31.0, 42.0, 41.0, 60.0, 85.0, 108.0, 81.0, 92.0, 69.0, 53.0, 55.0, 28.0, 30.0, 31.0, 20.0, 22.0, 9.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9385089874267578e-05, -2.838950604200363e-05, -2.7393922209739685e-05, -2.639833837747574e-05, -2.5402754545211792e-05, -2.4407170712947845e-05, -2.34115868806839e-05, -2.2416003048419952e-05, -2.1420419216156006e-05, -2.042483538389206e-05, -1.9429251551628113e-05, -1.8433667719364166e-05, -1.743808388710022e-05, -1.6442500054836273e-05, -1.5446916222572327e-05, -1.445133239030838e-05, -1.3455748558044434e-05, -1.2460164725780487e-05, -1.146458089351654e-05, -1.0468997061252594e-05, -9.473413228988647e-06, -8.477829396724701e-06, -7.482245564460754e-06, -6.486661732196808e-06, -5.491077899932861e-06, -4.495494067668915e-06, -3.4999102354049683e-06, -2.5043264031410217e-06, -1.5087425708770752e-06, -5.131587386131287e-07, 4.824250936508179e-07, 1.4780089259147644e-06, 2.473592758178711e-06, 3.4691765904426575e-06, 4.464760422706604e-06, 5.4603442549705505e-06, 6.455928087234497e-06, 7.451511919498444e-06, 8.44709575176239e-06, 9.442679584026337e-06, 1.0438263416290283e-05, 1.143384724855423e-05, 1.2429431080818176e-05, 1.3425014913082123e-05, 1.442059874534607e-05, 1.5416182577610016e-05, 1.6411766409873962e-05, 1.740735024213791e-05, 1.8402934074401855e-05, 1.9398517906665802e-05, 2.039410173892975e-05, 2.1389685571193695e-05, 2.238526940345764e-05, 2.3380853235721588e-05, 2.4376437067985535e-05, 2.537202090024948e-05, 2.6367604732513428e-05, 2.7363188564777374e-05, 2.835877239704132e-05, 2.9354356229305267e-05, 3.0349940061569214e-05, 3.134552389383316e-05, 3.234110772609711e-05, 3.3336691558361053e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 13.0, 8.0, 8.0, 24.0, 22.0, 31.0, 38.0, 55.0, 74.0, 112.0, 166.0, 244.0, 431.0, 841.0, 1546.0, 3588.0, 7715.0, 17941.0, 39491.0, 97033.0, 271888.0, 353975.0, 151329.0, 56211.0, 24692.0, 11246.0, 4940.0, 2241.0, 1103.0, 625.0, 332.0, 214.0, 118.0, 69.0, 48.0, 45.0, 26.0, 13.0, 10.0, 12.0, 14.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.12164306640625, -0.11786651611328125, -0.1140899658203125, -0.11031341552734375, -0.106536865234375, -0.10276031494140625, -0.0989837646484375, -0.09520721435546875, -0.0914306640625, -0.08765411376953125, -0.0838775634765625, -0.08010101318359375, -0.076324462890625, -0.07254791259765625, -0.0687713623046875, -0.06499481201171875, -0.06121826171875, -0.05744171142578125, -0.0536651611328125, -0.04988861083984375, -0.046112060546875, -0.04233551025390625, -0.0385589599609375, -0.03478240966796875, -0.031005859375, -0.02722930908203125, -0.0234527587890625, -0.01967620849609375, -0.015899658203125, -0.01212310791015625, -0.0083465576171875, -0.00457000732421875, -0.00079345703125, 0.00298309326171875, 0.0067596435546875, 0.01053619384765625, 0.014312744140625, 0.01808929443359375, 0.0218658447265625, 0.02564239501953125, 0.0294189453125, 0.03319549560546875, 0.0369720458984375, 0.04074859619140625, 0.044525146484375, 0.04830169677734375, 0.0520782470703125, 0.05585479736328125, 0.05963134765625, 0.06340789794921875, 0.0671844482421875, 0.07096099853515625, 0.074737548828125, 0.07851409912109375, 0.0822906494140625, 0.08606719970703125, 0.08984375, 0.09362030029296875, 0.0973968505859375, 0.10117340087890625, 0.104949951171875, 0.10872650146484375, 0.1125030517578125, 0.11627960205078125, 0.12005615234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 12.0, 9.0, 13.0, 22.0, 38.0, 59.0, 53.0, 86.0, 115.0, 103.0, 105.0, 80.0, 77.0, 66.0, 43.0, 27.0, 28.0, 11.0, 13.0, 3.0, 13.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.130950927734375, -0.12640380859375, -0.121856689453125, -0.1173095703125, -0.112762451171875, -0.10821533203125, -0.103668212890625, -0.09912109375, -0.094573974609375, -0.09002685546875, -0.085479736328125, -0.0809326171875, -0.076385498046875, -0.07183837890625, -0.067291259765625, -0.062744140625, -0.058197021484375, -0.05364990234375, -0.049102783203125, -0.0445556640625, -0.040008544921875, -0.03546142578125, -0.030914306640625, -0.0263671875, -0.021820068359375, -0.01727294921875, -0.012725830078125, -0.0081787109375, -0.003631591796875, 0.00091552734375, 0.005462646484375, 0.010009765625, 0.014556884765625, 0.01910400390625, 0.023651123046875, 0.0281982421875, 0.032745361328125, 0.03729248046875, 0.041839599609375, 0.04638671875, 0.050933837890625, 0.05548095703125, 0.060028076171875, 0.0645751953125, 0.069122314453125, 0.07366943359375, 0.078216552734375, 0.082763671875, 0.087310791015625, 0.09185791015625, 0.096405029296875, 0.1009521484375, 0.105499267578125, 0.11004638671875, 0.114593505859375, 0.119140625, 0.123687744140625, 0.12823486328125, 0.132781982421875, 0.1373291015625, 0.141876220703125, 0.14642333984375, 0.150970458984375, 0.155517578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 40.0, 85.0, 150.0, 216.0, 202.0, 154.0, 78.0, 40.0, 16.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9534810781478882, -1.8747016191482544, -1.7959221601486206, -1.7171427011489868, -1.6383633613586426, -1.5595839023590088, -1.480804443359375, -1.4020249843597412, -1.3232455253601074, -1.2444660663604736, -1.1656866073608398, -1.086907148361206, -1.0081276893615723, -0.9293482899665833, -0.8505688905715942, -0.7717894315719604, -0.6930099725723267, -0.6142305135726929, -0.5354510545730591, -0.45667165517807007, -0.3778921961784363, -0.2991127371788025, -0.2203333079814911, -0.1415538787841797, -0.0627744197845459, 0.016005024313926697, 0.09478446841239929, 0.1735639125108719, 0.2523433566093445, 0.33112281560897827, 0.4099022448062897, 0.4886816740036011, 0.5674610137939453, 0.6462404727935791, 0.7250199317932129, 0.8037993311882019, 0.8825787901878357, 0.9613582491874695, 1.0401376485824585, 1.1189171075820923, 1.197696566581726, 1.2764760255813599, 1.3552554845809937, 1.4340349435806274, 1.5128142833709717, 1.5915937423706055, 1.6703732013702393, 1.749152660369873, 1.8279321193695068, 1.9067115783691406, 1.9854910373687744, 2.064270496368408, 2.143049955368042, 2.221829414367676, 2.3006088733673096, 2.3793883323669434, 2.458167552947998, 2.536947011947632, 2.6157264709472656, 2.6945059299468994, 2.773285388946533, 2.852064847946167, 2.930844306945801, 3.0096235275268555, 3.0884032249450684]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 11.0, 16.0, 10.0, 12.0, 21.0, 24.0, 29.0, 36.0, 42.0, 38.0, 38.0, 40.0, 38.0, 31.0, 46.0, 34.0, 42.0, 42.0, 34.0, 44.0, 42.0, 39.0, 37.0, 23.0, 36.0, 30.0, 27.0, 24.0, 18.0, 13.0, 19.0, 11.0, 9.0, 10.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9091084599494934, -0.8811596035957336, -0.8532107472419739, -0.8252619504928589, -0.7973130941390991, -0.7693642377853394, -0.7414153814315796, -0.7134665250778198, -0.6855176687240601, -0.6575688123703003, -0.6296199560165405, -0.6016710996627808, -0.5737223029136658, -0.545773446559906, -0.5178245902061462, -0.4898757338523865, -0.4619269371032715, -0.4339780807495117, -0.40602925419807434, -0.3780803978443146, -0.3501315712928772, -0.32218271493911743, -0.29423385858535767, -0.2662850022315979, -0.23833617568016052, -0.21038733422756195, -0.18243849277496338, -0.1544896364212036, -0.12654079496860504, -0.09859195351600647, -0.0706430971622467, -0.04269425570964813, -0.014745473861694336, 0.013203371316194534, 0.041152216494083405, 0.06910106539726257, 0.09704990684986115, 0.12499874830245972, 0.15294760465621948, 0.18089644610881805, 0.20884528756141663, 0.2367941290140152, 0.26474297046661377, 0.29269182682037354, 0.3206406831741333, 0.3485895097255707, 0.37653836607933044, 0.4044871926307678, 0.4324360489845276, 0.46038490533828735, 0.48833373188972473, 0.5162825584411621, 0.5442314147949219, 0.5721802711486816, 0.6001291275024414, 0.6280779838562012, 0.6560268402099609, 0.6839756965637207, 0.7119245529174805, 0.7398734092712402, 0.7678222060203552, 0.795771062374115, 0.8237199187278748, 0.8516687750816345, 0.8796175718307495]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 14.0, 18.0, 24.0, 35.0, 52.0, 67.0, 116.0, 198.0, 302.0, 542.0, 1095.0, 2104.0, 4443.0, 9853.0, 23771.0, 64329.0, 204638.0, 838113.0, 1980389.0, 769270.0, 191383.0, 62000.0, 23449.0, 9524.0, 4301.0, 2011.0, 996.0, 562.0, 286.0, 155.0, 94.0, 50.0, 36.0, 17.0, 10.0, 5.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.25146484375, -0.24492835998535156, -0.23839187622070312, -0.2318553924560547, -0.22531890869140625, -0.2187824249267578, -0.21224594116210938, -0.20570945739746094, -0.1991729736328125, -0.19263648986816406, -0.18610000610351562, -0.1795635223388672, -0.17302703857421875, -0.1664905548095703, -0.15995407104492188, -0.15341758728027344, -0.146881103515625, -0.14034461975097656, -0.13380813598632812, -0.1272716522216797, -0.12073516845703125, -0.11419868469238281, -0.10766220092773438, -0.10112571716308594, -0.0945892333984375, -0.08805274963378906, -0.08151626586914062, -0.07497978210449219, -0.06844329833984375, -0.06190681457519531, -0.055370330810546875, -0.04883384704589844, -0.04229736328125, -0.03576087951660156, -0.029224395751953125, -0.022687911987304688, -0.01615142822265625, -0.009614944458007812, -0.003078460693359375, 0.0034580230712890625, 0.0099945068359375, 0.016530990600585938, 0.023067474365234375, 0.029603958129882812, 0.03614044189453125, 0.04267692565917969, 0.049213409423828125, 0.05574989318847656, 0.062286376953125, 0.06882286071777344, 0.07535934448242188, 0.08189582824707031, 0.08843231201171875, 0.09496879577636719, 0.10150527954101562, 0.10804176330566406, 0.1145782470703125, 0.12111473083496094, 0.12765121459960938, 0.1341876983642578, 0.14072418212890625, 0.1472606658935547, 0.15379714965820312, 0.16033363342285156, 0.1668701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 7.0, 7.0, 11.0, 16.0, 19.0, 20.0, 23.0, 16.0, 21.0, 30.0, 28.0, 35.0, 30.0, 41.0, 38.0, 43.0, 43.0, 37.0, 41.0, 45.0, 45.0, 55.0, 38.0, 33.0, 41.0, 27.0, 23.0, 25.0, 24.0, 25.0, 13.0, 24.0, 9.0, 3.0, 8.0, 8.0, 8.0, 6.0, 4.0, 9.0, 1.0, 7.0, 2.0, 4.0, 1.0], "bins": [-0.1402587890625, -0.13648509979248047, -0.13271141052246094, -0.1289377212524414, -0.12516403198242188, -0.12139034271240234, -0.11761665344238281, -0.11384296417236328, -0.11006927490234375, -0.10629558563232422, -0.10252189636230469, -0.09874820709228516, -0.09497451782226562, -0.0912008285522461, -0.08742713928222656, -0.08365345001220703, -0.0798797607421875, -0.07610607147216797, -0.07233238220214844, -0.0685586929321289, -0.06478500366210938, -0.061011314392089844, -0.05723762512207031, -0.05346393585205078, -0.04969024658203125, -0.04591655731201172, -0.04214286804199219, -0.038369178771972656, -0.034595489501953125, -0.030821800231933594, -0.027048110961914062, -0.02327442169189453, -0.019500732421875, -0.01572704315185547, -0.011953353881835938, -0.008179664611816406, -0.004405975341796875, -0.0006322860717773438, 0.0031414031982421875, 0.006915092468261719, 0.01068878173828125, 0.014462471008300781, 0.018236160278320312, 0.022009849548339844, 0.025783538818359375, 0.029557228088378906, 0.03333091735839844, 0.03710460662841797, 0.0408782958984375, 0.04465198516845703, 0.04842567443847656, 0.052199363708496094, 0.055973052978515625, 0.059746742248535156, 0.06352043151855469, 0.06729412078857422, 0.07106781005859375, 0.07484149932861328, 0.07861518859863281, 0.08238887786865234, 0.08616256713867188, 0.0899362564086914, 0.09370994567871094, 0.09748363494873047, 0.10125732421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 10.0, 25.0, 17.0, 28.0, 50.0, 78.0, 115.0, 152.0, 262.0, 421.0, 827.0, 1393.0, 2736.0, 5472.0, 10964.0, 23738.0, 53686.0, 124371.0, 299705.0, 758373.0, 1468235.0, 856040.0, 337399.0, 138758.0, 60081.0, 26680.0, 12200.0, 5774.0, 2878.0, 1549.0, 899.0, 491.0, 289.0, 183.0, 130.0, 67.0, 63.0, 46.0, 27.0, 18.0, 16.0, 8.0, 5.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.16363906860351562, -0.15845489501953125, -0.15327072143554688, -0.1480865478515625, -0.14290237426757812, -0.13771820068359375, -0.13253402709960938, -0.127349853515625, -0.12216567993164062, -0.11698150634765625, -0.11179733276367188, -0.1066131591796875, -0.10142898559570312, -0.09624481201171875, -0.09106063842773438, -0.08587646484375, -0.08069229125976562, -0.07550811767578125, -0.07032394409179688, -0.0651397705078125, -0.059955596923828125, -0.05477142333984375, -0.049587249755859375, -0.044403076171875, -0.039218902587890625, -0.03403472900390625, -0.028850555419921875, -0.0236663818359375, -0.018482208251953125, -0.01329803466796875, -0.008113861083984375, -0.0029296875, 0.002254486083984375, 0.00743865966796875, 0.012622833251953125, 0.0178070068359375, 0.022991180419921875, 0.02817535400390625, 0.033359527587890625, 0.038543701171875, 0.043727874755859375, 0.04891204833984375, 0.054096221923828125, 0.0592803955078125, 0.06446456909179688, 0.06964874267578125, 0.07483291625976562, 0.08001708984375, 0.08520126342773438, 0.09038543701171875, 0.09556961059570312, 0.1007537841796875, 0.10593795776367188, 0.11112213134765625, 0.11630630493164062, 0.121490478515625, 0.12667465209960938, 0.13185882568359375, 0.13704299926757812, 0.1422271728515625, 0.14741134643554688, 0.15259552001953125, 0.15777969360351562, 0.1629638671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 19.0, 31.0, 21.0, 42.0, 54.0, 52.0, 106.0, 157.0, 221.0, 301.0, 450.0, 540.0, 551.0, 427.0, 287.0, 198.0, 149.0, 123.0, 73.0, 67.0, 54.0, 32.0, 31.0, 12.0, 16.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.19412994384765625, -0.1863555908203125, -0.17858123779296875, -0.170806884765625, -0.16303253173828125, -0.1552581787109375, -0.14748382568359375, -0.13970947265625, -0.13193511962890625, -0.1241607666015625, -0.11638641357421875, -0.108612060546875, -0.10083770751953125, -0.0930633544921875, -0.08528900146484375, -0.0775146484375, -0.06974029541015625, -0.0619659423828125, -0.05419158935546875, -0.046417236328125, -0.03864288330078125, -0.0308685302734375, -0.02309417724609375, -0.01531982421875, -0.00754547119140625, 0.0002288818359375, 0.00800323486328125, 0.015777587890625, 0.02355194091796875, 0.0313262939453125, 0.03910064697265625, 0.046875, 0.05464935302734375, 0.0624237060546875, 0.07019805908203125, 0.077972412109375, 0.08574676513671875, 0.0935211181640625, 0.10129547119140625, 0.10906982421875, 0.11684417724609375, 0.1246185302734375, 0.13239288330078125, 0.140167236328125, 0.14794158935546875, 0.1557159423828125, 0.16349029541015625, 0.1712646484375, 0.17903900146484375, 0.1868133544921875, 0.19458770751953125, 0.202362060546875, 0.21013641357421875, 0.2179107666015625, 0.22568511962890625, 0.23345947265625, 0.24123382568359375, 0.2490081787109375, 0.25678253173828125, 0.264556884765625, 0.27233123779296875, 0.2801055908203125, 0.28787994384765625, 0.295654296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 9.0, 18.0, 20.0, 25.0, 33.0, 37.0, 61.0, 72.0, 75.0, 73.0, 79.0, 76.0, 74.0, 67.0, 52.0, 40.0, 52.0, 31.0, 29.0, 20.0, 13.0, 12.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013108611106873, -0.8709077835083008, -0.8405046463012695, -0.8101015686988831, -0.7796984314918518, -0.7492953538894653, -0.7188922166824341, -0.6884891390800476, -0.6580860614776611, -0.6276829838752747, -0.5972798466682434, -0.5668767690658569, -0.5364736318588257, -0.5060705542564392, -0.47566744685173035, -0.4452643394470215, -0.41486120223999023, -0.38445809483528137, -0.3540549874305725, -0.32365190982818604, -0.2932487726211548, -0.2628456950187683, -0.23244258761405945, -0.20203948020935059, -0.17163637280464172, -0.14123326539993286, -0.1108301654458046, -0.08042706549167633, -0.05002395808696747, -0.019620850682258606, 0.010782241821289062, 0.041185349225997925, 0.07158839702606201, 0.10199150443077087, 0.13239461183547974, 0.1627977043390274, 0.19320081174373627, 0.22360391914844513, 0.2540070116519928, 0.28441011905670166, 0.3148132264614105, 0.3452163338661194, 0.37561944127082825, 0.4060225486755371, 0.4364256262779236, 0.46682876348495483, 0.4972318410873413, 0.5276349782943726, 0.558038055896759, 0.5884411334991455, 0.6188442707061768, 0.6492473483085632, 0.6796504855155945, 0.710053563117981, 0.7404567003250122, 0.7708597779273987, 0.8012628555297852, 0.8316659331321716, 0.8620690703392029, 0.8924721479415894, 0.9228752851486206, 0.9532783627510071, 0.9836814403533936, 1.0140845775604248, 1.044487714767456]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 11.0, 9.0, 15.0, 19.0, 31.0, 24.0, 32.0, 30.0, 32.0, 40.0, 42.0, 38.0, 42.0, 38.0, 46.0, 43.0, 52.0, 42.0, 33.0, 32.0, 44.0, 45.0, 29.0, 32.0, 31.0, 21.0, 21.0, 28.0, 13.0, 8.0, 11.0, 12.0, 4.0, 5.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6664804816246033, -0.6417678594589233, -0.6170551776885986, -0.5923425555229187, -0.5676299333572388, -0.5429172515869141, -0.5182046294212341, -0.4934920072555542, -0.4687793552875519, -0.44406670331954956, -0.41935408115386963, -0.3946414291858673, -0.369928777217865, -0.34521615505218506, -0.32050350308418274, -0.2957908511161804, -0.2710782289505005, -0.24636559188365936, -0.22165295481681824, -0.19694030284881592, -0.1722276657819748, -0.14751502871513367, -0.12280237674713135, -0.09808973968029022, -0.0733771026134491, -0.04866446182131767, -0.02395182102918625, 0.0007608234882354736, 0.0254734605550766, 0.050186097621917725, 0.07489874958992004, 0.09961138665676117, 0.12432408332824707, 0.1490367203950882, 0.17374935746192932, 0.19846200942993164, 0.22317464649677277, 0.2478872835636139, 0.2725999355316162, 0.29731255769729614, 0.32202520966529846, 0.3467378616333008, 0.3714504837989807, 0.39616313576698303, 0.42087578773498535, 0.4455884099006653, 0.4703010618686676, 0.4950137138366699, 0.5197263360023499, 0.5444389581680298, 0.5691516399383545, 0.5938642621040344, 0.6185768842697144, 0.6432895660400391, 0.668002188205719, 0.6927148103713989, 0.7174274921417236, 0.7421401143074036, 0.7668527960777283, 0.7915654182434082, 0.8162780404090881, 0.8409906625747681, 0.8657033443450928, 0.8904159665107727, 0.9151285886764526]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 20.0, 15.0, 25.0, 29.0, 35.0, 47.0, 103.0, 135.0, 224.0, 325.0, 585.0, 972.0, 1795.0, 3131.0, 5548.0, 9845.0, 17481.0, 29939.0, 49923.0, 81526.0, 123659.0, 171249.0, 180242.0, 138900.0, 92431.0, 58222.0, 34889.0, 20297.0, 11817.0, 6517.0, 3643.0, 2128.0, 1115.0, 655.0, 376.0, 262.0, 152.0, 105.0, 56.0, 39.0, 26.0, 25.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2490234375, -0.24151039123535156, -0.23399734497070312, -0.2264842987060547, -0.21897125244140625, -0.2114582061767578, -0.20394515991210938, -0.19643211364746094, -0.1889190673828125, -0.18140602111816406, -0.17389297485351562, -0.1663799285888672, -0.15886688232421875, -0.1513538360595703, -0.14384078979492188, -0.13632774353027344, -0.128814697265625, -0.12130165100097656, -0.11378860473632812, -0.10627555847167969, -0.09876251220703125, -0.09124946594238281, -0.08373641967773438, -0.07622337341308594, -0.0687103271484375, -0.06119728088378906, -0.053684234619140625, -0.04617118835449219, -0.03865814208984375, -0.031145095825195312, -0.023632049560546875, -0.016119003295898438, -0.00860595703125, -0.0010929107666015625, 0.006420135498046875, 0.013933181762695312, 0.02144622802734375, 0.028959274291992188, 0.036472320556640625, 0.04398536682128906, 0.0514984130859375, 0.05901145935058594, 0.06652450561523438, 0.07403755187988281, 0.08155059814453125, 0.08906364440917969, 0.09657669067382812, 0.10408973693847656, 0.111602783203125, 0.11911582946777344, 0.12662887573242188, 0.1341419219970703, 0.14165496826171875, 0.1491680145263672, 0.15668106079101562, 0.16419410705566406, 0.1717071533203125, 0.17922019958496094, 0.18673324584960938, 0.1942462921142578, 0.20175933837890625, 0.2092723846435547, 0.21678543090820312, 0.22429847717285156, 0.2318115234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 3.0, 4.0, 9.0, 12.0, 7.0, 14.0, 12.0, 23.0, 18.0, 25.0, 21.0, 25.0, 31.0, 34.0, 32.0, 41.0, 36.0, 38.0, 40.0, 34.0, 53.0, 49.0, 35.0, 42.0, 40.0, 31.0, 25.0, 32.0, 24.0, 37.0, 26.0, 24.0, 17.0, 13.0, 18.0, 8.0, 7.0, 11.0, 8.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1112060546875, -0.10775566101074219, -0.10430526733398438, -0.10085487365722656, -0.09740447998046875, -0.09395408630371094, -0.09050369262695312, -0.08705329895019531, -0.0836029052734375, -0.08015251159667969, -0.07670211791992188, -0.07325172424316406, -0.06980133056640625, -0.06635093688964844, -0.06290054321289062, -0.05945014953613281, -0.055999755859375, -0.05254936218261719, -0.049098968505859375, -0.04564857482910156, -0.04219818115234375, -0.03874778747558594, -0.035297393798828125, -0.03184700012207031, -0.0283966064453125, -0.024946212768554688, -0.021495819091796875, -0.018045425415039062, -0.01459503173828125, -0.011144638061523438, -0.007694244384765625, -0.0042438507080078125, -0.00079345703125, 0.0026569366455078125, 0.006107330322265625, 0.009557723999023438, 0.01300811767578125, 0.016458511352539062, 0.019908905029296875, 0.023359298706054688, 0.0268096923828125, 0.030260086059570312, 0.033710479736328125, 0.03716087341308594, 0.04061126708984375, 0.04406166076660156, 0.047512054443359375, 0.05096244812011719, 0.054412841796875, 0.05786323547363281, 0.061313629150390625, 0.06476402282714844, 0.06821441650390625, 0.07166481018066406, 0.07511520385742188, 0.07856559753417969, 0.0820159912109375, 0.08546638488769531, 0.08891677856445312, 0.09236717224121094, 0.09581756591796875, 0.09926795959472656, 0.10271835327148438, 0.10616874694824219, 0.109619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 10.0, 9.0, 18.0, 31.0, 33.0, 51.0, 60.0, 88.0, 121.0, 251.0, 420.0, 804.0, 1662.0, 3546.0, 7510.0, 16413.0, 34450.0, 70856.0, 131476.0, 210870.0, 231887.0, 161376.0, 90058.0, 45448.0, 21772.0, 10165.0, 4667.0, 2103.0, 1037.0, 524.0, 285.0, 187.0, 102.0, 57.0, 55.0, 45.0, 20.0, 16.0, 14.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24803543090820312, -0.23923492431640625, -0.23043441772460938, -0.2216339111328125, -0.21283340454101562, -0.20403289794921875, -0.19523239135742188, -0.186431884765625, -0.17763137817382812, -0.16883087158203125, -0.16003036499023438, -0.1512298583984375, -0.14242935180664062, -0.13362884521484375, -0.12482833862304688, -0.11602783203125, -0.10722732543945312, -0.09842681884765625, -0.08962631225585938, -0.0808258056640625, -0.07202529907226562, -0.06322479248046875, -0.054424285888671875, -0.045623779296875, -0.036823272705078125, -0.02802276611328125, -0.019222259521484375, -0.0104217529296875, -0.001621246337890625, 0.00717926025390625, 0.015979766845703125, 0.0247802734375, 0.033580780029296875, 0.04238128662109375, 0.051181793212890625, 0.0599822998046875, 0.06878280639648438, 0.07758331298828125, 0.08638381958007812, 0.095184326171875, 0.10398483276367188, 0.11278533935546875, 0.12158584594726562, 0.1303863525390625, 0.13918685913085938, 0.14798736572265625, 0.15678787231445312, 0.16558837890625, 0.17438888549804688, 0.18318939208984375, 0.19198989868164062, 0.2007904052734375, 0.20959091186523438, 0.21839141845703125, 0.22719192504882812, 0.235992431640625, 0.24479293823242188, 0.25359344482421875, 0.2623939514160156, 0.2711944580078125, 0.2799949645996094, 0.28879547119140625, 0.2975959777832031, 0.306396484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 11.0, 17.0, 12.0, 13.0, 25.0, 24.0, 38.0, 36.0, 29.0, 41.0, 40.0, 47.0, 38.0, 31.0, 45.0, 38.0, 46.0, 39.0, 51.0, 45.0, 36.0, 27.0, 31.0, 32.0, 29.0, 24.0, 24.0, 16.0, 17.0, 16.0, 14.0, 7.0, 7.0, 6.0, 8.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.3612098693847656, -0.35059356689453125, -0.3399772644042969, -0.3293609619140625, -0.3187446594238281, -0.30812835693359375, -0.2975120544433594, -0.286895751953125, -0.2762794494628906, -0.26566314697265625, -0.2550468444824219, -0.2444305419921875, -0.23381423950195312, -0.22319793701171875, -0.21258163452148438, -0.20196533203125, -0.19134902954101562, -0.18073272705078125, -0.17011642456054688, -0.1595001220703125, -0.14888381958007812, -0.13826751708984375, -0.12765121459960938, -0.117034912109375, -0.10641860961914062, -0.09580230712890625, -0.08518600463867188, -0.0745697021484375, -0.06395339965820312, -0.05333709716796875, -0.042720794677734375, -0.0321044921875, -0.021488189697265625, -0.01087188720703125, -0.000255584716796875, 0.0103607177734375, 0.020977020263671875, 0.03159332275390625, 0.042209625244140625, 0.052825927734375, 0.06344223022460938, 0.07405853271484375, 0.08467483520507812, 0.0952911376953125, 0.10590744018554688, 0.11652374267578125, 0.12714004516601562, 0.13775634765625, 0.14837265014648438, 0.15898895263671875, 0.16960525512695312, 0.1802215576171875, 0.19083786010742188, 0.20145416259765625, 0.21207046508789062, 0.222686767578125, 0.23330307006835938, 0.24391937255859375, 0.2545356750488281, 0.2651519775390625, 0.2757682800292969, 0.28638458251953125, 0.2970008850097656, 0.3076171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 13.0, 11.0, 14.0, 24.0, 33.0, 55.0, 111.0, 152.0, 255.0, 413.0, 700.0, 1305.0, 2378.0, 4249.0, 7600.0, 13902.0, 25046.0, 43501.0, 73482.0, 117287.0, 164099.0, 182994.0, 153573.0, 105560.0, 65078.0, 37969.0, 21792.0, 11990.0, 6699.0, 3571.0, 2042.0, 1089.0, 615.0, 357.0, 225.0, 128.0, 77.0, 62.0, 32.0, 18.0, 17.0, 16.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.08966064453125, -0.0869741439819336, -0.08428764343261719, -0.08160114288330078, -0.07891464233398438, -0.07622814178466797, -0.07354164123535156, -0.07085514068603516, -0.06816864013671875, -0.06548213958740234, -0.06279563903808594, -0.06010913848876953, -0.057422637939453125, -0.05473613739013672, -0.05204963684082031, -0.049363136291503906, -0.0466766357421875, -0.043990135192871094, -0.04130363464355469, -0.03861713409423828, -0.035930633544921875, -0.03324413299560547, -0.030557632446289062, -0.027871131896972656, -0.02518463134765625, -0.022498130798339844, -0.019811630249023438, -0.01712512969970703, -0.014438629150390625, -0.011752128601074219, -0.009065628051757812, -0.006379127502441406, -0.003692626953125, -0.0010061264038085938, 0.0016803741455078125, 0.004366874694824219, 0.007053375244140625, 0.009739875793457031, 0.012426376342773438, 0.015112876892089844, 0.01779937744140625, 0.020485877990722656, 0.023172378540039062, 0.02585887908935547, 0.028545379638671875, 0.03123188018798828, 0.03391838073730469, 0.036604881286621094, 0.0392913818359375, 0.041977882385253906, 0.04466438293457031, 0.04735088348388672, 0.050037384033203125, 0.05272388458251953, 0.05541038513183594, 0.058096885681152344, 0.06078338623046875, 0.06346988677978516, 0.06615638732910156, 0.06884288787841797, 0.07152938842773438, 0.07421588897705078, 0.07690238952636719, 0.0795888900756836, 0.082275390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 4.0, 8.0, 9.0, 14.0, 12.0, 21.0, 25.0, 31.0, 32.0, 29.0, 42.0, 62.0, 77.0, 73.0, 87.0, 94.0, 50.0, 60.0, 48.0, 38.0, 29.0, 31.0, 16.0, 20.0, 12.0, 7.0, 11.0, 12.0, 12.0, 6.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.641843795776367e-05, -3.539677709341049e-05, -3.437511622905731e-05, -3.335345536470413e-05, -3.233179450035095e-05, -3.131013363599777e-05, -3.0288472771644592e-05, -2.9266811907291412e-05, -2.8245151042938232e-05, -2.7223490178585052e-05, -2.6201829314231873e-05, -2.5180168449878693e-05, -2.4158507585525513e-05, -2.3136846721172333e-05, -2.2115185856819153e-05, -2.1093524992465973e-05, -2.0071864128112793e-05, -1.9050203263759613e-05, -1.8028542399406433e-05, -1.7006881535053253e-05, -1.5985220670700073e-05, -1.4963559806346893e-05, -1.3941898941993713e-05, -1.2920238077640533e-05, -1.1898577213287354e-05, -1.0876916348934174e-05, -9.855255484580994e-06, -8.833594620227814e-06, -7.811933755874634e-06, -6.790272891521454e-06, -5.768612027168274e-06, -4.746951162815094e-06, -3.725290298461914e-06, -2.703629434108734e-06, -1.6819685697555542e-06, -6.603077054023743e-07, 3.6135315895080566e-07, 1.3830140233039856e-06, 2.4046748876571655e-06, 3.4263357520103455e-06, 4.447996616363525e-06, 5.469657480716705e-06, 6.491318345069885e-06, 7.512979209423065e-06, 8.534640073776245e-06, 9.556300938129425e-06, 1.0577961802482605e-05, 1.1599622666835785e-05, 1.2621283531188965e-05, 1.3642944395542145e-05, 1.4664605259895325e-05, 1.5686266124248505e-05, 1.6707926988601685e-05, 1.7729587852954865e-05, 1.8751248717308044e-05, 1.9772909581661224e-05, 2.0794570446014404e-05, 2.1816231310367584e-05, 2.2837892174720764e-05, 2.3859553039073944e-05, 2.4881213903427124e-05, 2.5902874767780304e-05, 2.6924535632133484e-05, 2.7946196496486664e-05, 2.8967857360839844e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 12.0, 6.0, 13.0, 19.0, 39.0, 53.0, 54.0, 94.0, 153.0, 290.0, 535.0, 1237.0, 2597.0, 5428.0, 11988.0, 26274.0, 57560.0, 118648.0, 209842.0, 254092.0, 180138.0, 95778.0, 45455.0, 20616.0, 9444.0, 4235.0, 1933.0, 987.0, 455.0, 222.0, 136.0, 67.0, 46.0, 34.0, 23.0, 9.0, 15.0, 8.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.1032266616821289, -0.09982490539550781, -0.09642314910888672, -0.09302139282226562, -0.08961963653564453, -0.08621788024902344, -0.08281612396240234, -0.07941436767578125, -0.07601261138916016, -0.07261085510253906, -0.06920909881591797, -0.06580734252929688, -0.06240558624267578, -0.05900382995605469, -0.055602073669433594, -0.0522003173828125, -0.048798561096191406, -0.04539680480957031, -0.04199504852294922, -0.038593292236328125, -0.03519153594970703, -0.03178977966308594, -0.028388023376464844, -0.02498626708984375, -0.021584510803222656, -0.018182754516601562, -0.014780998229980469, -0.011379241943359375, -0.007977485656738281, -0.0045757293701171875, -0.0011739730834960938, 0.002227783203125, 0.005629539489746094, 0.009031295776367188, 0.012433052062988281, 0.015834808349609375, 0.01923656463623047, 0.022638320922851562, 0.026040077209472656, 0.02944183349609375, 0.032843589782714844, 0.03624534606933594, 0.03964710235595703, 0.043048858642578125, 0.04645061492919922, 0.04985237121582031, 0.053254127502441406, 0.0566558837890625, 0.060057640075683594, 0.06345939636230469, 0.06686115264892578, 0.07026290893554688, 0.07366466522216797, 0.07706642150878906, 0.08046817779541016, 0.08386993408203125, 0.08727169036865234, 0.09067344665527344, 0.09407520294189453, 0.09747695922851562, 0.10087871551513672, 0.10428047180175781, 0.1076822280883789, 0.111083984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 7.0, 7.0, 16.0, 18.0, 14.0, 26.0, 25.0, 26.0, 27.0, 32.0, 62.0, 42.0, 66.0, 58.0, 55.0, 62.0, 56.0, 60.0, 54.0, 36.0, 41.0, 34.0, 20.0, 26.0, 16.0, 22.0, 10.0, 10.0, 16.0, 10.0, 7.0, 9.0, 2.0, 5.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09320926666259766, -0.09028816223144531, -0.08736705780029297, -0.08444595336914062, -0.08152484893798828, -0.07860374450683594, -0.0756826400756836, -0.07276153564453125, -0.0698404312133789, -0.06691932678222656, -0.06399822235107422, -0.061077117919921875, -0.05815601348876953, -0.05523490905761719, -0.052313804626464844, -0.0493927001953125, -0.046471595764160156, -0.04355049133300781, -0.04062938690185547, -0.037708282470703125, -0.03478717803955078, -0.03186607360839844, -0.028944969177246094, -0.02602386474609375, -0.023102760314941406, -0.020181655883789062, -0.01726055145263672, -0.014339447021484375, -0.011418342590332031, -0.008497238159179688, -0.005576133728027344, -0.002655029296875, 0.00026607513427734375, 0.0031871795654296875, 0.006108283996582031, 0.009029388427734375, 0.011950492858886719, 0.014871597290039062, 0.017792701721191406, 0.02071380615234375, 0.023634910583496094, 0.026556015014648438, 0.02947711944580078, 0.032398223876953125, 0.03531932830810547, 0.03824043273925781, 0.041161537170410156, 0.0440826416015625, 0.047003746032714844, 0.04992485046386719, 0.05284595489501953, 0.055767059326171875, 0.05868816375732422, 0.06160926818847656, 0.0645303726196289, 0.06745147705078125, 0.0703725814819336, 0.07329368591308594, 0.07621479034423828, 0.07913589477539062, 0.08205699920654297, 0.08497810363769531, 0.08789920806884766, 0.0908203125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 6.0, 14.0, 29.0, 37.0, 45.0, 70.0, 78.0, 107.0, 111.0, 105.0, 107.0, 82.0, 60.0, 50.0, 39.0, 22.0, 12.0, 17.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.929495096206665, -1.8840177059173584, -1.8385404348373413, -1.7930631637573242, -1.7475857734680176, -1.702108383178711, -1.6566311120986938, -1.6111538410186768, -1.5656764507293701, -1.5201990604400635, -1.4747217893600464, -1.4292445182800293, -1.3837671279907227, -1.338289737701416, -1.292812466621399, -1.2473351955413818, -1.2018578052520752, -1.1563804149627686, -1.1109031438827515, -1.0654258728027344, -1.0199484825134277, -0.9744711518287659, -0.928993821144104, -0.8835164904594421, -0.8380391597747803, -0.7925618290901184, -0.7470844984054565, -0.7016071677207947, -0.6561298370361328, -0.610652506351471, -0.5651751756668091, -0.5196978449821472, -0.4742205739021301, -0.42874324321746826, -0.3832659125328064, -0.33778858184814453, -0.29231125116348267, -0.2468339204788208, -0.20135658979415894, -0.15587925910949707, -0.1104019284248352, -0.06492459774017334, -0.019447267055511475, 0.02603006362915039, 0.07150739431381226, 0.11698472499847412, 0.162462055683136, 0.20793938636779785, 0.2534167170524597, 0.2988940477371216, 0.34437137842178345, 0.3898487091064453, 0.4353260397911072, 0.48080337047576904, 0.5262807011604309, 0.5717580318450928, 0.6172353625297546, 0.6627126932144165, 0.7081900238990784, 0.7536673545837402, 0.7991446852684021, 0.844622015953064, 0.8900993466377258, 0.9355766773223877, 0.9810540080070496]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 12.0, 10.0, 12.0, 11.0, 14.0, 17.0, 23.0, 17.0, 26.0, 15.0, 17.0, 33.0, 26.0, 33.0, 25.0, 41.0, 52.0, 46.0, 53.0, 35.0, 36.0, 43.0, 42.0, 28.0, 27.0, 29.0, 36.0, 27.0, 28.0, 23.0, 20.0, 21.0, 15.0, 15.0, 8.0, 18.0, 12.0, 8.0, 8.0, 8.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.8066449761390686, -0.7823349833488464, -0.758025050163269, -0.7337150573730469, -0.7094050645828247, -0.6850950717926025, -0.6607850790023804, -0.636475145816803, -0.6121651530265808, -0.5878551602363586, -0.5635452270507812, -0.5392352342605591, -0.5149252414703369, -0.49061524868011475, -0.46630528569221497, -0.4419953227043152, -0.417685329914093, -0.39337533712387085, -0.36906537413597107, -0.3447554111480713, -0.3204454183578491, -0.29613542556762695, -0.2718254625797272, -0.2475154846906662, -0.22320550680160522, -0.19889552891254425, -0.17458555102348328, -0.1502755731344223, -0.12596559524536133, -0.10165561735630035, -0.07734563946723938, -0.053035661578178406, -0.028725624084472656, -0.004415646195411682, 0.019894331693649292, 0.044204309582710266, 0.06851428747177124, 0.09282426536083221, 0.11713424324989319, 0.14144422113895416, 0.16575419902801514, 0.1900641769170761, 0.21437415480613708, 0.23868413269519806, 0.26299411058425903, 0.2873041033744812, 0.311614066362381, 0.33592402935028076, 0.36023402214050293, 0.3845440149307251, 0.4088539779186249, 0.43316394090652466, 0.4574739336967468, 0.481783926486969, 0.5060938596725464, 0.5304038524627686, 0.5547138452529907, 0.5790238380432129, 0.6033338308334351, 0.6276437640190125, 0.6519537568092346, 0.6762637495994568, 0.7005736827850342, 0.7248836755752563, 0.7491936683654785]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 16.0, 16.0, 22.0, 26.0, 53.0, 78.0, 131.0, 184.0, 286.0, 464.0, 826.0, 1488.0, 3095.0, 6647.0, 14566.0, 35309.0, 94261.0, 305403.0, 1251536.0, 1800266.0, 466303.0, 131737.0, 46763.0, 18613.0, 8122.0, 3851.0, 1883.0, 997.0, 517.0, 311.0, 202.0, 118.0, 60.0, 31.0, 33.0, 21.0, 10.0, 8.0, 4.0, 10.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.19905471801757812, -0.19266510009765625, -0.18627548217773438, -0.1798858642578125, -0.17349624633789062, -0.16710662841796875, -0.16071701049804688, -0.154327392578125, -0.14793777465820312, -0.14154815673828125, -0.13515853881835938, -0.1287689208984375, -0.12237930297851562, -0.11598968505859375, -0.10960006713867188, -0.10321044921875, -0.09682083129882812, -0.09043121337890625, -0.08404159545898438, -0.0776519775390625, -0.07126235961914062, -0.06487274169921875, -0.058483123779296875, -0.052093505859375, -0.045703887939453125, -0.03931427001953125, -0.032924652099609375, -0.0265350341796875, -0.020145416259765625, -0.01375579833984375, -0.007366180419921875, -0.0009765625, 0.005413055419921875, 0.01180267333984375, 0.018192291259765625, 0.0245819091796875, 0.030971527099609375, 0.03736114501953125, 0.043750762939453125, 0.050140380859375, 0.056529998779296875, 0.06291961669921875, 0.06930923461914062, 0.0756988525390625, 0.08208847045898438, 0.08847808837890625, 0.09486770629882812, 0.10125732421875, 0.10764694213867188, 0.11403656005859375, 0.12042617797851562, 0.1268157958984375, 0.13320541381835938, 0.13959503173828125, 0.14598464965820312, 0.152374267578125, 0.15876388549804688, 0.16515350341796875, 0.17154312133789062, 0.1779327392578125, 0.18432235717773438, 0.19071197509765625, 0.19710159301757812, 0.2034912109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 7.0, 6.0, 9.0, 22.0, 16.0, 20.0, 26.0, 23.0, 20.0, 26.0, 35.0, 32.0, 29.0, 38.0, 32.0, 36.0, 48.0, 48.0, 41.0, 44.0, 51.0, 36.0, 36.0, 35.0, 46.0, 28.0, 33.0, 21.0, 21.0, 23.0, 10.0, 15.0, 12.0, 9.0, 12.0, 11.0, 6.0, 3.0, 2.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1309814453125, -0.12713909149169922, -0.12329673767089844, -0.11945438385009766, -0.11561203002929688, -0.1117696762084961, -0.10792732238769531, -0.10408496856689453, -0.10024261474609375, -0.09640026092529297, -0.09255790710449219, -0.0887155532836914, -0.08487319946289062, -0.08103084564208984, -0.07718849182128906, -0.07334613800048828, -0.0695037841796875, -0.06566143035888672, -0.06181907653808594, -0.057976722717285156, -0.054134368896484375, -0.050292015075683594, -0.04644966125488281, -0.04260730743408203, -0.03876495361328125, -0.03492259979248047, -0.031080245971679688, -0.027237892150878906, -0.023395538330078125, -0.019553184509277344, -0.015710830688476562, -0.011868476867675781, -0.008026123046875, -0.004183769226074219, -0.0003414154052734375, 0.0035009384155273438, 0.007343292236328125, 0.011185646057128906, 0.015027999877929688, 0.01887035369873047, 0.02271270751953125, 0.02655506134033203, 0.030397415161132812, 0.034239768981933594, 0.038082122802734375, 0.041924476623535156, 0.04576683044433594, 0.04960918426513672, 0.0534515380859375, 0.05729389190673828, 0.06113624572753906, 0.06497859954833984, 0.06882095336914062, 0.0726633071899414, 0.07650566101074219, 0.08034801483154297, 0.08419036865234375, 0.08803272247314453, 0.09187507629394531, 0.0957174301147461, 0.09955978393554688, 0.10340213775634766, 0.10724449157714844, 0.11108684539794922, 0.11492919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 10.0, 17.0, 24.0, 36.0, 38.0, 68.0, 82.0, 141.0, 208.0, 310.0, 459.0, 767.0, 1307.0, 2386.0, 4371.0, 8912.0, 18282.0, 40476.0, 93554.0, 233689.0, 621566.0, 1478330.0, 1039192.0, 384765.0, 148838.0, 61930.0, 27503.0, 12884.0, 6262.0, 3220.0, 1802.0, 1013.0, 623.0, 429.0, 227.0, 165.0, 103.0, 74.0, 55.0, 44.0, 24.0, 19.0, 19.0, 13.0, 7.0, 9.0, 8.0, 0.0, 3.0, 3.0, 2.0], "bins": [-0.2030029296875, -0.19716262817382812, -0.19132232666015625, -0.18548202514648438, -0.1796417236328125, -0.17380142211914062, -0.16796112060546875, -0.16212081909179688, -0.156280517578125, -0.15044021606445312, -0.14459991455078125, -0.13875961303710938, -0.1329193115234375, -0.12707901000976562, -0.12123870849609375, -0.11539840698242188, -0.10955810546875, -0.10371780395507812, -0.09787750244140625, -0.09203720092773438, -0.0861968994140625, -0.08035659790039062, -0.07451629638671875, -0.06867599487304688, -0.062835693359375, -0.056995391845703125, -0.05115509033203125, -0.045314788818359375, -0.0394744873046875, -0.033634185791015625, -0.02779388427734375, -0.021953582763671875, -0.01611328125, -0.010272979736328125, -0.00443267822265625, 0.001407623291015625, 0.0072479248046875, 0.013088226318359375, 0.01892852783203125, 0.024768829345703125, 0.030609130859375, 0.036449432373046875, 0.04228973388671875, 0.048130035400390625, 0.0539703369140625, 0.059810638427734375, 0.06565093994140625, 0.07149124145507812, 0.07733154296875, 0.08317184448242188, 0.08901214599609375, 0.09485244750976562, 0.1006927490234375, 0.10653305053710938, 0.11237335205078125, 0.11821365356445312, 0.124053955078125, 0.12989425659179688, 0.13573455810546875, 0.14157485961914062, 0.1474151611328125, 0.15325546264648438, 0.15909576416015625, 0.16493606567382812, 0.1707763671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 13.0, 14.0, 10.0, 8.0, 20.0, 21.0, 31.0, 47.0, 74.0, 102.0, 112.0, 164.0, 233.0, 339.0, 430.0, 558.0, 537.0, 415.0, 271.0, 197.0, 128.0, 93.0, 68.0, 49.0, 29.0, 25.0, 20.0, 16.0, 14.0, 10.0, 5.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1912841796875, -0.18386268615722656, -0.17644119262695312, -0.1690196990966797, -0.16159820556640625, -0.1541767120361328, -0.14675521850585938, -0.13933372497558594, -0.1319122314453125, -0.12449073791503906, -0.11706924438476562, -0.10964775085449219, -0.10222625732421875, -0.09480476379394531, -0.08738327026367188, -0.07996177673339844, -0.072540283203125, -0.06511878967285156, -0.057697296142578125, -0.05027580261230469, -0.04285430908203125, -0.03543281555175781, -0.028011322021484375, -0.020589828491210938, -0.0131683349609375, -0.0057468414306640625, 0.001674652099609375, 0.009096145629882812, 0.01651763916015625, 0.023939132690429688, 0.031360626220703125, 0.03878211975097656, 0.04620361328125, 0.05362510681152344, 0.061046600341796875, 0.06846809387207031, 0.07588958740234375, 0.08331108093261719, 0.09073257446289062, 0.09815406799316406, 0.1055755615234375, 0.11299705505371094, 0.12041854858398438, 0.1278400421142578, 0.13526153564453125, 0.1426830291748047, 0.15010452270507812, 0.15752601623535156, 0.164947509765625, 0.17236900329589844, 0.17979049682617188, 0.1872119903564453, 0.19463348388671875, 0.2020549774169922, 0.20947647094726562, 0.21689796447753906, 0.2243194580078125, 0.23174095153808594, 0.23916244506835938, 0.2465839385986328, 0.25400543212890625, 0.2614269256591797, 0.2688484191894531, 0.27626991271972656, 0.28369140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 12.0, 15.0, 21.0, 32.0, 29.0, 38.0, 50.0, 61.0, 78.0, 84.0, 74.0, 84.0, 74.0, 67.0, 66.0, 53.0, 47.0, 39.0, 22.0, 10.0, 6.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.221909999847412, -1.1901782751083374, -1.1584465503692627, -1.126714825630188, -1.0949831008911133, -1.0632513761520386, -1.0315196514129639, -0.9997879862785339, -0.9680562615394592, -0.9363245368003845, -0.9045928120613098, -0.8728610873222351, -0.8411294221878052, -0.8093976974487305, -0.7776659727096558, -0.745934247970581, -0.7142025232315063, -0.6824707984924316, -0.6507390737533569, -0.6190073490142822, -0.5872756242752075, -0.5555438995361328, -0.5238122344017029, -0.4920805096626282, -0.46034878492355347, -0.42861706018447876, -0.39688533544540405, -0.36515364050865173, -0.333421915769577, -0.3016901910305023, -0.26995849609375, -0.2382267713546753, -0.20649516582489014, -0.17476344108581543, -0.14303173124790192, -0.1113000139594078, -0.0795682966709137, -0.04783657193183899, -0.016104862093925476, 0.015626847743988037, 0.047358572483062744, 0.07909028977155685, 0.11082200706005096, 0.14255371689796448, 0.17428544163703918, 0.2060171663761139, 0.2377488762140274, 0.2694805860519409, 0.3012123107910156, 0.33294403553009033, 0.36467576026916504, 0.39640745520591736, 0.42813917994499207, 0.4598709046840668, 0.4916025996208191, 0.5233343243598938, 0.5550660490989685, 0.5867977738380432, 0.6185294985771179, 0.6502612233161926, 0.6819928884506226, 0.7137246131896973, 0.745456337928772, 0.7771880626678467, 0.8089197874069214]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 8.0, 8.0, 18.0, 15.0, 23.0, 24.0, 19.0, 31.0, 30.0, 26.0, 31.0, 39.0, 27.0, 32.0, 45.0, 38.0, 38.0, 42.0, 46.0, 39.0, 38.0, 45.0, 27.0, 24.0, 33.0, 26.0, 38.0, 27.0, 20.0, 10.0, 21.0, 16.0, 6.0, 10.0, 15.0, 6.0, 7.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5798817873001099, -0.5607486963272095, -0.5416156053543091, -0.5224825143814087, -0.5033494234085083, -0.4842163324356079, -0.46508321166038513, -0.44595012068748474, -0.42681702971458435, -0.40768393874168396, -0.38855084776878357, -0.3694177567958832, -0.3502846360206604, -0.33115154504776, -0.3120184540748596, -0.29288536310195923, -0.27375227212905884, -0.25461918115615845, -0.23548609018325806, -0.21635298430919647, -0.19721989333629608, -0.1780868023633957, -0.1589536964893341, -0.13982060551643372, -0.12068751454353333, -0.10155442357063293, -0.08242132514715195, -0.06328822672367096, -0.04415513575077057, -0.025022044777870178, -0.005888946354389191, 0.013244152069091797, 0.03237724304199219, 0.05151033774018288, 0.07064343243837357, 0.08977653086185455, 0.10890962183475494, 0.12804271280765533, 0.14717581868171692, 0.1663089096546173, 0.1854420006275177, 0.2045750916004181, 0.22370818257331848, 0.24284128844738007, 0.26197439432144165, 0.28110748529434204, 0.30024057626724243, 0.3193736672401428, 0.3385067582130432, 0.3576398491859436, 0.376772940158844, 0.3959060311317444, 0.4150391221046448, 0.43417221307754517, 0.45330533385276794, 0.47243842482566833, 0.4915715157985687, 0.5107046365737915, 0.5298377275466919, 0.5489708185195923, 0.5681039094924927, 0.5872370004653931, 0.6063700914382935, 0.6255031824111938, 0.6446362733840942]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 11.0, 19.0, 20.0, 42.0, 47.0, 66.0, 102.0, 175.0, 275.0, 512.0, 802.0, 1310.0, 2291.0, 3973.0, 6465.0, 10770.0, 18264.0, 30796.0, 53986.0, 96231.0, 165452.0, 218230.0, 182256.0, 109484.0, 61618.0, 34942.0, 20328.0, 12193.0, 7184.0, 4297.0, 2627.0, 1536.0, 860.0, 523.0, 322.0, 214.0, 116.0, 73.0, 46.0, 30.0, 15.0, 12.0, 6.0, 5.0, 5.0, 7.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2275390625, -0.22034072875976562, -0.21314239501953125, -0.20594406127929688, -0.1987457275390625, -0.19154739379882812, -0.18434906005859375, -0.17715072631835938, -0.169952392578125, -0.16275405883789062, -0.15555572509765625, -0.14835739135742188, -0.1411590576171875, -0.13396072387695312, -0.12676239013671875, -0.11956405639648438, -0.11236572265625, -0.10516738891601562, -0.09796905517578125, -0.09077072143554688, -0.0835723876953125, -0.07637405395507812, -0.06917572021484375, -0.061977386474609375, -0.054779052734375, -0.047580718994140625, -0.04038238525390625, -0.033184051513671875, -0.0259857177734375, -0.018787384033203125, -0.01158905029296875, -0.004390716552734375, 0.0028076171875, 0.010005950927734375, 0.01720428466796875, 0.024402618408203125, 0.0316009521484375, 0.038799285888671875, 0.04599761962890625, 0.053195953369140625, 0.060394287109375, 0.06759262084960938, 0.07479095458984375, 0.08198928833007812, 0.0891876220703125, 0.09638595581054688, 0.10358428955078125, 0.11078262329101562, 0.11798095703125, 0.12517929077148438, 0.13237762451171875, 0.13957595825195312, 0.1467742919921875, 0.15397262573242188, 0.16117095947265625, 0.16836929321289062, 0.175567626953125, 0.18276596069335938, 0.18996429443359375, 0.19716262817382812, 0.2043609619140625, 0.21155929565429688, 0.21875762939453125, 0.22595596313476562, 0.233154296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 3.0, 8.0, 6.0, 6.0, 20.0, 14.0, 13.0, 15.0, 25.0, 25.0, 28.0, 31.0, 19.0, 36.0, 22.0, 33.0, 42.0, 43.0, 57.0, 33.0, 41.0, 49.0, 37.0, 40.0, 40.0, 32.0, 43.0, 31.0, 30.0, 29.0, 31.0, 11.0, 18.0, 13.0, 12.0, 8.0, 13.0, 9.0, 6.0, 11.0, 4.0, 5.0, 0.0, 6.0, 2.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13410091400146484, -0.1303844451904297, -0.12666797637939453, -0.12295150756835938, -0.11923503875732422, -0.11551856994628906, -0.1118021011352539, -0.10808563232421875, -0.1043691635131836, -0.10065269470214844, -0.09693622589111328, -0.09321975708007812, -0.08950328826904297, -0.08578681945800781, -0.08207035064697266, -0.0783538818359375, -0.07463741302490234, -0.07092094421386719, -0.06720447540283203, -0.06348800659179688, -0.05977153778076172, -0.05605506896972656, -0.052338600158691406, -0.04862213134765625, -0.044905662536621094, -0.04118919372558594, -0.03747272491455078, -0.033756256103515625, -0.03003978729248047, -0.026323318481445312, -0.022606849670410156, -0.018890380859375, -0.015173912048339844, -0.011457443237304688, -0.007740974426269531, -0.004024505615234375, -0.00030803680419921875, 0.0034084320068359375, 0.007124900817871094, 0.01084136962890625, 0.014557838439941406, 0.018274307250976562, 0.02199077606201172, 0.025707244873046875, 0.02942371368408203, 0.03314018249511719, 0.036856651306152344, 0.0405731201171875, 0.044289588928222656, 0.04800605773925781, 0.05172252655029297, 0.055438995361328125, 0.05915546417236328, 0.06287193298339844, 0.0665884017944336, 0.07030487060546875, 0.0740213394165039, 0.07773780822753906, 0.08145427703857422, 0.08517074584960938, 0.08888721466064453, 0.09260368347167969, 0.09632015228271484, 0.10003662109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 6.0, 11.0, 19.0, 20.0, 29.0, 42.0, 51.0, 87.0, 124.0, 216.0, 332.0, 676.0, 1433.0, 3312.0, 7643.0, 19223.0, 49847.0, 137064.0, 328339.0, 304614.0, 121281.0, 44446.0, 17233.0, 6889.0, 2901.0, 1238.0, 628.0, 306.0, 179.0, 127.0, 66.0, 59.0, 43.0, 22.0, 7.0, 18.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.34468841552734375, -0.3331756591796875, -0.32166290283203125, -0.310150146484375, -0.29863739013671875, -0.2871246337890625, -0.27561187744140625, -0.26409912109375, -0.25258636474609375, -0.2410736083984375, -0.22956085205078125, -0.218048095703125, -0.20653533935546875, -0.1950225830078125, -0.18350982666015625, -0.1719970703125, -0.16048431396484375, -0.1489715576171875, -0.13745880126953125, -0.125946044921875, -0.11443328857421875, -0.1029205322265625, -0.09140777587890625, -0.07989501953125, -0.06838226318359375, -0.0568695068359375, -0.04535675048828125, -0.033843994140625, -0.02233123779296875, -0.0108184814453125, 0.00069427490234375, 0.01220703125, 0.02371978759765625, 0.0352325439453125, 0.04674530029296875, 0.058258056640625, 0.06977081298828125, 0.0812835693359375, 0.09279632568359375, 0.10430908203125, 0.11582183837890625, 0.1273345947265625, 0.13884735107421875, 0.150360107421875, 0.16187286376953125, 0.1733856201171875, 0.18489837646484375, 0.1964111328125, 0.20792388916015625, 0.2194366455078125, 0.23094940185546875, 0.242462158203125, 0.25397491455078125, 0.2654876708984375, 0.27700042724609375, 0.28851318359375, 0.30002593994140625, 0.3115386962890625, 0.32305145263671875, 0.334564208984375, 0.34607696533203125, 0.3575897216796875, 0.36910247802734375, 0.380615234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 16.0, 13.0, 17.0, 29.0, 33.0, 26.0, 32.0, 45.0, 58.0, 46.0, 48.0, 48.0, 50.0, 56.0, 50.0, 53.0, 54.0, 50.0, 47.0, 44.0, 36.0, 25.0, 19.0, 24.0, 18.0, 15.0, 9.0, 10.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.42333984375, -0.4097023010253906, -0.39606475830078125, -0.3824272155761719, -0.3687896728515625, -0.3551521301269531, -0.34151458740234375, -0.3278770446777344, -0.314239501953125, -0.3006019592285156, -0.28696441650390625, -0.2733268737792969, -0.2596893310546875, -0.24605178833007812, -0.23241424560546875, -0.21877670288085938, -0.20513916015625, -0.19150161743164062, -0.17786407470703125, -0.16422653198242188, -0.1505889892578125, -0.13695144653320312, -0.12331390380859375, -0.10967636108398438, -0.096038818359375, -0.08240127563476562, -0.06876373291015625, -0.055126190185546875, -0.0414886474609375, -0.027851104736328125, -0.01421356201171875, -0.000576019287109375, 0.0130615234375, 0.026699066162109375, 0.04033660888671875, 0.053974151611328125, 0.0676116943359375, 0.08124923706054688, 0.09488677978515625, 0.10852432250976562, 0.122161865234375, 0.13579940795898438, 0.14943695068359375, 0.16307449340820312, 0.1767120361328125, 0.19034957885742188, 0.20398712158203125, 0.21762466430664062, 0.23126220703125, 0.24489974975585938, 0.25853729248046875, 0.2721748352050781, 0.2858123779296875, 0.2994499206542969, 0.31308746337890625, 0.3267250061035156, 0.340362548828125, 0.3540000915527344, 0.36763763427734375, 0.3812751770019531, 0.3949127197265625, 0.4085502624511719, 0.42218780517578125, 0.4358253479003906, 0.449462890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 13.0, 14.0, 20.0, 35.0, 36.0, 57.0, 84.0, 121.0, 203.0, 281.0, 412.0, 591.0, 898.0, 1394.0, 2109.0, 3222.0, 5058.0, 8361.0, 13888.0, 23944.0, 43136.0, 84008.0, 165840.0, 248412.0, 206098.0, 110240.0, 55602.0, 29592.0, 17096.0, 10114.0, 6383.0, 3904.0, 2516.0, 1609.0, 1091.0, 727.0, 473.0, 320.0, 219.0, 156.0, 79.0, 61.0, 49.0, 36.0, 13.0, 17.0, 7.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09161376953125, -0.08852863311767578, -0.08544349670410156, -0.08235836029052734, -0.07927322387695312, -0.0761880874633789, -0.07310295104980469, -0.07001781463623047, -0.06693267822265625, -0.06384754180908203, -0.06076240539550781, -0.057677268981933594, -0.054592132568359375, -0.051506996154785156, -0.04842185974121094, -0.04533672332763672, -0.0422515869140625, -0.03916645050048828, -0.03608131408691406, -0.032996177673339844, -0.029911041259765625, -0.026825904846191406, -0.023740768432617188, -0.02065563201904297, -0.01757049560546875, -0.014485359191894531, -0.011400222778320312, -0.008315086364746094, -0.005229949951171875, -0.0021448135375976562, 0.0009403228759765625, 0.004025459289550781, 0.007110595703125, 0.010195732116699219, 0.013280868530273438, 0.016366004943847656, 0.019451141357421875, 0.022536277770996094, 0.025621414184570312, 0.02870655059814453, 0.03179168701171875, 0.03487682342529297, 0.03796195983886719, 0.041047096252441406, 0.044132232666015625, 0.047217369079589844, 0.05030250549316406, 0.05338764190673828, 0.0564727783203125, 0.05955791473388672, 0.06264305114746094, 0.06572818756103516, 0.06881332397460938, 0.0718984603881836, 0.07498359680175781, 0.07806873321533203, 0.08115386962890625, 0.08423900604248047, 0.08732414245605469, 0.0904092788696289, 0.09349441528320312, 0.09657955169677734, 0.09966468811035156, 0.10274982452392578, 0.1058349609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 8.0, 3.0, 4.0, 10.0, 12.0, 13.0, 21.0, 21.0, 26.0, 30.0, 45.0, 72.0, 94.0, 92.0, 116.0, 93.0, 82.0, 59.0, 44.0, 26.0, 20.0, 21.0, 14.0, 19.0, 7.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.266334533691406e-05, -3.161188215017319e-05, -3.056041896343231e-05, -2.9508955776691437e-05, -2.845749258995056e-05, -2.7406029403209686e-05, -2.635456621646881e-05, -2.5303103029727936e-05, -2.425163984298706e-05, -2.3200176656246185e-05, -2.214871346950531e-05, -2.1097250282764435e-05, -2.004578709602356e-05, -1.8994323909282684e-05, -1.794286072254181e-05, -1.6891397535800934e-05, -1.583993434906006e-05, -1.4788471162319183e-05, -1.3737007975578308e-05, -1.2685544788837433e-05, -1.1634081602096558e-05, -1.0582618415355682e-05, -9.531155228614807e-06, -8.479692041873932e-06, -7.428228855133057e-06, -6.376765668392181e-06, -5.325302481651306e-06, -4.273839294910431e-06, -3.2223761081695557e-06, -2.1709129214286804e-06, -1.1194497346878052e-06, -6.798654794692993e-08, 9.834766387939453e-07, 2.0349398255348206e-06, 3.086403012275696e-06, 4.137866199016571e-06, 5.189329385757446e-06, 6.2407925724983215e-06, 7.292255759239197e-06, 8.343718945980072e-06, 9.395182132720947e-06, 1.0446645319461823e-05, 1.1498108506202698e-05, 1.2549571692943573e-05, 1.3601034879684448e-05, 1.4652498066425323e-05, 1.57039612531662e-05, 1.6755424439907074e-05, 1.780688762664795e-05, 1.8858350813388824e-05, 1.99098140001297e-05, 2.0961277186870575e-05, 2.201274037361145e-05, 2.3064203560352325e-05, 2.41156667470932e-05, 2.5167129933834076e-05, 2.621859312057495e-05, 2.7270056307315826e-05, 2.83215194940567e-05, 2.9372982680797577e-05, 3.0424445867538452e-05, 3.147590905427933e-05, 3.25273722410202e-05, 3.357883542776108e-05, 3.463029861450195e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 14.0, 6.0, 13.0, 18.0, 31.0, 52.0, 97.0, 136.0, 327.0, 624.0, 1386.0, 3218.0, 7961.0, 21456.0, 66396.0, 230578.0, 436293.0, 192961.0, 56193.0, 18620.0, 6877.0, 2816.0, 1258.0, 577.0, 282.0, 137.0, 92.0, 50.0, 32.0, 20.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14384841918945312, -0.13840484619140625, -0.13296127319335938, -0.1275177001953125, -0.12207412719726562, -0.11663055419921875, -0.11118698120117188, -0.105743408203125, -0.10029983520507812, -0.09485626220703125, -0.08941268920898438, -0.0839691162109375, -0.07852554321289062, -0.07308197021484375, -0.06763839721679688, -0.06219482421875, -0.056751251220703125, -0.05130767822265625, -0.045864105224609375, -0.0404205322265625, -0.034976959228515625, -0.02953338623046875, -0.024089813232421875, -0.018646240234375, -0.013202667236328125, -0.00775909423828125, -0.002315521240234375, 0.0031280517578125, 0.008571624755859375, 0.01401519775390625, 0.019458770751953125, 0.02490234375, 0.030345916748046875, 0.03578948974609375, 0.041233062744140625, 0.0466766357421875, 0.052120208740234375, 0.05756378173828125, 0.06300735473632812, 0.068450927734375, 0.07389450073242188, 0.07933807373046875, 0.08478164672851562, 0.0902252197265625, 0.09566879272460938, 0.10111236572265625, 0.10655593872070312, 0.11199951171875, 0.11744308471679688, 0.12288665771484375, 0.12833023071289062, 0.1337738037109375, 0.13921737670898438, 0.14466094970703125, 0.15010452270507812, 0.155548095703125, 0.16099166870117188, 0.16643524169921875, 0.17187881469726562, 0.1773223876953125, 0.18276596069335938, 0.18820953369140625, 0.19365310668945312, 0.1990966796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 2.0, 4.0, 7.0, 9.0, 20.0, 26.0, 31.0, 36.0, 56.0, 72.0, 72.0, 92.0, 84.0, 97.0, 82.0, 62.0, 54.0, 46.0, 40.0, 24.0, 20.0, 15.0, 10.0, 6.0, 6.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15264415740966797, -0.14830589294433594, -0.1439676284790039, -0.13962936401367188, -0.13529109954833984, -0.1309528350830078, -0.12661457061767578, -0.12227630615234375, -0.11793804168701172, -0.11359977722167969, -0.10926151275634766, -0.10492324829101562, -0.1005849838256836, -0.09624671936035156, -0.09190845489501953, -0.0875701904296875, -0.08323192596435547, -0.07889366149902344, -0.0745553970336914, -0.07021713256835938, -0.06587886810302734, -0.06154060363769531, -0.05720233917236328, -0.05286407470703125, -0.04852581024169922, -0.04418754577636719, -0.039849281311035156, -0.035511016845703125, -0.031172752380371094, -0.026834487915039062, -0.02249622344970703, -0.018157958984375, -0.013819694519042969, -0.009481430053710938, -0.005143165588378906, -0.000804901123046875, 0.0035333633422851562, 0.007871627807617188, 0.012209892272949219, 0.01654815673828125, 0.02088642120361328, 0.025224685668945312, 0.029562950134277344, 0.033901214599609375, 0.038239479064941406, 0.04257774353027344, 0.04691600799560547, 0.0512542724609375, 0.05559253692626953, 0.05993080139160156, 0.0642690658569336, 0.06860733032226562, 0.07294559478759766, 0.07728385925292969, 0.08162212371826172, 0.08596038818359375, 0.09029865264892578, 0.09463691711425781, 0.09897518157958984, 0.10331344604492188, 0.1076517105102539, 0.11198997497558594, 0.11632823944091797, 0.12066650390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 6.0, 13.0, 17.0, 15.0, 24.0, 27.0, 24.0, 48.0, 44.0, 53.0, 61.0, 69.0, 73.0, 71.0, 69.0, 63.0, 51.0, 51.0, 32.0, 40.0, 31.0, 30.0, 14.0, 20.0, 12.0, 11.0, 11.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8308272957801819, -0.8008356690406799, -0.770844042301178, -0.740852415561676, -0.7108608484268188, -0.6808692216873169, -0.6508775949478149, -0.620885968208313, -0.590894341468811, -0.5609027147293091, -0.5309110879898071, -0.5009194612503052, -0.4709278643131256, -0.44093623757362366, -0.4109446406364441, -0.38095301389694214, -0.3509613871574402, -0.32096976041793823, -0.2909781336784363, -0.2609865367412567, -0.23099491000175476, -0.2010032832622528, -0.17101167142391205, -0.1410200595855713, -0.11102843284606934, -0.08103681355714798, -0.051045194268226624, -0.021053574979305267, 0.008938044309616089, 0.03892967104911804, 0.0689212828874588, 0.09891289472579956, 0.1289045810699463, 0.15889620780944824, 0.188887819647789, 0.21887943148612976, 0.2488710582256317, 0.27886268496513367, 0.30885428190231323, 0.3388459086418152, 0.36883753538131714, 0.3988291621208191, 0.42882078886032104, 0.4588123857975006, 0.48880401253700256, 0.5187956094741821, 0.5487872362136841, 0.578778862953186, 0.608770489692688, 0.6387621164321899, 0.6687537431716919, 0.6987453699111938, 0.7287369966506958, 0.7587286233901978, 0.7887201905250549, 0.8187118172645569, 0.8487034440040588, 0.8786950707435608, 0.9086866974830627, 0.9386783242225647, 0.9686698913574219, 0.9986615180969238, 1.0286531448364258, 1.0586447715759277, 1.0886363983154297]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 7.0, 8.0, 13.0, 15.0, 11.0, 14.0, 21.0, 21.0, 30.0, 31.0, 35.0, 30.0, 42.0, 29.0, 30.0, 35.0, 40.0, 41.0, 49.0, 38.0, 50.0, 38.0, 34.0, 30.0, 28.0, 28.0, 31.0, 28.0, 23.0, 23.0, 24.0, 16.0, 17.0, 12.0, 12.0, 14.0, 6.0, 5.0, 7.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8224474191665649, -0.7953444719314575, -0.7682415246963501, -0.7411385774612427, -0.7140356302261353, -0.6869326829910278, -0.6598297953605652, -0.6327268481254578, -0.6056239008903503, -0.5785209536552429, -0.5514180064201355, -0.5243150591850281, -0.49721214175224304, -0.4701091945171356, -0.4430062770843506, -0.41590332984924316, -0.38880038261413574, -0.3616974353790283, -0.3345944881439209, -0.30749157071113586, -0.28038862347602844, -0.253285676240921, -0.2261827439069748, -0.19907981157302856, -0.17197686433792114, -0.14487391710281372, -0.11777098476886749, -0.09066804498434067, -0.06356510519981384, -0.03646215796470642, -0.009359225630760193, 0.017743706703186035, 0.04484671354293823, 0.07194965332746506, 0.09905259311199188, 0.1261555254459381, 0.15325847268104553, 0.18036141991615295, 0.20746435225009918, 0.2345672845840454, 0.26167023181915283, 0.28877317905426025, 0.3158761262893677, 0.3429790437221527, 0.37008199095726013, 0.39718493819236755, 0.4242878556251526, 0.45139080286026, 0.47849375009536743, 0.5055966973304749, 0.5326996445655823, 0.5598025918006897, 0.5869054794311523, 0.6140084266662598, 0.6411113739013672, 0.6682143211364746, 0.695317268371582, 0.7224202156066895, 0.7495231628417969, 0.7766261100769043, 0.8037290573120117, 0.8308320045471191, 0.8579348921775818, 0.8850378394126892, 0.9121407866477966]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 12.0, 5.0, 11.0, 18.0, 19.0, 30.0, 53.0, 71.0, 122.0, 199.0, 337.0, 821.0, 2073.0, 6638.0, 25211.0, 128680.0, 1186571.0, 2535768.0, 251543.0, 41604.0, 9815.0, 2810.0, 1014.0, 345.0, 196.0, 103.0, 74.0, 40.0, 29.0, 20.0, 22.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.48291015625, -0.4711799621582031, -0.45944976806640625, -0.4477195739746094, -0.4359893798828125, -0.4242591857910156, -0.41252899169921875, -0.4007987976074219, -0.389068603515625, -0.3773384094238281, -0.36560821533203125, -0.3538780212402344, -0.3421478271484375, -0.3304176330566406, -0.31868743896484375, -0.3069572448730469, -0.29522705078125, -0.2834968566894531, -0.27176666259765625, -0.2600364685058594, -0.2483062744140625, -0.23657608032226562, -0.22484588623046875, -0.21311569213867188, -0.201385498046875, -0.18965530395507812, -0.17792510986328125, -0.16619491577148438, -0.1544647216796875, -0.14273452758789062, -0.13100433349609375, -0.11927413940429688, -0.1075439453125, -0.09581375122070312, -0.08408355712890625, -0.07235336303710938, -0.0606231689453125, -0.048892974853515625, -0.03716278076171875, -0.025432586669921875, -0.013702392578125, -0.001972198486328125, 0.00975799560546875, 0.021488189697265625, 0.0332183837890625, 0.044948577880859375, 0.05667877197265625, 0.06840896606445312, 0.08013916015625, 0.09186935424804688, 0.10359954833984375, 0.11532974243164062, 0.1270599365234375, 0.13879013061523438, 0.15052032470703125, 0.16225051879882812, 0.173980712890625, 0.18571090698242188, 0.19744110107421875, 0.20917129516601562, 0.2209014892578125, 0.23263168334960938, 0.24436187744140625, 0.2560920715332031, 0.267822265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 1.0, 7.0, 3.0, 4.0, 8.0, 10.0, 8.0, 12.0, 13.0, 13.0, 17.0, 10.0, 20.0, 20.0, 30.0, 28.0, 24.0, 36.0, 33.0, 36.0, 40.0, 51.0, 50.0, 43.0, 46.0, 45.0, 28.0, 36.0, 36.0, 33.0, 27.0, 39.0, 18.0, 33.0, 25.0, 23.0, 14.0, 9.0, 12.0, 15.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1292724609375, -0.12526702880859375, -0.1212615966796875, -0.11725616455078125, -0.113250732421875, -0.10924530029296875, -0.1052398681640625, -0.10123443603515625, -0.09722900390625, -0.09322357177734375, -0.0892181396484375, -0.08521270751953125, -0.081207275390625, -0.07720184326171875, -0.0731964111328125, -0.06919097900390625, -0.065185546875, -0.06118011474609375, -0.0571746826171875, -0.05316925048828125, -0.049163818359375, -0.04515838623046875, -0.0411529541015625, -0.03714752197265625, -0.03314208984375, -0.02913665771484375, -0.0251312255859375, -0.02112579345703125, -0.017120361328125, -0.01311492919921875, -0.0091094970703125, -0.00510406494140625, -0.0010986328125, 0.00290679931640625, 0.0069122314453125, 0.01091766357421875, 0.014923095703125, 0.01892852783203125, 0.0229339599609375, 0.02693939208984375, 0.03094482421875, 0.03495025634765625, 0.0389556884765625, 0.04296112060546875, 0.046966552734375, 0.05097198486328125, 0.0549774169921875, 0.05898284912109375, 0.06298828125, 0.06699371337890625, 0.0709991455078125, 0.07500457763671875, 0.079010009765625, 0.08301544189453125, 0.0870208740234375, 0.09102630615234375, 0.09503173828125, 0.09903717041015625, 0.1030426025390625, 0.10704803466796875, 0.111053466796875, 0.11505889892578125, 0.1190643310546875, 0.12306976318359375, 0.1270751953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 12.0, 21.0, 18.0, 41.0, 49.0, 62.0, 104.0, 166.0, 215.0, 425.0, 784.0, 1569.0, 3431.0, 8146.0, 22223.0, 71210.0, 257656.0, 1083535.0, 2012095.0, 532972.0, 136185.0, 39783.0, 13461.0, 5250.0, 2302.0, 1069.0, 561.0, 340.0, 219.0, 122.0, 75.0, 49.0, 36.0, 16.0, 15.0, 25.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.331787109375, -0.3218116760253906, -0.31183624267578125, -0.3018608093261719, -0.2918853759765625, -0.2819099426269531, -0.27193450927734375, -0.2619590759277344, -0.251983642578125, -0.24200820922851562, -0.23203277587890625, -0.22205734252929688, -0.2120819091796875, -0.20210647583007812, -0.19213104248046875, -0.18215560913085938, -0.17218017578125, -0.16220474243164062, -0.15222930908203125, -0.14225387573242188, -0.1322784423828125, -0.12230300903320312, -0.11232757568359375, -0.10235214233398438, -0.092376708984375, -0.08240127563476562, -0.07242584228515625, -0.062450408935546875, -0.0524749755859375, -0.042499542236328125, -0.03252410888671875, -0.022548675537109375, -0.0125732421875, -0.002597808837890625, 0.00737762451171875, 0.017353057861328125, 0.0273284912109375, 0.037303924560546875, 0.04727935791015625, 0.057254791259765625, 0.067230224609375, 0.07720565795898438, 0.08718109130859375, 0.09715652465820312, 0.1071319580078125, 0.11710739135742188, 0.12708282470703125, 0.13705825805664062, 0.14703369140625, 0.15700912475585938, 0.16698455810546875, 0.17695999145507812, 0.1869354248046875, 0.19691085815429688, 0.20688629150390625, 0.21686172485351562, 0.226837158203125, 0.23681259155273438, 0.24678802490234375, 0.2567634582519531, 0.2667388916015625, 0.2767143249511719, 0.28668975830078125, 0.2966651916503906, 0.306640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 9.0, 7.0, 14.0, 12.0, 14.0, 15.0, 44.0, 57.0, 68.0, 112.0, 130.0, 200.0, 281.0, 422.0, 605.0, 654.0, 435.0, 323.0, 230.0, 142.0, 97.0, 62.0, 42.0, 27.0, 24.0, 13.0, 11.0, 7.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2902984619140625, -0.281524658203125, -0.2727508544921875, -0.26397705078125, -0.2552032470703125, -0.246429443359375, -0.2376556396484375, -0.2288818359375, -0.2201080322265625, -0.211334228515625, -0.2025604248046875, -0.19378662109375, -0.1850128173828125, -0.176239013671875, -0.1674652099609375, -0.15869140625, -0.1499176025390625, -0.141143798828125, -0.1323699951171875, -0.12359619140625, -0.1148223876953125, -0.106048583984375, -0.0972747802734375, -0.0885009765625, -0.0797271728515625, -0.070953369140625, -0.0621795654296875, -0.05340576171875, -0.0446319580078125, -0.035858154296875, -0.0270843505859375, -0.018310546875, -0.0095367431640625, -0.000762939453125, 0.0080108642578125, 0.01678466796875, 0.0255584716796875, 0.034332275390625, 0.0431060791015625, 0.0518798828125, 0.0606536865234375, 0.069427490234375, 0.0782012939453125, 0.08697509765625, 0.0957489013671875, 0.104522705078125, 0.1132965087890625, 0.1220703125, 0.1308441162109375, 0.139617919921875, 0.1483917236328125, 0.15716552734375, 0.1659393310546875, 0.174713134765625, 0.1834869384765625, 0.1922607421875, 0.2010345458984375, 0.209808349609375, 0.2185821533203125, 0.22735595703125, 0.2361297607421875, 0.244903564453125, 0.2536773681640625, 0.262451171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 6.0, 17.0, 22.0, 22.0, 28.0, 42.0, 57.0, 57.0, 66.0, 69.0, 85.0, 80.0, 76.0, 59.0, 74.0, 46.0, 45.0, 34.0, 37.0, 29.0, 12.0, 13.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3001172542572021, -1.2667630910873413, -1.2334089279174805, -1.2000547647476196, -1.1667006015777588, -1.133346438407898, -1.099992275238037, -1.0666382312774658, -1.0332839488983154, -0.9999297857284546, -0.9665756225585938, -0.9332214593887329, -0.8998672962188721, -0.8665131330490112, -0.8331590294837952, -0.7998048663139343, -0.7664507627487183, -0.7330965995788574, -0.6997424364089966, -0.6663882732391357, -0.6330341100692749, -0.5996799468994141, -0.566325843334198, -0.5329716801643372, -0.4996175169944763, -0.4662633538246155, -0.43290919065475464, -0.3995550572872162, -0.36620089411735535, -0.3328467309474945, -0.29949259757995605, -0.2661384344100952, -0.2327842116355896, -0.19943004846572876, -0.1660759001970291, -0.13272175192832947, -0.09936758875846863, -0.06601342558860779, -0.03265927731990814, 0.0006948709487915039, 0.034049034118652344, 0.06740318983793259, 0.10075734555721283, 0.13411149382591248, 0.16746565699577332, 0.20081982016563416, 0.2341739684343338, 0.26752811670303345, 0.3008822798728943, 0.3342364430427551, 0.36759060621261597, 0.4009447395801544, 0.43429890275001526, 0.4676530659198761, 0.5010071992874146, 0.5343613624572754, 0.5677155256271362, 0.6010696887969971, 0.6344238519668579, 0.6677780151367188, 0.7011321783065796, 0.7344863414764404, 0.7678404450416565, 0.8011946082115173, 0.8345487713813782]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 2.0, 8.0, 5.0, 7.0, 5.0, 12.0, 12.0, 5.0, 25.0, 17.0, 18.0, 29.0, 33.0, 27.0, 28.0, 28.0, 28.0, 31.0, 47.0, 36.0, 30.0, 39.0, 37.0, 38.0, 41.0, 36.0, 41.0, 28.0, 44.0, 21.0, 28.0, 28.0, 29.0, 18.0, 14.0, 15.0, 19.0, 22.0, 11.0, 10.0, 11.0, 6.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5925029516220093, -0.5726257562637329, -0.5527485609054565, -0.5328713655471802, -0.512994110584259, -0.49311691522598267, -0.4732397198677063, -0.45336252450942993, -0.43348532915115356, -0.4136081337928772, -0.39373090863227844, -0.3738537132740021, -0.3539765179157257, -0.33409929275512695, -0.3142220973968506, -0.2943449020385742, -0.27446767687797546, -0.2545904815196991, -0.23471327126026154, -0.21483606100082397, -0.1949588656425476, -0.17508165538311005, -0.15520444512367249, -0.13532724976539612, -0.11545003950595856, -0.09557283669710159, -0.07569563388824463, -0.05581842362880707, -0.035941220819950104, -0.01606401801109314, 0.0038131922483444214, 0.02369038760662079, 0.04356759786605835, 0.06344480067491531, 0.08332200348377228, 0.10319921374320984, 0.1230764165520668, 0.14295361936092377, 0.16283082962036133, 0.1827080249786377, 0.20258523523807526, 0.22246244549751282, 0.24233964085578918, 0.26221686601638794, 0.2820940613746643, 0.3019712567329407, 0.32184845209121704, 0.3417256474494934, 0.36160287261009216, 0.38148006796836853, 0.4013572931289673, 0.42123448848724365, 0.44111168384552, 0.4609888792037964, 0.48086610436439514, 0.5007432699203491, 0.5206205248832703, 0.5404977202415466, 0.560374915599823, 0.5802521705627441, 0.6001293659210205, 0.6200065612792969, 0.6398837566375732, 0.6597609519958496, 0.679638147354126]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 7.0, 14.0, 25.0, 42.0, 69.0, 120.0, 169.0, 299.0, 491.0, 827.0, 1430.0, 2322.0, 3779.0, 5709.0, 9240.0, 14391.0, 22810.0, 37097.0, 63884.0, 120000.0, 219574.0, 234024.0, 133905.0, 70849.0, 40334.0, 24764.0, 15692.0, 9821.0, 6432.0, 3995.0, 2488.0, 1559.0, 975.0, 564.0, 343.0, 184.0, 106.0, 77.0, 43.0, 34.0, 17.0, 12.0, 13.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.209716796875, -0.20318031311035156, -0.19664382934570312, -0.1901073455810547, -0.18357086181640625, -0.1770343780517578, -0.17049789428710938, -0.16396141052246094, -0.1574249267578125, -0.15088844299316406, -0.14435195922851562, -0.1378154754638672, -0.13127899169921875, -0.12474250793457031, -0.11820602416992188, -0.11166954040527344, -0.105133056640625, -0.09859657287597656, -0.09206008911132812, -0.08552360534667969, -0.07898712158203125, -0.07245063781738281, -0.06591415405273438, -0.05937767028808594, -0.0528411865234375, -0.04630470275878906, -0.039768218994140625, -0.03323173522949219, -0.02669525146484375, -0.020158767700195312, -0.013622283935546875, -0.0070858001708984375, -0.00054931640625, 0.0059871673583984375, 0.012523651123046875, 0.019060134887695312, 0.02559661865234375, 0.03213310241699219, 0.038669586181640625, 0.04520606994628906, 0.0517425537109375, 0.05827903747558594, 0.06481552124023438, 0.07135200500488281, 0.07788848876953125, 0.08442497253417969, 0.09096145629882812, 0.09749794006347656, 0.104034423828125, 0.11057090759277344, 0.11710739135742188, 0.12364387512207031, 0.13018035888671875, 0.1367168426513672, 0.14325332641601562, 0.14978981018066406, 0.1563262939453125, 0.16286277770996094, 0.16939926147460938, 0.1759357452392578, 0.18247222900390625, 0.1890087127685547, 0.19554519653320312, 0.20208168029785156, 0.2086181640625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 8.0, 5.0, 11.0, 8.0, 13.0, 13.0, 15.0, 18.0, 15.0, 32.0, 17.0, 25.0, 23.0, 29.0, 36.0, 29.0, 43.0, 43.0, 37.0, 46.0, 48.0, 53.0, 38.0, 31.0, 49.0, 27.0, 41.0, 26.0, 30.0, 28.0, 33.0, 24.0, 14.0, 12.0, 12.0, 18.0, 8.0, 13.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14483261108398438, -0.14049530029296875, -0.13615798950195312, -0.1318206787109375, -0.12748336791992188, -0.12314605712890625, -0.11880874633789062, -0.114471435546875, -0.11013412475585938, -0.10579681396484375, -0.10145950317382812, -0.0971221923828125, -0.09278488159179688, -0.08844757080078125, -0.08411026000976562, -0.07977294921875, -0.07543563842773438, -0.07109832763671875, -0.06676101684570312, -0.0624237060546875, -0.058086395263671875, -0.05374908447265625, -0.049411773681640625, -0.045074462890625, -0.040737152099609375, -0.03639984130859375, -0.032062530517578125, -0.0277252197265625, -0.023387908935546875, -0.01905059814453125, -0.014713287353515625, -0.0103759765625, -0.006038665771484375, -0.00170135498046875, 0.002635955810546875, 0.0069732666015625, 0.011310577392578125, 0.01564788818359375, 0.019985198974609375, 0.024322509765625, 0.028659820556640625, 0.03299713134765625, 0.037334442138671875, 0.0416717529296875, 0.046009063720703125, 0.05034637451171875, 0.054683685302734375, 0.05902099609375, 0.06335830688476562, 0.06769561767578125, 0.07203292846679688, 0.0763702392578125, 0.08070755004882812, 0.08504486083984375, 0.08938217163085938, 0.093719482421875, 0.09805679321289062, 0.10239410400390625, 0.10673141479492188, 0.1110687255859375, 0.11540603637695312, 0.11974334716796875, 0.12408065795898438, 0.12841796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 16.0, 10.0, 16.0, 20.0, 17.0, 37.0, 30.0, 44.0, 55.0, 82.0, 135.0, 172.0, 302.0, 559.0, 1146.0, 2731.0, 6849.0, 17915.0, 47704.0, 159104.0, 519493.0, 200673.0, 56664.0, 20649.0, 7998.0, 3195.0, 1377.0, 603.0, 334.0, 153.0, 115.0, 98.0, 55.0, 45.0, 33.0, 21.0, 28.0, 15.0, 13.0, 10.0, 16.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.44161224365234375, -0.4266815185546875, -0.41175079345703125, -0.396820068359375, -0.38188934326171875, -0.3669586181640625, -0.35202789306640625, -0.33709716796875, -0.32216644287109375, -0.3072357177734375, -0.29230499267578125, -0.277374267578125, -0.26244354248046875, -0.2475128173828125, -0.23258209228515625, -0.2176513671875, -0.20272064208984375, -0.1877899169921875, -0.17285919189453125, -0.157928466796875, -0.14299774169921875, -0.1280670166015625, -0.11313629150390625, -0.09820556640625, -0.08327484130859375, -0.0683441162109375, -0.05341339111328125, -0.038482666015625, -0.02355194091796875, -0.0086212158203125, 0.00630950927734375, 0.021240234375, 0.03617095947265625, 0.0511016845703125, 0.06603240966796875, 0.080963134765625, 0.09589385986328125, 0.1108245849609375, 0.12575531005859375, 0.14068603515625, 0.15561676025390625, 0.1705474853515625, 0.18547821044921875, 0.200408935546875, 0.21533966064453125, 0.2302703857421875, 0.24520111083984375, 0.2601318359375, 0.27506256103515625, 0.2899932861328125, 0.30492401123046875, 0.319854736328125, 0.33478546142578125, 0.3497161865234375, 0.36464691162109375, 0.37957763671875, 0.39450836181640625, 0.4094390869140625, 0.42436981201171875, 0.439300537109375, 0.45423126220703125, 0.4691619873046875, 0.48409271240234375, 0.4990234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 8.0, 10.0, 12.0, 20.0, 20.0, 20.0, 33.0, 41.0, 46.0, 66.0, 69.0, 67.0, 64.0, 64.0, 60.0, 73.0, 61.0, 54.0, 37.0, 34.0, 30.0, 25.0, 18.0, 16.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7274169921875, -0.707275390625, -0.6871337890625, -0.6669921875, -0.6468505859375, -0.626708984375, -0.6065673828125, -0.58642578125, -0.5662841796875, -0.546142578125, -0.5260009765625, -0.505859375, -0.4857177734375, -0.465576171875, -0.4454345703125, -0.42529296875, -0.4051513671875, -0.385009765625, -0.3648681640625, -0.3447265625, -0.3245849609375, -0.304443359375, -0.2843017578125, -0.26416015625, -0.2440185546875, -0.223876953125, -0.2037353515625, -0.18359375, -0.1634521484375, -0.143310546875, -0.1231689453125, -0.10302734375, -0.0828857421875, -0.062744140625, -0.0426025390625, -0.0224609375, -0.0023193359375, 0.017822265625, 0.0379638671875, 0.05810546875, 0.0782470703125, 0.098388671875, 0.1185302734375, 0.138671875, 0.1588134765625, 0.178955078125, 0.1990966796875, 0.21923828125, 0.2393798828125, 0.259521484375, 0.2796630859375, 0.2998046875, 0.3199462890625, 0.340087890625, 0.3602294921875, 0.38037109375, 0.4005126953125, 0.420654296875, 0.4407958984375, 0.4609375, 0.4810791015625, 0.501220703125, 0.5213623046875, 0.54150390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 13.0, 25.0, 45.0, 53.0, 75.0, 171.0, 294.0, 678.0, 1441.0, 3303.0, 7413.0, 17737.0, 50561.0, 337079.0, 524063.0, 67592.0, 21835.0, 8778.0, 3882.0, 1747.0, 827.0, 376.0, 226.0, 119.0, 62.0, 38.0, 27.0, 19.0, 14.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.33367156982421875, -0.3235931396484375, -0.31351470947265625, -0.303436279296875, -0.29335784912109375, -0.2832794189453125, -0.27320098876953125, -0.26312255859375, -0.25304412841796875, -0.2429656982421875, -0.23288726806640625, -0.222808837890625, -0.21273040771484375, -0.2026519775390625, -0.19257354736328125, -0.1824951171875, -0.17241668701171875, -0.1623382568359375, -0.15225982666015625, -0.142181396484375, -0.13210296630859375, -0.1220245361328125, -0.11194610595703125, -0.10186767578125, -0.09178924560546875, -0.0817108154296875, -0.07163238525390625, -0.061553955078125, -0.05147552490234375, -0.0413970947265625, -0.03131866455078125, -0.021240234375, -0.01116180419921875, -0.0010833740234375, 0.00899505615234375, 0.019073486328125, 0.02915191650390625, 0.0392303466796875, 0.04930877685546875, 0.05938720703125, 0.06946563720703125, 0.0795440673828125, 0.08962249755859375, 0.099700927734375, 0.10977935791015625, 0.1198577880859375, 0.12993621826171875, 0.1400146484375, 0.15009307861328125, 0.1601715087890625, 0.17024993896484375, 0.180328369140625, 0.19040679931640625, 0.2004852294921875, 0.21056365966796875, 0.22064208984375, 0.23072052001953125, 0.2407989501953125, 0.25087738037109375, 0.260955810546875, 0.27103424072265625, 0.2811126708984375, 0.29119110107421875, 0.30126953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 1.0, 7.0, 4.0, 3.0, 6.0, 7.0, 10.0, 11.0, 12.0, 13.0, 22.0, 35.0, 52.0, 79.0, 101.0, 137.0, 125.0, 109.0, 71.0, 44.0, 35.0, 22.0, 13.0, 16.0, 2.0, 9.0, 8.0, 9.0, 8.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.464387893676758e-05, -4.336237907409668e-05, -4.208087921142578e-05, -4.079937934875488e-05, -3.9517879486083984e-05, -3.8236379623413086e-05, -3.695487976074219e-05, -3.567337989807129e-05, -3.439188003540039e-05, -3.311038017272949e-05, -3.1828880310058594e-05, -3.0547380447387695e-05, -2.9265880584716797e-05, -2.79843807220459e-05, -2.6702880859375e-05, -2.54213809967041e-05, -2.4139881134033203e-05, -2.2858381271362305e-05, -2.1576881408691406e-05, -2.0295381546020508e-05, -1.901388168334961e-05, -1.773238182067871e-05, -1.6450881958007812e-05, -1.5169382095336914e-05, -1.3887882232666016e-05, -1.2606382369995117e-05, -1.1324882507324219e-05, -1.004338264465332e-05, -8.761882781982422e-06, -7.4803829193115234e-06, -6.198883056640625e-06, -4.9173831939697266e-06, -3.635883331298828e-06, -2.3543834686279297e-06, -1.0728836059570312e-06, 2.086162567138672e-07, 1.4901161193847656e-06, 2.771615982055664e-06, 4.0531158447265625e-06, 5.334615707397461e-06, 6.616115570068359e-06, 7.897615432739258e-06, 9.179115295410156e-06, 1.0460615158081055e-05, 1.1742115020751953e-05, 1.3023614883422852e-05, 1.430511474609375e-05, 1.558661460876465e-05, 1.6868114471435547e-05, 1.8149614334106445e-05, 1.9431114196777344e-05, 2.0712614059448242e-05, 2.199411392211914e-05, 2.327561378479004e-05, 2.4557113647460938e-05, 2.5838613510131836e-05, 2.7120113372802734e-05, 2.8401613235473633e-05, 2.968311309814453e-05, 3.096461296081543e-05, 3.224611282348633e-05, 3.3527612686157227e-05, 3.4809112548828125e-05, 3.6090612411499023e-05, 3.737211227416992e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 7.0, 11.0, 15.0, 9.0, 21.0, 28.0, 38.0, 61.0, 91.0, 158.0, 323.0, 620.0, 1568.0, 3919.0, 10656.0, 30482.0, 119600.0, 618824.0, 198519.0, 40988.0, 13920.0, 4979.0, 1985.0, 843.0, 363.0, 167.0, 127.0, 78.0, 50.0, 37.0, 16.0, 11.0, 12.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.259521484375, -0.250762939453125, -0.24200439453125, -0.233245849609375, -0.2244873046875, -0.215728759765625, -0.20697021484375, -0.198211669921875, -0.189453125, -0.180694580078125, -0.17193603515625, -0.163177490234375, -0.1544189453125, -0.145660400390625, -0.13690185546875, -0.128143310546875, -0.119384765625, -0.110626220703125, -0.10186767578125, -0.093109130859375, -0.0843505859375, -0.075592041015625, -0.06683349609375, -0.058074951171875, -0.04931640625, -0.040557861328125, -0.03179931640625, -0.023040771484375, -0.0142822265625, -0.005523681640625, 0.00323486328125, 0.011993408203125, 0.020751953125, 0.029510498046875, 0.03826904296875, 0.047027587890625, 0.0557861328125, 0.064544677734375, 0.07330322265625, 0.082061767578125, 0.0908203125, 0.099578857421875, 0.10833740234375, 0.117095947265625, 0.1258544921875, 0.134613037109375, 0.14337158203125, 0.152130126953125, 0.160888671875, 0.169647216796875, 0.17840576171875, 0.187164306640625, 0.1959228515625, 0.204681396484375, 0.21343994140625, 0.222198486328125, 0.23095703125, 0.239715576171875, 0.24847412109375, 0.257232666015625, 0.2659912109375, 0.274749755859375, 0.28350830078125, 0.292266845703125, 0.301025390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 19.0, 41.0, 53.0, 82.0, 138.0, 168.0, 126.0, 105.0, 50.0, 39.0, 33.0, 19.0, 15.0, 9.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1971435546875, -0.18942832946777344, -0.18171310424804688, -0.1739978790283203, -0.16628265380859375, -0.1585674285888672, -0.15085220336914062, -0.14313697814941406, -0.1354217529296875, -0.12770652770996094, -0.11999130249023438, -0.11227607727050781, -0.10456085205078125, -0.09684562683105469, -0.08913040161132812, -0.08141517639160156, -0.073699951171875, -0.06598472595214844, -0.058269500732421875, -0.05055427551269531, -0.04283905029296875, -0.03512382507324219, -0.027408599853515625, -0.019693374633789062, -0.0119781494140625, -0.0042629241943359375, 0.003452301025390625, 0.011167526245117188, 0.01888275146484375, 0.026597976684570312, 0.034313201904296875, 0.04202842712402344, 0.04974365234375, 0.05745887756347656, 0.06517410278320312, 0.07288932800292969, 0.08060455322265625, 0.08831977844238281, 0.09603500366210938, 0.10375022888183594, 0.1114654541015625, 0.11918067932128906, 0.12689590454101562, 0.1346111297607422, 0.14232635498046875, 0.1500415802001953, 0.15775680541992188, 0.16547203063964844, 0.173187255859375, 0.18090248107910156, 0.18861770629882812, 0.1963329315185547, 0.20404815673828125, 0.2117633819580078, 0.21947860717773438, 0.22719383239746094, 0.2349090576171875, 0.24262428283691406, 0.2503395080566406, 0.2580547332763672, 0.26576995849609375, 0.2734851837158203, 0.2812004089355469, 0.28891563415527344, 0.296630859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 7.0, 15.0, 35.0, 37.0, 62.0, 81.0, 95.0, 95.0, 108.0, 97.0, 124.0, 77.0, 53.0, 45.0, 25.0, 13.0, 13.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.670444369316101, -1.6092681884765625, -1.548092007637024, -1.4869158267974854, -1.4257397651672363, -1.3645634651184082, -1.3033874034881592, -1.2422112226486206, -1.181035041809082, -1.1198588609695435, -1.0586826801300049, -0.9975065588951111, -0.9363303780555725, -0.8751541972160339, -0.8139780759811401, -0.7528018951416016, -0.691625714302063, -0.6304495334625244, -0.5692733526229858, -0.508097231388092, -0.44692105054855347, -0.3857448697090149, -0.3245687186717987, -0.2633925676345825, -0.20221638679504395, -0.14104022085666656, -0.07986405491828918, -0.018687888979911804, 0.042488276958465576, 0.10366445779800415, 0.16484060883522034, 0.22601675987243652, 0.28719305992126465, 0.3483692407608032, 0.4095453917980194, 0.4707215428352356, 0.5318977236747742, 0.5930739045143127, 0.6542500257492065, 0.7154262065887451, 0.7766023874282837, 0.8377785682678223, 0.8989547491073608, 0.9601308703422546, 1.0213069915771484, 1.0824832916259766, 1.1436593532562256, 1.2048355340957642, 1.2660117149353027, 1.3271878957748413, 1.3883640766143799, 1.4495402574539185, 1.510716438293457, 1.571892499923706, 1.6330686807632446, 1.6942448616027832, 1.7554210424423218, 1.8165972232818604, 1.877773404121399, 1.9389495849609375, 2.0001256465911865, 2.0613019466400146, 2.1224780082702637, 2.183654308319092, 2.244830369949341]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 12.0, 8.0, 17.0, 19.0, 25.0, 24.0, 25.0, 28.0, 26.0, 43.0, 31.0, 44.0, 37.0, 32.0, 38.0, 37.0, 48.0, 46.0, 35.0, 37.0, 36.0, 42.0, 33.0, 38.0, 21.0, 16.0, 25.0, 27.0, 19.0, 11.0, 20.0, 10.0, 12.0, 14.0, 4.0, 10.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1940932273864746, -1.158704161643982, -1.1233150959014893, -1.0879260301589966, -1.052536964416504, -1.0171478986740112, -0.9817587733268738, -0.9463697075843811, -0.9109806418418884, -0.8755915760993958, -0.8402025103569031, -0.8048134446144104, -0.769424319267273, -0.7340352535247803, -0.6986461877822876, -0.6632571220397949, -0.6278680562973022, -0.5924789905548096, -0.5570899248123169, -0.5217008590698242, -0.48631176352500916, -0.4509226977825165, -0.4155336022377014, -0.38014453649520874, -0.34475547075271606, -0.3093664050102234, -0.2739773392677307, -0.23858824372291565, -0.20319917798042297, -0.1678101122379303, -0.13242103159427643, -0.09703195095062256, -0.061643004417419434, -0.02625393122434616, 0.009135141968727112, 0.044524215161800385, 0.07991328835487366, 0.11530235409736633, 0.1506914347410202, 0.18608051538467407, 0.22146958112716675, 0.2568586468696594, 0.2922477126121521, 0.32763680815696716, 0.36302587389945984, 0.3984149396419525, 0.4338040351867676, 0.46919310092926025, 0.5045821666717529, 0.5399712324142456, 0.5753602981567383, 0.610749363899231, 0.6461384296417236, 0.6815274953842163, 0.7169166207313538, 0.7523056864738464, 0.7876947522163391, 0.8230838179588318, 0.8584728837013245, 0.8938619494438171, 0.9292510747909546, 0.9646401405334473, 1.00002920627594, 1.0354182720184326, 1.0708073377609253]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 17.0, 22.0, 37.0, 41.0, 75.0, 126.0, 199.0, 355.0, 573.0, 1051.0, 1873.0, 3558.0, 6933.0, 13668.0, 29102.0, 63329.0, 147165.0, 379257.0, 1245951.0, 1542764.0, 450125.0, 170834.0, 72489.0, 32850.0, 15658.0, 7738.0, 3832.0, 2072.0, 1073.0, 623.0, 338.0, 196.0, 106.0, 94.0, 57.0, 35.0, 22.0, 12.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2113037109375, -0.20528030395507812, -0.19925689697265625, -0.19323348999023438, -0.1872100830078125, -0.18118667602539062, -0.17516326904296875, -0.16913986206054688, -0.163116455078125, -0.15709304809570312, -0.15106964111328125, -0.14504623413085938, -0.1390228271484375, -0.13299942016601562, -0.12697601318359375, -0.12095260620117188, -0.11492919921875, -0.10890579223632812, -0.10288238525390625, -0.09685897827148438, -0.0908355712890625, -0.08481216430664062, -0.07878875732421875, -0.07276535034179688, -0.066741943359375, -0.060718536376953125, -0.05469512939453125, -0.048671722412109375, -0.0426483154296875, -0.036624908447265625, -0.03060150146484375, -0.024578094482421875, -0.0185546875, -0.012531280517578125, -0.00650787353515625, -0.000484466552734375, 0.0055389404296875, 0.011562347412109375, 0.01758575439453125, 0.023609161376953125, 0.029632568359375, 0.035655975341796875, 0.04167938232421875, 0.047702789306640625, 0.0537261962890625, 0.059749603271484375, 0.06577301025390625, 0.07179641723632812, 0.07781982421875, 0.08384323120117188, 0.08986663818359375, 0.09589004516601562, 0.1019134521484375, 0.10793685913085938, 0.11396026611328125, 0.11998367309570312, 0.126007080078125, 0.13203048706054688, 0.13805389404296875, 0.14407730102539062, 0.1501007080078125, 0.15612411499023438, 0.16214752197265625, 0.16817092895507812, 0.1741943359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 8.0, 3.0, 8.0, 10.0, 6.0, 7.0, 17.0, 16.0, 18.0, 18.0, 23.0, 26.0, 26.0, 29.0, 30.0, 38.0, 44.0, 42.0, 38.0, 49.0, 56.0, 46.0, 50.0, 55.0, 32.0, 43.0, 31.0, 33.0, 29.0, 28.0, 27.0, 23.0, 14.0, 15.0, 15.0, 13.0, 8.0, 9.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.171630859375, -0.16605377197265625, -0.1604766845703125, -0.15489959716796875, -0.149322509765625, -0.14374542236328125, -0.1381683349609375, -0.13259124755859375, -0.12701416015625, -0.12143707275390625, -0.1158599853515625, -0.11028289794921875, -0.104705810546875, -0.09912872314453125, -0.0935516357421875, -0.08797454833984375, -0.0823974609375, -0.07682037353515625, -0.0712432861328125, -0.06566619873046875, -0.060089111328125, -0.05451202392578125, -0.0489349365234375, -0.04335784912109375, -0.03778076171875, -0.03220367431640625, -0.0266265869140625, -0.02104949951171875, -0.015472412109375, -0.00989532470703125, -0.0043182373046875, 0.00125885009765625, 0.0068359375, 0.01241302490234375, 0.0179901123046875, 0.02356719970703125, 0.029144287109375, 0.03472137451171875, 0.0402984619140625, 0.04587554931640625, 0.05145263671875, 0.05702972412109375, 0.0626068115234375, 0.06818389892578125, 0.073760986328125, 0.07933807373046875, 0.0849151611328125, 0.09049224853515625, 0.0960693359375, 0.10164642333984375, 0.1072235107421875, 0.11280059814453125, 0.118377685546875, 0.12395477294921875, 0.1295318603515625, 0.13510894775390625, 0.14068603515625, 0.14626312255859375, 0.1518402099609375, 0.15741729736328125, 0.162994384765625, 0.16857147216796875, 0.1741485595703125, 0.17972564697265625, 0.185302734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 7.0, 9.0, 18.0, 17.0, 27.0, 46.0, 49.0, 68.0, 98.0, 142.0, 181.0, 286.0, 457.0, 804.0, 1573.0, 3158.0, 7431.0, 19474.0, 57065.0, 185844.0, 718559.0, 2143822.0, 763113.0, 197014.0, 59579.0, 20385.0, 7880.0, 3275.0, 1529.0, 849.0, 504.0, 284.0, 220.0, 125.0, 118.0, 69.0, 44.0, 32.0, 22.0, 26.0, 17.0, 14.0, 4.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.36962890625, -0.35790252685546875, -0.3461761474609375, -0.33444976806640625, -0.322723388671875, -0.31099700927734375, -0.2992706298828125, -0.28754425048828125, -0.27581787109375, -0.26409149169921875, -0.2523651123046875, -0.24063873291015625, -0.228912353515625, -0.21718597412109375, -0.2054595947265625, -0.19373321533203125, -0.1820068359375, -0.17028045654296875, -0.1585540771484375, -0.14682769775390625, -0.135101318359375, -0.12337493896484375, -0.1116485595703125, -0.09992218017578125, -0.08819580078125, -0.07646942138671875, -0.0647430419921875, -0.05301666259765625, -0.041290283203125, -0.02956390380859375, -0.0178375244140625, -0.00611114501953125, 0.005615234375, 0.01734161376953125, 0.0290679931640625, 0.04079437255859375, 0.052520751953125, 0.06424713134765625, 0.0759735107421875, 0.08769989013671875, 0.09942626953125, 0.11115264892578125, 0.1228790283203125, 0.13460540771484375, 0.146331787109375, 0.15805816650390625, 0.1697845458984375, 0.18151092529296875, 0.1932373046875, 0.20496368408203125, 0.2166900634765625, 0.22841644287109375, 0.240142822265625, 0.25186920166015625, 0.2635955810546875, 0.27532196044921875, 0.28704833984375, 0.29877471923828125, 0.3105010986328125, 0.32222747802734375, 0.333953857421875, 0.34568023681640625, 0.3574066162109375, 0.36913299560546875, 0.380859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 13.0, 23.0, 23.0, 46.0, 65.0, 84.0, 140.0, 207.0, 376.0, 557.0, 738.0, 597.0, 426.0, 270.0, 155.0, 120.0, 72.0, 57.0, 22.0, 24.0, 18.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3010520935058594, -0.28936004638671875, -0.2776679992675781, -0.2659759521484375, -0.2542839050292969, -0.24259185791015625, -0.23089981079101562, -0.219207763671875, -0.20751571655273438, -0.19582366943359375, -0.18413162231445312, -0.1724395751953125, -0.16074752807617188, -0.14905548095703125, -0.13736343383789062, -0.12567138671875, -0.11397933959960938, -0.10228729248046875, -0.09059524536132812, -0.0789031982421875, -0.06721115112304688, -0.05551910400390625, -0.043827056884765625, -0.032135009765625, -0.020442962646484375, -0.00875091552734375, 0.002941131591796875, 0.0146331787109375, 0.026325225830078125, 0.03801727294921875, 0.049709320068359375, 0.0614013671875, 0.07309341430664062, 0.08478546142578125, 0.09647750854492188, 0.1081695556640625, 0.11986160278320312, 0.13155364990234375, 0.14324569702148438, 0.154937744140625, 0.16662979125976562, 0.17832183837890625, 0.19001388549804688, 0.2017059326171875, 0.21339797973632812, 0.22509002685546875, 0.23678207397460938, 0.24847412109375, 0.2601661682128906, 0.27185821533203125, 0.2835502624511719, 0.2952423095703125, 0.3069343566894531, 0.31862640380859375, 0.3303184509277344, 0.342010498046875, 0.3537025451660156, 0.36539459228515625, 0.3770866394042969, 0.3887786865234375, 0.4004707336425781, 0.41216278076171875, 0.4238548278808594, 0.435546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 6.0, 6.0, 5.0, 11.0, 16.0, 23.0, 36.0, 38.0, 58.0, 64.0, 74.0, 80.0, 80.0, 79.0, 89.0, 78.0, 61.0, 48.0, 39.0, 30.0, 25.0, 13.0, 16.0, 10.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1421663761138916, -1.1003005504608154, -1.0584347248077393, -1.016568899154663, -0.9747030735015869, -0.9328372478485107, -0.8909713625907898, -0.8491055369377136, -0.8072397112846375, -0.7653738856315613, -0.7235080599784851, -0.6816421747207642, -0.639776349067688, -0.5979105234146118, -0.5560446977615356, -0.5141788721084595, -0.4723130464553833, -0.43044722080230713, -0.38858139514923096, -0.3467155396938324, -0.3048497140407562, -0.26298388838768005, -0.2211180329322815, -0.17925220727920532, -0.13738638162612915, -0.09552054852247238, -0.05365471541881561, -0.011788874864578247, 0.030076950788497925, 0.0719427764415741, 0.11380863189697266, 0.15567445755004883, 0.19754040241241455, 0.23940622806549072, 0.2812720537185669, 0.32313790917396545, 0.3650037348270416, 0.4068695604801178, 0.44873541593551636, 0.49060124158859253, 0.5324670672416687, 0.5743328928947449, 0.616198718547821, 0.658064603805542, 0.6999304294586182, 0.7417962551116943, 0.7836620807647705, 0.8255279064178467, 0.8673937320709229, 0.909259557723999, 0.9511253833770752, 0.9929912090301514, 1.0348570346832275, 1.0767228603363037, 1.1185886859893799, 1.160454511642456, 1.2023203372955322, 1.2441861629486084, 1.2860519886016846, 1.3279178142547607, 1.369783639907837, 1.411649465560913, 1.4535152912139893, 1.4953811168670654, 1.5372470617294312]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 6.0, 15.0, 15.0, 10.0, 17.0, 18.0, 19.0, 19.0, 18.0, 24.0, 32.0, 42.0, 33.0, 43.0, 41.0, 31.0, 53.0, 44.0, 40.0, 37.0, 41.0, 38.0, 46.0, 44.0, 34.0, 28.0, 30.0, 32.0, 18.0, 11.0, 18.0, 16.0, 10.0, 17.0, 11.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9363552927970886, -0.9088358879089355, -0.8813164830207825, -0.8537970781326294, -0.8262777328491211, -0.7987582683563232, -0.7712389230728149, -0.7437195181846619, -0.7162001132965088, -0.6886807084083557, -0.6611613035202026, -0.6336418986320496, -0.6061224937438965, -0.5786031484603882, -0.5510837435722351, -0.523564338684082, -0.49604493379592896, -0.4685255289077759, -0.4410061240196228, -0.4134867489337921, -0.38596734404563904, -0.35844793915748596, -0.3309285640716553, -0.3034091591835022, -0.2758897542953491, -0.24837034940719604, -0.22085095942020416, -0.19333156943321228, -0.1658121645450592, -0.13829275965690613, -0.11077336966991425, -0.08325397968292236, -0.05573451519012451, -0.028215117752552032, -0.0006957203149795532, 0.026823677122592926, 0.054343074560165405, 0.08186247944831848, 0.10938186943531036, 0.13690125942230225, 0.16442066431045532, 0.1919400691986084, 0.21945945918560028, 0.24697884917259216, 0.27449825406074524, 0.3020176589488983, 0.329537034034729, 0.3570564389228821, 0.38457584381103516, 0.41209524869918823, 0.4396146535873413, 0.467134028673172, 0.4946534335613251, 0.5221728086471558, 0.5496922135353088, 0.5772116184234619, 0.604731023311615, 0.6322504281997681, 0.6597698330879211, 0.6872892379760742, 0.7148085832595825, 0.7423280477523804, 0.7698473930358887, 0.7973667979240417, 0.8248862028121948]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 5.0, 9.0, 13.0, 20.0, 46.0, 69.0, 85.0, 145.0, 306.0, 561.0, 925.0, 1659.0, 3179.0, 5592.0, 10356.0, 18828.0, 34198.0, 65468.0, 131509.0, 262631.0, 253103.0, 124701.0, 62351.0, 32655.0, 18019.0, 9920.0, 5457.0, 2936.0, 1677.0, 929.0, 506.0, 262.0, 177.0, 96.0, 56.0, 36.0, 24.0, 10.0, 13.0, 6.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228271484375, -0.22039031982421875, -0.2125091552734375, -0.20462799072265625, -0.196746826171875, -0.18886566162109375, -0.1809844970703125, -0.17310333251953125, -0.16522216796875, -0.15734100341796875, -0.1494598388671875, -0.14157867431640625, -0.133697509765625, -0.12581634521484375, -0.1179351806640625, -0.11005401611328125, -0.1021728515625, -0.09429168701171875, -0.0864105224609375, -0.07852935791015625, -0.070648193359375, -0.06276702880859375, -0.0548858642578125, -0.04700469970703125, -0.03912353515625, -0.03124237060546875, -0.0233612060546875, -0.01548004150390625, -0.007598876953125, 0.00028228759765625, 0.0081634521484375, 0.01604461669921875, 0.02392578125, 0.03180694580078125, 0.0396881103515625, 0.04756927490234375, 0.055450439453125, 0.06333160400390625, 0.0712127685546875, 0.07909393310546875, 0.08697509765625, 0.09485626220703125, 0.1027374267578125, 0.11061859130859375, 0.118499755859375, 0.12638092041015625, 0.1342620849609375, 0.14214324951171875, 0.1500244140625, 0.15790557861328125, 0.1657867431640625, 0.17366790771484375, 0.181549072265625, 0.18943023681640625, 0.1973114013671875, 0.20519256591796875, 0.21307373046875, 0.22095489501953125, 0.2288360595703125, 0.23671722412109375, 0.244598388671875, 0.25247955322265625, 0.2603607177734375, 0.26824188232421875, 0.276123046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 8.0, 3.0, 7.0, 13.0, 12.0, 17.0, 19.0, 12.0, 17.0, 21.0, 26.0, 33.0, 27.0, 46.0, 47.0, 42.0, 38.0, 69.0, 49.0, 48.0, 49.0, 36.0, 43.0, 42.0, 39.0, 26.0, 27.0, 25.0, 29.0, 20.0, 23.0, 15.0, 20.0, 11.0, 10.0, 8.0, 3.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1783447265625, -0.17239761352539062, -0.16645050048828125, -0.16050338745117188, -0.1545562744140625, -0.14860916137695312, -0.14266204833984375, -0.13671493530273438, -0.130767822265625, -0.12482070922851562, -0.11887359619140625, -0.11292648315429688, -0.1069793701171875, -0.10103225708007812, -0.09508514404296875, -0.08913803100585938, -0.08319091796875, -0.07724380493164062, -0.07129669189453125, -0.06534957885742188, -0.0594024658203125, -0.053455352783203125, -0.04750823974609375, -0.041561126708984375, -0.035614013671875, -0.029666900634765625, -0.02371978759765625, -0.017772674560546875, -0.0118255615234375, -0.005878448486328125, 6.866455078125e-05, 0.006015777587890625, 0.011962890625, 0.017910003662109375, 0.02385711669921875, 0.029804229736328125, 0.0357513427734375, 0.041698455810546875, 0.04764556884765625, 0.053592681884765625, 0.059539794921875, 0.06548690795898438, 0.07143402099609375, 0.07738113403320312, 0.0833282470703125, 0.08927536010742188, 0.09522247314453125, 0.10116958618164062, 0.10711669921875, 0.11306381225585938, 0.11901092529296875, 0.12495803833007812, 0.1309051513671875, 0.13685226440429688, 0.14279937744140625, 0.14874649047851562, 0.154693603515625, 0.16064071655273438, 0.16658782958984375, 0.17253494262695312, 0.1784820556640625, 0.18442916870117188, 0.19037628173828125, 0.19632339477539062, 0.2022705078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 8.0, 14.0, 11.0, 22.0, 18.0, 32.0, 41.0, 52.0, 74.0, 82.0, 133.0, 200.0, 329.0, 647.0, 1720.0, 4316.0, 12248.0, 35916.0, 113185.0, 475149.0, 294799.0, 71736.0, 24091.0, 8202.0, 3003.0, 1164.0, 506.0, 244.0, 176.0, 93.0, 83.0, 47.0, 41.0, 40.0, 35.0, 14.0, 26.0, 12.0, 13.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.65283203125, -0.6346054077148438, -0.6163787841796875, -0.5981521606445312, -0.579925537109375, -0.5616989135742188, -0.5434722900390625, -0.5252456665039062, -0.50701904296875, -0.48879241943359375, -0.4705657958984375, -0.45233917236328125, -0.434112548828125, -0.41588592529296875, -0.3976593017578125, -0.37943267822265625, -0.3612060546875, -0.34297943115234375, -0.3247528076171875, -0.30652618408203125, -0.288299560546875, -0.27007293701171875, -0.2518463134765625, -0.23361968994140625, -0.21539306640625, -0.19716644287109375, -0.1789398193359375, -0.16071319580078125, -0.142486572265625, -0.12425994873046875, -0.1060333251953125, -0.08780670166015625, -0.069580078125, -0.05135345458984375, -0.0331268310546875, -0.01490020751953125, 0.003326416015625, 0.02155303955078125, 0.0397796630859375, 0.05800628662109375, 0.07623291015625, 0.09445953369140625, 0.1126861572265625, 0.13091278076171875, 0.149139404296875, 0.16736602783203125, 0.1855926513671875, 0.20381927490234375, 0.2220458984375, 0.24027252197265625, 0.2584991455078125, 0.27672576904296875, 0.294952392578125, 0.31317901611328125, 0.3314056396484375, 0.34963226318359375, 0.36785888671875, 0.38608551025390625, 0.4043121337890625, 0.42253875732421875, 0.440765380859375, 0.45899200439453125, 0.4772186279296875, 0.49544525146484375, 0.513671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 13.0, 15.0, 13.0, 17.0, 19.0, 30.0, 23.0, 39.0, 45.0, 47.0, 43.0, 59.0, 41.0, 52.0, 52.0, 55.0, 40.0, 37.0, 50.0, 35.0, 37.0, 43.0, 29.0, 25.0, 27.0, 15.0, 17.0, 7.0, 10.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56787109375, -0.5475997924804688, -0.5273284912109375, -0.5070571899414062, -0.486785888671875, -0.46651458740234375, -0.4462432861328125, -0.42597198486328125, -0.40570068359375, -0.38542938232421875, -0.3651580810546875, -0.34488677978515625, -0.324615478515625, -0.30434417724609375, -0.2840728759765625, -0.26380157470703125, -0.2435302734375, -0.22325897216796875, -0.2029876708984375, -0.18271636962890625, -0.162445068359375, -0.14217376708984375, -0.1219024658203125, -0.10163116455078125, -0.08135986328125, -0.06108856201171875, -0.0408172607421875, -0.02054595947265625, -0.000274658203125, 0.01999664306640625, 0.0402679443359375, 0.06053924560546875, 0.080810546875, 0.10108184814453125, 0.1213531494140625, 0.14162445068359375, 0.161895751953125, 0.18216705322265625, 0.2024383544921875, 0.22270965576171875, 0.24298095703125, 0.26325225830078125, 0.2835235595703125, 0.30379486083984375, 0.324066162109375, 0.34433746337890625, 0.3646087646484375, 0.38488006591796875, 0.4051513671875, 0.42542266845703125, 0.4456939697265625, 0.46596527099609375, 0.486236572265625, 0.5065078735351562, 0.5267791748046875, 0.5470504760742188, 0.56732177734375, 0.5875930786132812, 0.6078643798828125, 0.6281356811523438, 0.648406982421875, 0.6686782836914062, 0.6889495849609375, 0.7092208862304688, 0.7294921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 20.0, 29.0, 43.0, 73.0, 110.0, 236.0, 432.0, 1027.0, 2525.0, 7524.0, 23405.0, 72063.0, 330633.0, 471225.0, 94133.0, 29818.0, 9699.0, 3190.0, 1222.0, 549.0, 243.0, 144.0, 87.0, 40.0, 31.0, 17.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.27072906494140625, -0.2614288330078125, -0.25212860107421875, -0.242828369140625, -0.23352813720703125, -0.2242279052734375, -0.21492767333984375, -0.20562744140625, -0.19632720947265625, -0.1870269775390625, -0.17772674560546875, -0.168426513671875, -0.15912628173828125, -0.1498260498046875, -0.14052581787109375, -0.1312255859375, -0.12192535400390625, -0.1126251220703125, -0.10332489013671875, -0.094024658203125, -0.08472442626953125, -0.0754241943359375, -0.06612396240234375, -0.05682373046875, -0.04752349853515625, -0.0382232666015625, -0.02892303466796875, -0.019622802734375, -0.01032257080078125, -0.0010223388671875, 0.00827789306640625, 0.017578125, 0.02687835693359375, 0.0361785888671875, 0.04547882080078125, 0.054779052734375, 0.06407928466796875, 0.0733795166015625, 0.08267974853515625, 0.09197998046875, 0.10128021240234375, 0.1105804443359375, 0.11988067626953125, 0.129180908203125, 0.13848114013671875, 0.1477813720703125, 0.15708160400390625, 0.1663818359375, 0.17568206787109375, 0.1849822998046875, 0.19428253173828125, 0.203582763671875, 0.21288299560546875, 0.2221832275390625, 0.23148345947265625, 0.24078369140625, 0.25008392333984375, 0.2593841552734375, 0.26868438720703125, 0.277984619140625, 0.28728485107421875, 0.2965850830078125, 0.30588531494140625, 0.315185546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 10.0, 4.0, 8.0, 8.0, 15.0, 22.0, 17.0, 38.0, 42.0, 64.0, 113.0, 104.0, 148.0, 138.0, 90.0, 55.0, 31.0, 23.0, 21.0, 11.0, 8.0, 5.0, 6.0, 3.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-05, -4.2426399886608124e-05, -4.0745362639427185e-05, -3.9064325392246246e-05, -3.738328814506531e-05, -3.570225089788437e-05, -3.402121365070343e-05, -3.234017640352249e-05, -3.065913915634155e-05, -2.8978101909160614e-05, -2.7297064661979675e-05, -2.5616027414798737e-05, -2.3934990167617798e-05, -2.225395292043686e-05, -2.057291567325592e-05, -1.889187842607498e-05, -1.7210841178894043e-05, -1.5529803931713104e-05, -1.3848766684532166e-05, -1.2167729437351227e-05, -1.0486692190170288e-05, -8.80565494298935e-06, -7.124617695808411e-06, -5.443580448627472e-06, -3.762543201446533e-06, -2.0815059542655945e-06, -4.0046870708465576e-07, 1.280568540096283e-06, 2.9616057872772217e-06, 4.64264303445816e-06, 6.323680281639099e-06, 8.004717528820038e-06, 9.685754776000977e-06, 1.1366792023181915e-05, 1.3047829270362854e-05, 1.4728866517543793e-05, 1.640990376472473e-05, 1.809094101190567e-05, 1.977197825908661e-05, 2.1453015506267548e-05, 2.3134052753448486e-05, 2.4815090000629425e-05, 2.6496127247810364e-05, 2.8177164494991302e-05, 2.985820174217224e-05, 3.153923898935318e-05, 3.322027623653412e-05, 3.490131348371506e-05, 3.6582350730895996e-05, 3.8263387978076935e-05, 3.9944425225257874e-05, 4.162546247243881e-05, 4.330649971961975e-05, 4.498753696680069e-05, 4.666857421398163e-05, 4.834961146116257e-05, 5.0030648708343506e-05, 5.1711685955524445e-05, 5.339272320270538e-05, 5.507376044988632e-05, 5.675479769706726e-05, 5.84358349442482e-05, 6.011687219142914e-05, 6.179790943861008e-05, 6.347894668579102e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 9.0, 7.0, 15.0, 30.0, 31.0, 48.0, 62.0, 87.0, 113.0, 163.0, 261.0, 529.0, 1391.0, 4457.0, 16199.0, 57652.0, 242910.0, 544108.0, 130813.0, 35218.0, 9610.0, 2758.0, 980.0, 398.0, 208.0, 142.0, 84.0, 74.0, 43.0, 38.0, 31.0, 22.0, 15.0, 7.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251953125, -0.24335479736328125, -0.2347564697265625, -0.22615814208984375, -0.217559814453125, -0.20896148681640625, -0.2003631591796875, -0.19176483154296875, -0.18316650390625, -0.17456817626953125, -0.1659698486328125, -0.15737152099609375, -0.148773193359375, -0.14017486572265625, -0.1315765380859375, -0.12297821044921875, -0.1143798828125, -0.10578155517578125, -0.0971832275390625, -0.08858489990234375, -0.079986572265625, -0.07138824462890625, -0.0627899169921875, -0.05419158935546875, -0.04559326171875, -0.03699493408203125, -0.0283966064453125, -0.01979827880859375, -0.011199951171875, -0.00260162353515625, 0.0059967041015625, 0.01459503173828125, 0.023193359375, 0.03179168701171875, 0.0403900146484375, 0.04898834228515625, 0.057586669921875, 0.06618499755859375, 0.0747833251953125, 0.08338165283203125, 0.09197998046875, 0.10057830810546875, 0.1091766357421875, 0.11777496337890625, 0.126373291015625, 0.13497161865234375, 0.1435699462890625, 0.15216827392578125, 0.1607666015625, 0.16936492919921875, 0.1779632568359375, 0.18656158447265625, 0.195159912109375, 0.20375823974609375, 0.2123565673828125, 0.22095489501953125, 0.22955322265625, 0.23815155029296875, 0.2467498779296875, 0.25534820556640625, 0.263946533203125, 0.27254486083984375, 0.2811431884765625, 0.28974151611328125, 0.29833984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 12.0, 7.0, 15.0, 16.0, 24.0, 23.0, 37.0, 59.0, 89.0, 139.0, 167.0, 142.0, 85.0, 46.0, 35.0, 22.0, 20.0, 20.0, 11.0, 10.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.408203125, -0.3990459442138672, -0.3898887634277344, -0.38073158264160156, -0.37157440185546875, -0.36241722106933594, -0.3532600402832031, -0.3441028594970703, -0.3349456787109375, -0.3257884979248047, -0.3166313171386719, -0.30747413635253906, -0.29831695556640625, -0.28915977478027344, -0.2800025939941406, -0.2708454132080078, -0.261688232421875, -0.2525310516357422, -0.24337387084960938, -0.23421669006347656, -0.22505950927734375, -0.21590232849121094, -0.20674514770507812, -0.1975879669189453, -0.1884307861328125, -0.1792736053466797, -0.17011642456054688, -0.16095924377441406, -0.15180206298828125, -0.14264488220214844, -0.13348770141601562, -0.12433052062988281, -0.11517333984375, -0.10601615905761719, -0.09685897827148438, -0.08770179748535156, -0.07854461669921875, -0.06938743591308594, -0.060230255126953125, -0.05107307434082031, -0.0419158935546875, -0.03275871276855469, -0.023601531982421875, -0.014444351196289062, -0.00528717041015625, 0.0038700103759765625, 0.013027191162109375, 0.022184371948242188, 0.031341552734375, 0.04049873352050781, 0.049655914306640625, 0.05881309509277344, 0.06797027587890625, 0.07712745666503906, 0.08628463745117188, 0.09544181823730469, 0.1045989990234375, 0.11375617980957031, 0.12291336059570312, 0.13207054138183594, 0.14122772216796875, 0.15038490295410156, 0.15954208374023438, 0.1686992645263672, 0.1778564453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 20.0, 37.0, 64.0, 136.0, 200.0, 196.0, 151.0, 101.0, 59.0, 15.0, 14.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.455748558044434, -4.339577674865723, -4.22340726852417, -4.107236385345459, -3.991065740585327, -3.8748950958251953, -3.7587244510650635, -3.6425538063049316, -3.5263829231262207, -3.410212278366089, -3.294041633605957, -3.177870750427246, -3.0617001056671143, -2.9455294609069824, -2.8293588161468506, -2.7131881713867188, -2.597017526626587, -2.480846881866455, -2.3646762371063232, -2.2485055923461914, -2.1323347091674805, -2.0161640644073486, -1.8999934196472168, -1.783822774887085, -1.6676520109176636, -1.5514813661575317, -1.4353106021881104, -1.3191399574279785, -1.2029693126678467, -1.0867985486984253, -0.9706279039382935, -0.8544571995735168, -0.7382864952087402, -0.6221157908439636, -0.505945086479187, -0.3897744417190552, -0.27360373735427856, -0.15743303298950195, -0.04126238822937012, 0.0749083161354065, 0.1910790205001831, 0.3072497248649597, 0.42342039942741394, 0.5395910739898682, 0.6557617783546448, 0.7719324827194214, 0.8881031274795532, 1.0042738914489746, 1.1204445362091064, 1.2366151809692383, 1.3527859449386597, 1.4689565896987915, 1.585127353668213, 1.7012979984283447, 1.8174686431884766, 1.9336392879486084, 2.0498099327087402, 2.165980577468872, 2.282151222229004, 2.398322105407715, 2.5144927501678467, 2.6306633949279785, 2.7468340396881104, 2.863004684448242, 2.979175567626953]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 10.0, 10.0, 12.0, 14.0, 14.0, 13.0, 21.0, 36.0, 33.0, 27.0, 32.0, 29.0, 39.0, 34.0, 46.0, 34.0, 45.0, 36.0, 55.0, 41.0, 38.0, 36.0, 35.0, 34.0, 33.0, 33.0, 30.0, 31.0, 17.0, 20.0, 17.0, 12.0, 15.0, 11.0, 7.0, 5.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3328157663345337, -1.2871006727218628, -1.241385579109192, -1.195670485496521, -1.1499555110931396, -1.1042404174804688, -1.0585253238677979, -1.012810230255127, -0.967095136642456, -0.9213800430297852, -0.8756649494171143, -0.8299499154090881, -0.7842348217964172, -0.7385197281837463, -0.6928046941757202, -0.6470896005630493, -0.6013745069503784, -0.5556594133377075, -0.5099443197250366, -0.4642292857170105, -0.4185141921043396, -0.3727990984916687, -0.3270840346813202, -0.2813689708709717, -0.23565387725830078, -0.18993879854679108, -0.14422371983528137, -0.09850864112377167, -0.05279356241226196, -0.007078483700752258, 0.038636595010757446, 0.08435165882110596, 0.1300668716430664, 0.1757819503545761, 0.22149702906608582, 0.2672120928764343, 0.3129271864891052, 0.3586422801017761, 0.40435734391212463, 0.45007240772247314, 0.49578750133514404, 0.5415025949478149, 0.5872176885604858, 0.632932722568512, 0.6786478161811829, 0.7243629097938538, 0.7700779438018799, 0.8157930374145508, 0.8615081310272217, 0.9072232246398926, 0.9529383182525635, 0.9986533522605896, 1.0443685054779053, 1.0900834798812866, 1.1357985734939575, 1.1815136671066284, 1.2272287607192993, 1.2729438543319702, 1.3186589479446411, 1.364374041557312, 1.4100890159606934, 1.4558041095733643, 1.5015192031860352, 1.547234296798706, 1.592949390411377]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 7.0, 8.0, 15.0, 34.0, 37.0, 54.0, 74.0, 124.0, 211.0, 311.0, 431.0, 731.0, 1103.0, 1777.0, 2951.0, 4770.0, 8232.0, 13789.0, 24391.0, 43849.0, 82592.0, 164262.0, 356059.0, 850955.0, 1340528.0, 689899.0, 301127.0, 142512.0, 73008.0, 38895.0, 21646.0, 12054.0, 7051.0, 4179.0, 2500.0, 1534.0, 931.0, 620.0, 365.0, 235.0, 151.0, 108.0, 52.0, 43.0, 23.0, 23.0, 10.0, 8.0, 9.0, 2.0, 3.0, 2.0], "bins": [-0.1968994140625, -0.19148826599121094, -0.18607711791992188, -0.1806659698486328, -0.17525482177734375, -0.1698436737060547, -0.16443252563476562, -0.15902137756347656, -0.1536102294921875, -0.14819908142089844, -0.14278793334960938, -0.1373767852783203, -0.13196563720703125, -0.1265544891357422, -0.12114334106445312, -0.11573219299316406, -0.110321044921875, -0.10490989685058594, -0.09949874877929688, -0.09408760070800781, -0.08867645263671875, -0.08326530456542969, -0.07785415649414062, -0.07244300842285156, -0.0670318603515625, -0.06162071228027344, -0.056209564208984375, -0.05079841613769531, -0.04538726806640625, -0.03997611999511719, -0.034564971923828125, -0.029153823852539062, -0.02374267578125, -0.018331527709960938, -0.012920379638671875, -0.0075092315673828125, -0.00209808349609375, 0.0033130645751953125, 0.008724212646484375, 0.014135360717773438, 0.0195465087890625, 0.024957656860351562, 0.030368804931640625, 0.03577995300292969, 0.04119110107421875, 0.04660224914550781, 0.052013397216796875, 0.05742454528808594, 0.062835693359375, 0.06824684143066406, 0.07365798950195312, 0.07906913757324219, 0.08448028564453125, 0.08989143371582031, 0.09530258178710938, 0.10071372985839844, 0.1061248779296875, 0.11153602600097656, 0.11694717407226562, 0.12235832214355469, 0.12776947021484375, 0.1331806182861328, 0.13859176635742188, 0.14400291442871094, 0.1494140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 14.0, 9.0, 16.0, 16.0, 22.0, 20.0, 25.0, 22.0, 27.0, 32.0, 29.0, 29.0, 50.0, 37.0, 42.0, 41.0, 39.0, 38.0, 43.0, 42.0, 41.0, 47.0, 41.0, 44.0, 27.0, 25.0, 28.0, 28.0, 18.0, 12.0, 18.0, 6.0, 14.0, 10.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.16487503051757812, -0.15872955322265625, -0.15258407592773438, -0.1464385986328125, -0.14029312133789062, -0.13414764404296875, -0.12800216674804688, -0.121856689453125, -0.11571121215820312, -0.10956573486328125, -0.10342025756835938, -0.0972747802734375, -0.09112930297851562, -0.08498382568359375, -0.07883834838867188, -0.07269287109375, -0.06654739379882812, -0.06040191650390625, -0.054256439208984375, -0.0481109619140625, -0.041965484619140625, -0.03582000732421875, -0.029674530029296875, -0.023529052734375, -0.017383575439453125, -0.01123809814453125, -0.005092620849609375, 0.0010528564453125, 0.007198333740234375, 0.01334381103515625, 0.019489288330078125, 0.025634765625, 0.031780242919921875, 0.03792572021484375, 0.044071197509765625, 0.0502166748046875, 0.056362152099609375, 0.06250762939453125, 0.06865310668945312, 0.074798583984375, 0.08094406127929688, 0.08708953857421875, 0.09323501586914062, 0.0993804931640625, 0.10552597045898438, 0.11167144775390625, 0.11781692504882812, 0.12396240234375, 0.13010787963867188, 0.13625335693359375, 0.14239883422851562, 0.1485443115234375, 0.15468978881835938, 0.16083526611328125, 0.16698074340820312, 0.173126220703125, 0.17927169799804688, 0.18541717529296875, 0.19156265258789062, 0.1977081298828125, 0.20385360717773438, 0.20999908447265625, 0.21614456176757812, 0.2222900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 11.0, 11.0, 17.0, 35.0, 32.0, 32.0, 66.0, 69.0, 83.0, 123.0, 191.0, 342.0, 581.0, 1035.0, 2104.0, 5127.0, 14529.0, 47196.0, 190048.0, 1082841.0, 2308938.0, 410806.0, 89892.0, 25169.0, 8298.0, 3253.0, 1404.0, 759.0, 418.0, 236.0, 161.0, 110.0, 74.0, 71.0, 50.0, 32.0, 29.0, 21.0, 22.0, 8.0, 12.0, 6.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5617141723632812, -0.5448150634765625, -0.5279159545898438, -0.511016845703125, -0.49411773681640625, -0.4772186279296875, -0.46031951904296875, -0.44342041015625, -0.42652130126953125, -0.4096221923828125, -0.39272308349609375, -0.375823974609375, -0.35892486572265625, -0.3420257568359375, -0.32512664794921875, -0.3082275390625, -0.29132843017578125, -0.2744293212890625, -0.25753021240234375, -0.240631103515625, -0.22373199462890625, -0.2068328857421875, -0.18993377685546875, -0.17303466796875, -0.15613555908203125, -0.1392364501953125, -0.12233734130859375, -0.105438232421875, -0.08853912353515625, -0.0716400146484375, -0.05474090576171875, -0.037841796875, -0.02094268798828125, -0.0040435791015625, 0.01285552978515625, 0.029754638671875, 0.04665374755859375, 0.0635528564453125, 0.08045196533203125, 0.09735107421875, 0.11425018310546875, 0.1311492919921875, 0.14804840087890625, 0.164947509765625, 0.18184661865234375, 0.1987457275390625, 0.21564483642578125, 0.2325439453125, 0.24944305419921875, 0.2663421630859375, 0.28324127197265625, 0.300140380859375, 0.31703948974609375, 0.3339385986328125, 0.35083770751953125, 0.36773681640625, 0.38463592529296875, 0.4015350341796875, 0.41843414306640625, 0.435333251953125, 0.45223236083984375, 0.4691314697265625, 0.48603057861328125, 0.5029296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 6.0, 10.0, 16.0, 22.0, 29.0, 39.0, 67.0, 108.0, 166.0, 291.0, 480.0, 781.0, 821.0, 498.0, 280.0, 172.0, 96.0, 61.0, 41.0, 32.0, 20.0, 8.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7184371948242188, -0.6990814208984375, -0.6797256469726562, -0.660369873046875, -0.6410140991210938, -0.6216583251953125, -0.6023025512695312, -0.58294677734375, -0.5635910034179688, -0.5442352294921875, -0.5248794555664062, -0.505523681640625, -0.48616790771484375, -0.4668121337890625, -0.44745635986328125, -0.4281005859375, -0.40874481201171875, -0.3893890380859375, -0.37003326416015625, -0.350677490234375, -0.33132171630859375, -0.3119659423828125, -0.29261016845703125, -0.27325439453125, -0.25389862060546875, -0.2345428466796875, -0.21518707275390625, -0.195831298828125, -0.17647552490234375, -0.1571197509765625, -0.13776397705078125, -0.118408203125, -0.09905242919921875, -0.0796966552734375, -0.06034088134765625, -0.040985107421875, -0.02162933349609375, -0.0022735595703125, 0.01708221435546875, 0.03643798828125, 0.05579376220703125, 0.0751495361328125, 0.09450531005859375, 0.113861083984375, 0.13321685791015625, 0.1525726318359375, 0.17192840576171875, 0.1912841796875, 0.21063995361328125, 0.2299957275390625, 0.24935150146484375, 0.268707275390625, 0.28806304931640625, 0.3074188232421875, 0.32677459716796875, 0.34613037109375, 0.36548614501953125, 0.3848419189453125, 0.40419769287109375, 0.423553466796875, 0.44290924072265625, 0.4622650146484375, 0.48162078857421875, 0.5009765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 14.0, 22.0, 28.0, 40.0, 47.0, 78.0, 83.0, 117.0, 108.0, 95.0, 107.0, 82.0, 57.0, 51.0, 25.0, 16.0, 8.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.010375499725342, -2.927600383758545, -2.844825029373169, -2.762049913406372, -2.679274797439575, -2.596499443054199, -2.5137243270874023, -2.4309492111206055, -2.3481738567352295, -2.2653987407684326, -2.1826233863830566, -2.0998482704162598, -2.017073154449463, -1.934297800064087, -1.85152268409729, -1.7687474489212036, -1.6859723329544067, -1.6031970977783203, -1.5204219818115234, -1.437646746635437, -1.3548715114593506, -1.2720963954925537, -1.1893211603164673, -1.1065459251403809, -1.023770809173584, -0.9409956336021423, -0.8582203984260559, -0.7754452228546143, -0.6926699876785278, -0.6098948121070862, -0.5271196365356445, -0.4443444013595581, -0.3615691661834717, -0.27879396080970764, -0.1960187703371048, -0.11324357986450195, -0.030468374490737915, 0.05230683088302612, 0.13508200645446777, 0.2178572416305542, 0.30063241720199585, 0.3834076225757599, 0.4661828279495239, 0.5489580035209656, 0.6317331790924072, 0.7145084142684937, 0.7972835898399353, 0.8800588250160217, 0.9628340005874634, 1.0456092357635498, 1.1283843517303467, 1.211159586906433, 1.2939348220825195, 1.3767099380493164, 1.4594851732254028, 1.5422604084014893, 1.6250355243682861, 1.7078107595443726, 1.7905858755111694, 1.8733611106872559, 1.9561363458633423, 2.0389115810394287, 2.1216866970062256, 2.2044620513916016, 2.2872371673583984]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 11.0, 7.0, 3.0, 14.0, 17.0, 16.0, 17.0, 19.0, 17.0, 30.0, 30.0, 25.0, 36.0, 34.0, 51.0, 41.0, 29.0, 46.0, 50.0, 46.0, 52.0, 45.0, 39.0, 47.0, 34.0, 47.0, 29.0, 28.0, 17.0, 17.0, 23.0, 17.0, 20.0, 16.0, 7.0, 8.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2766914367675781, -1.2308825254440308, -1.185073733329773, -1.1392648220062256, -1.0934559106826782, -1.0476469993591309, -1.001838207244873, -0.9560292959213257, -0.9102203845977783, -0.8644115328788757, -0.8186026215553284, -0.7727937698364258, -0.7269848585128784, -0.6811760067939758, -0.6353671550750732, -0.5895582437515259, -0.5437493920326233, -0.4979405105113983, -0.45213162899017334, -0.40632277727127075, -0.3605138659477234, -0.3147050142288208, -0.2688961327075958, -0.22308725118637085, -0.17727836966514587, -0.1314694881439209, -0.08566061407327652, -0.03985174000263214, 0.0059571415185928345, 0.05176602303981781, 0.09757488965988159, 0.14338377118110657, 0.18919265270233154, 0.23500153422355652, 0.2808104157447815, 0.3266192674636841, 0.37242817878723145, 0.41823703050613403, 0.464045912027359, 0.509854793548584, 0.5556637048721313, 0.6014725565910339, 0.6472814679145813, 0.6930903196334839, 0.7388992309570312, 0.7847080826759338, 0.8305169343948364, 0.8763258457183838, 0.9221346974372864, 0.967943549156189, 1.0137524604797363, 1.0595613718032837, 1.1053701639175415, 1.1511790752410889, 1.1969879865646362, 1.2427968978881836, 1.2886056900024414, 1.3344146013259888, 1.3802233934402466, 1.426032304763794, 1.4718412160873413, 1.5176501274108887, 1.5634589195251465, 1.6092678308486938, 1.6550767421722412]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 11.0, 22.0, 28.0, 45.0, 61.0, 84.0, 140.0, 216.0, 341.0, 516.0, 808.0, 1346.0, 1931.0, 3061.0, 4649.0, 7013.0, 10407.0, 16070.0, 25176.0, 40532.0, 68103.0, 116395.0, 190196.0, 209944.0, 139378.0, 81115.0, 47527.0, 29253.0, 18830.0, 12256.0, 7961.0, 5284.0, 3426.0, 2264.0, 1450.0, 965.0, 609.0, 419.0, 256.0, 169.0, 93.0, 66.0, 41.0, 29.0, 21.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.22998046875, -0.22260093688964844, -0.21522140502929688, -0.2078418731689453, -0.20046234130859375, -0.1930828094482422, -0.18570327758789062, -0.17832374572753906, -0.1709442138671875, -0.16356468200683594, -0.15618515014648438, -0.1488056182861328, -0.14142608642578125, -0.1340465545654297, -0.12666702270507812, -0.11928749084472656, -0.111907958984375, -0.10452842712402344, -0.09714889526367188, -0.08976936340332031, -0.08238983154296875, -0.07501029968261719, -0.06763076782226562, -0.06025123596191406, -0.0528717041015625, -0.04549217224121094, -0.038112640380859375, -0.030733108520507812, -0.02335357666015625, -0.015974044799804688, -0.008594512939453125, -0.0012149810791015625, 0.00616455078125, 0.013544082641601562, 0.020923614501953125, 0.028303146362304688, 0.03568267822265625, 0.04306221008300781, 0.050441741943359375, 0.05782127380371094, 0.0652008056640625, 0.07258033752441406, 0.07995986938476562, 0.08733940124511719, 0.09471893310546875, 0.10209846496582031, 0.10947799682617188, 0.11685752868652344, 0.124237060546875, 0.13161659240722656, 0.13899612426757812, 0.1463756561279297, 0.15375518798828125, 0.1611347198486328, 0.16851425170898438, 0.17589378356933594, 0.1832733154296875, 0.19065284729003906, 0.19803237915039062, 0.2054119110107422, 0.21279144287109375, 0.2201709747314453, 0.22755050659179688, 0.23493003845214844, 0.2423095703125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 7.0, 8.0, 13.0, 13.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 28.0, 27.0, 35.0, 26.0, 29.0, 33.0, 42.0, 33.0, 36.0, 34.0, 43.0, 54.0, 38.0, 32.0, 46.0, 36.0, 44.0, 37.0, 23.0, 24.0, 17.0, 25.0, 11.0, 14.0, 20.0, 14.0, 8.0, 12.0, 3.0, 4.0, 5.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2021484375, -0.19617843627929688, -0.19020843505859375, -0.18423843383789062, -0.1782684326171875, -0.17229843139648438, -0.16632843017578125, -0.16035842895507812, -0.154388427734375, -0.14841842651367188, -0.14244842529296875, -0.13647842407226562, -0.1305084228515625, -0.12453842163085938, -0.11856842041015625, -0.11259841918945312, -0.10662841796875, -0.10065841674804688, -0.09468841552734375, -0.08871841430664062, -0.0827484130859375, -0.07677841186523438, -0.07080841064453125, -0.06483840942382812, -0.058868408203125, -0.052898406982421875, -0.04692840576171875, -0.040958404541015625, -0.0349884033203125, -0.029018402099609375, -0.02304840087890625, -0.017078399658203125, -0.0111083984375, -0.005138397216796875, 0.00083160400390625, 0.006801605224609375, 0.0127716064453125, 0.018741607666015625, 0.02471160888671875, 0.030681610107421875, 0.036651611328125, 0.042621612548828125, 0.04859161376953125, 0.054561614990234375, 0.0605316162109375, 0.06650161743164062, 0.07247161865234375, 0.07844161987304688, 0.08441162109375, 0.09038162231445312, 0.09635162353515625, 0.10232162475585938, 0.1082916259765625, 0.11426162719726562, 0.12023162841796875, 0.12620162963867188, 0.132171630859375, 0.13814163208007812, 0.14411163330078125, 0.15008163452148438, 0.1560516357421875, 0.16202163696289062, 0.16799163818359375, 0.17396163940429688, 0.179931640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 8.0, 11.0, 20.0, 31.0, 38.0, 55.0, 106.0, 193.0, 259.0, 563.0, 1659.0, 8460.0, 56322.0, 421969.0, 480558.0, 65236.0, 9810.0, 1817.0, 598.0, 332.0, 190.0, 90.0, 85.0, 41.0, 32.0, 19.0, 19.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0225982666015625, -0.988555908203125, -0.9545135498046875, -0.92047119140625, -0.8864288330078125, -0.852386474609375, -0.8183441162109375, -0.7843017578125, -0.7502593994140625, -0.716217041015625, -0.6821746826171875, -0.64813232421875, -0.6140899658203125, -0.580047607421875, -0.5460052490234375, -0.511962890625, -0.4779205322265625, -0.443878173828125, -0.4098358154296875, -0.37579345703125, -0.3417510986328125, -0.307708740234375, -0.2736663818359375, -0.2396240234375, -0.2055816650390625, -0.171539306640625, -0.1374969482421875, -0.10345458984375, -0.0694122314453125, -0.035369873046875, -0.0013275146484375, 0.03271484375, 0.0667572021484375, 0.100799560546875, 0.1348419189453125, 0.16888427734375, 0.2029266357421875, 0.236968994140625, 0.2710113525390625, 0.3050537109375, 0.3390960693359375, 0.373138427734375, 0.4071807861328125, 0.44122314453125, 0.4752655029296875, 0.509307861328125, 0.5433502197265625, 0.577392578125, 0.6114349365234375, 0.645477294921875, 0.6795196533203125, 0.71356201171875, 0.7476043701171875, 0.781646728515625, 0.8156890869140625, 0.8497314453125, 0.8837738037109375, 0.917816162109375, 0.9518585205078125, 0.98590087890625, 1.0199432373046875, 1.053985595703125, 1.0880279541015625, 1.1220703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 10.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 23.0, 26.0, 25.0, 27.0, 29.0, 40.0, 35.0, 45.0, 40.0, 44.0, 53.0, 37.0, 34.0, 36.0, 40.0, 51.0, 51.0, 43.0, 39.0, 33.0, 28.0, 20.0, 25.0, 16.0, 13.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.81396484375, -0.7909622192382812, -0.7679595947265625, -0.7449569702148438, -0.721954345703125, -0.6989517211914062, -0.6759490966796875, -0.6529464721679688, -0.62994384765625, -0.6069412231445312, -0.5839385986328125, -0.5609359741210938, -0.537933349609375, -0.5149307250976562, -0.4919281005859375, -0.46892547607421875, -0.4459228515625, -0.42292022705078125, -0.3999176025390625, -0.37691497802734375, -0.353912353515625, -0.33090972900390625, -0.3079071044921875, -0.28490447998046875, -0.26190185546875, -0.23889923095703125, -0.2158966064453125, -0.19289398193359375, -0.169891357421875, -0.14688873291015625, -0.1238861083984375, -0.10088348388671875, -0.077880859375, -0.05487823486328125, -0.0318756103515625, -0.00887298583984375, 0.014129638671875, 0.03713226318359375, 0.0601348876953125, 0.08313751220703125, 0.10614013671875, 0.12914276123046875, 0.1521453857421875, 0.17514801025390625, 0.198150634765625, 0.22115325927734375, 0.2441558837890625, 0.26715850830078125, 0.2901611328125, 0.31316375732421875, 0.3361663818359375, 0.35916900634765625, 0.382171630859375, 0.40517425537109375, 0.4281768798828125, 0.45117950439453125, 0.47418212890625, 0.49718475341796875, 0.5201873779296875, 0.5431900024414062, 0.566192626953125, 0.5891952514648438, 0.6121978759765625, 0.6352005004882812, 0.658203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 9.0, 10.0, 20.0, 19.0, 37.0, 46.0, 85.0, 149.0, 203.0, 289.0, 569.0, 1095.0, 2323.0, 5615.0, 14296.0, 38078.0, 101270.0, 276831.0, 372793.0, 145922.0, 54070.0, 20588.0, 7893.0, 3212.0, 1393.0, 714.0, 353.0, 231.0, 124.0, 73.0, 68.0, 61.0, 32.0, 12.0, 16.0, 14.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.268798828125, -0.2613697052001953, -0.2539405822753906, -0.24651145935058594, -0.23908233642578125, -0.23165321350097656, -0.22422409057617188, -0.2167949676513672, -0.2093658447265625, -0.2019367218017578, -0.19450759887695312, -0.18707847595214844, -0.17964935302734375, -0.17222023010253906, -0.16479110717773438, -0.1573619842529297, -0.149932861328125, -0.1425037384033203, -0.13507461547851562, -0.12764549255371094, -0.12021636962890625, -0.11278724670410156, -0.10535812377929688, -0.09792900085449219, -0.0904998779296875, -0.08307075500488281, -0.07564163208007812, -0.06821250915527344, -0.06078338623046875, -0.05335426330566406, -0.045925140380859375, -0.03849601745605469, -0.03106689453125, -0.023637771606445312, -0.016208648681640625, -0.008779525756835938, -0.00135040283203125, 0.0060787200927734375, 0.013507843017578125, 0.020936965942382812, 0.0283660888671875, 0.03579521179199219, 0.043224334716796875, 0.05065345764160156, 0.05808258056640625, 0.06551170349121094, 0.07294082641601562, 0.08036994934082031, 0.087799072265625, 0.09522819519042969, 0.10265731811523438, 0.11008644104003906, 0.11751556396484375, 0.12494468688964844, 0.13237380981445312, 0.1398029327392578, 0.1472320556640625, 0.1546611785888672, 0.16209030151367188, 0.16951942443847656, 0.17694854736328125, 0.18437767028808594, 0.19180679321289062, 0.1992359161376953, 0.2066650390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 10.0, 16.0, 14.0, 26.0, 31.0, 34.0, 41.0, 58.0, 90.0, 102.0, 101.0, 96.0, 75.0, 64.0, 44.0, 38.0, 25.0, 24.0, 16.0, 8.0, 17.0, 5.0, 10.0, 8.0, 8.0, 2.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.780292510986328e-05, -4.628114402294159e-05, -4.47593629360199e-05, -4.3237581849098206e-05, -4.1715800762176514e-05, -4.019401967525482e-05, -3.867223858833313e-05, -3.715045750141144e-05, -3.5628676414489746e-05, -3.4106895327568054e-05, -3.258511424064636e-05, -3.106333315372467e-05, -2.954155206680298e-05, -2.8019770979881287e-05, -2.6497989892959595e-05, -2.4976208806037903e-05, -2.345442771911621e-05, -2.193264663219452e-05, -2.0410865545272827e-05, -1.8889084458351135e-05, -1.7367303371429443e-05, -1.584552228450775e-05, -1.432374119758606e-05, -1.2801960110664368e-05, -1.1280179023742676e-05, -9.758397936820984e-06, -8.236616849899292e-06, -6.7148357629776e-06, -5.193054676055908e-06, -3.6712735891342163e-06, -2.1494925022125244e-06, -6.277114152908325e-07, 8.940696716308594e-07, 2.4158507585525513e-06, 3.937631845474243e-06, 5.459412932395935e-06, 6.981194019317627e-06, 8.502975106239319e-06, 1.002475619316101e-05, 1.1546537280082703e-05, 1.3068318367004395e-05, 1.4590099453926086e-05, 1.611188054084778e-05, 1.763366162776947e-05, 1.9155442714691162e-05, 2.0677223801612854e-05, 2.2199004888534546e-05, 2.3720785975456238e-05, 2.524256706237793e-05, 2.676434814929962e-05, 2.8286129236221313e-05, 2.9807910323143005e-05, 3.13296914100647e-05, 3.285147249698639e-05, 3.437325358390808e-05, 3.589503467082977e-05, 3.7416815757751465e-05, 3.893859684467316e-05, 4.046037793159485e-05, 4.198215901851654e-05, 4.350394010543823e-05, 4.5025721192359924e-05, 4.6547502279281616e-05, 4.806928336620331e-05, 4.9591064453125e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 11.0, 23.0, 14.0, 47.0, 57.0, 79.0, 98.0, 158.0, 294.0, 662.0, 1493.0, 4430.0, 15705.0, 57710.0, 210430.0, 469899.0, 207879.0, 56757.0, 15461.0, 4428.0, 1531.0, 583.0, 283.0, 144.0, 113.0, 72.0, 39.0, 39.0, 27.0, 10.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.31201171875, -0.30269622802734375, -0.2933807373046875, -0.28406524658203125, -0.274749755859375, -0.26543426513671875, -0.2561187744140625, -0.24680328369140625, -0.23748779296875, -0.22817230224609375, -0.2188568115234375, -0.20954132080078125, -0.200225830078125, -0.19091033935546875, -0.1815948486328125, -0.17227935791015625, -0.1629638671875, -0.15364837646484375, -0.1443328857421875, -0.13501739501953125, -0.125701904296875, -0.11638641357421875, -0.1070709228515625, -0.09775543212890625, -0.08843994140625, -0.07912445068359375, -0.0698089599609375, -0.06049346923828125, -0.051177978515625, -0.04186248779296875, -0.0325469970703125, -0.02323150634765625, -0.013916015625, -0.00460052490234375, 0.0047149658203125, 0.01403045654296875, 0.023345947265625, 0.03266143798828125, 0.0419769287109375, 0.05129241943359375, 0.06060791015625, 0.06992340087890625, 0.0792388916015625, 0.08855438232421875, 0.097869873046875, 0.10718536376953125, 0.1165008544921875, 0.12581634521484375, 0.1351318359375, 0.14444732666015625, 0.1537628173828125, 0.16307830810546875, 0.172393798828125, 0.18170928955078125, 0.1910247802734375, 0.20034027099609375, 0.20965576171875, 0.21897125244140625, 0.2282867431640625, 0.23760223388671875, 0.246917724609375, 0.25623321533203125, 0.2655487060546875, 0.27486419677734375, 0.2841796875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 12.0, 14.0, 17.0, 14.0, 22.0, 21.0, 25.0, 35.0, 26.0, 39.0, 47.0, 61.0, 73.0, 56.0, 60.0, 64.0, 47.0, 42.0, 54.0, 31.0, 42.0, 31.0, 23.0, 17.0, 14.0, 14.0, 15.0, 12.0, 10.0, 6.0, 10.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17694854736328125, -0.1712799072265625, -0.16561126708984375, -0.159942626953125, -0.15427398681640625, -0.1486053466796875, -0.14293670654296875, -0.13726806640625, -0.13159942626953125, -0.1259307861328125, -0.12026214599609375, -0.114593505859375, -0.10892486572265625, -0.1032562255859375, -0.09758758544921875, -0.0919189453125, -0.08625030517578125, -0.0805816650390625, -0.07491302490234375, -0.069244384765625, -0.06357574462890625, -0.0579071044921875, -0.05223846435546875, -0.04656982421875, -0.04090118408203125, -0.0352325439453125, -0.02956390380859375, -0.023895263671875, -0.01822662353515625, -0.0125579833984375, -0.00688934326171875, -0.001220703125, 0.00444793701171875, 0.0101165771484375, 0.01578521728515625, 0.021453857421875, 0.02712249755859375, 0.0327911376953125, 0.03845977783203125, 0.04412841796875, 0.04979705810546875, 0.0554656982421875, 0.06113433837890625, 0.066802978515625, 0.07247161865234375, 0.0781402587890625, 0.08380889892578125, 0.0894775390625, 0.09514617919921875, 0.1008148193359375, 0.10648345947265625, 0.112152099609375, 0.11782073974609375, 0.1234893798828125, 0.12915802001953125, 0.13482666015625, 0.14049530029296875, 0.1461639404296875, 0.15183258056640625, 0.157501220703125, 0.16316986083984375, 0.1688385009765625, 0.17450714111328125, 0.18017578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 3.0, 5.0, 11.0, 12.0, 34.0, 64.0, 128.0, 148.0, 178.0, 189.0, 120.0, 70.0, 28.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685758113861084, -1.539783239364624, -1.393808364868164, -1.2478336095809937, -1.1018587350845337, -0.9558838605880737, -0.8099090456962585, -0.6639342308044434, -0.5179593563079834, -0.3719845116138458, -0.22600966691970825, -0.08003482222557068, 0.0659400224685669, 0.21191489696502686, 0.35788971185684204, 0.5038645267486572, 0.6498394012451172, 0.7958142757415771, 0.9417890906333923, 1.0877639055252075, 1.2337387800216675, 1.3797136545181274, 1.5256884098052979, 1.6716632843017578, 1.8176381587982178, 1.9636130332946777, 2.1095879077911377, 2.2555627822875977, 2.4015374183654785, 2.5475125312805176, 2.6934871673583984, 2.8394620418548584, 2.9854373931884766, 3.1314122676849365, 3.2773871421813965, 3.4233620166778564, 3.5693368911743164, 3.7153115272521973, 3.8612864017486572, 4.007261276245117, 4.153236389160156, 4.299211025238037, 4.445186138153076, 4.591160774230957, 4.737135887145996, 4.883110523223877, 5.029085636138916, 5.175060272216797, 5.321034908294678, 5.467009544372559, 5.612984657287598, 5.7589592933654785, 5.904934406280518, 6.050909042358398, 6.1968841552734375, 6.342858791351318, 6.488833427429199, 6.63480806350708, 6.780783176422119, 6.9267578125, 7.072732925415039, 7.21870756149292, 7.364682674407959, 7.51065731048584, 7.656632423400879]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 3.0, 6.0, 8.0, 5.0, 11.0, 20.0, 13.0, 11.0, 15.0, 29.0, 34.0, 14.0, 30.0, 34.0, 33.0, 35.0, 27.0, 32.0, 41.0, 38.0, 48.0, 31.0, 33.0, 31.0, 33.0, 39.0, 38.0, 36.0, 21.0, 31.0, 20.0, 29.0, 29.0, 10.0, 12.0, 15.0, 12.0, 16.0, 21.0, 10.0, 5.0, 8.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0], "bins": [-1.900040626525879, -1.8429653644561768, -1.7858901023864746, -1.7288148403167725, -1.6717395782470703, -1.6146643161773682, -1.5575891733169556, -1.5005139112472534, -1.4434386491775513, -1.3863633871078491, -1.329288125038147, -1.2722128629684448, -1.2151377201080322, -1.15806245803833, -1.100987195968628, -1.0439119338989258, -0.9868366718292236, -0.9297614097595215, -0.8726861476898193, -0.815610945224762, -0.7585356831550598, -0.7014604210853577, -0.6443852186203003, -0.5873099565505981, -0.530234694480896, -0.47315943241119385, -0.4160842001438141, -0.3590089678764343, -0.3019337058067322, -0.24485844373703003, -0.18778321146965027, -0.1307079792022705, -0.07363271713256836, -0.016557469964027405, 0.04051777720451355, 0.0975930243730545, 0.15466827154159546, 0.2117435336112976, 0.26881876587867737, 0.32589399814605713, 0.3829692602157593, 0.4400445222854614, 0.4971197545528412, 0.554194986820221, 0.6112702488899231, 0.6683455109596252, 0.7254207134246826, 0.7824959754943848, 0.8395712375640869, 0.8966464996337891, 0.9537217617034912, 1.0107970237731934, 1.0678722858428955, 1.1249475479125977, 1.1820226907730103, 1.2390979528427124, 1.2961732149124146, 1.3532484769821167, 1.4103237390518188, 1.467399001121521, 1.5244741439819336, 1.5815494060516357, 1.638624668121338, 1.69569993019104, 1.7527751922607422]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 9.0, 6.0, 5.0, 16.0, 31.0, 42.0, 61.0, 93.0, 145.0, 239.0, 375.0, 610.0, 1042.0, 1816.0, 3158.0, 5713.0, 10698.0, 20597.0, 40688.0, 83411.0, 184666.0, 468752.0, 1278393.0, 1275893.0, 466154.0, 183399.0, 82956.0, 40553.0, 20778.0, 10731.0, 5710.0, 3208.0, 1763.0, 961.0, 615.0, 372.0, 229.0, 133.0, 86.0, 54.0, 36.0, 33.0, 19.0, 14.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.277099609375, -0.26940155029296875, -0.2617034912109375, -0.25400543212890625, -0.246307373046875, -0.23860931396484375, -0.2309112548828125, -0.22321319580078125, -0.21551513671875, -0.20781707763671875, -0.2001190185546875, -0.19242095947265625, -0.184722900390625, -0.17702484130859375, -0.1693267822265625, -0.16162872314453125, -0.1539306640625, -0.14623260498046875, -0.1385345458984375, -0.13083648681640625, -0.123138427734375, -0.11544036865234375, -0.1077423095703125, -0.10004425048828125, -0.09234619140625, -0.08464813232421875, -0.0769500732421875, -0.06925201416015625, -0.061553955078125, -0.05385589599609375, -0.0461578369140625, -0.03845977783203125, -0.03076171875, -0.02306365966796875, -0.0153656005859375, -0.00766754150390625, 3.0517578125e-05, 0.00772857666015625, 0.0154266357421875, 0.02312469482421875, 0.03082275390625, 0.03852081298828125, 0.0462188720703125, 0.05391693115234375, 0.061614990234375, 0.06931304931640625, 0.0770111083984375, 0.08470916748046875, 0.0924072265625, 0.10010528564453125, 0.1078033447265625, 0.11550140380859375, 0.123199462890625, 0.13089752197265625, 0.1385955810546875, 0.14629364013671875, 0.15399169921875, 0.16168975830078125, 0.1693878173828125, 0.17708587646484375, 0.184783935546875, 0.19248199462890625, 0.2001800537109375, 0.20787811279296875, 0.215576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 16.0, 14.0, 8.0, 15.0, 16.0, 22.0, 23.0, 29.0, 24.0, 24.0, 38.0, 35.0, 37.0, 30.0, 47.0, 31.0, 43.0, 35.0, 33.0, 54.0, 40.0, 44.0, 31.0, 36.0, 29.0, 29.0, 22.0, 27.0, 25.0, 17.0, 21.0, 17.0, 9.0, 9.0, 9.0, 8.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.23486328125, -0.22769737243652344, -0.22053146362304688, -0.2133655548095703, -0.20619964599609375, -0.1990337371826172, -0.19186782836914062, -0.18470191955566406, -0.1775360107421875, -0.17037010192871094, -0.16320419311523438, -0.1560382843017578, -0.14887237548828125, -0.1417064666748047, -0.13454055786132812, -0.12737464904785156, -0.120208740234375, -0.11304283142089844, -0.10587692260742188, -0.09871101379394531, -0.09154510498046875, -0.08437919616699219, -0.07721328735351562, -0.07004737854003906, -0.0628814697265625, -0.05571556091308594, -0.048549652099609375, -0.04138374328613281, -0.03421783447265625, -0.027051925659179688, -0.019886016845703125, -0.012720108032226562, -0.00555419921875, 0.0016117095947265625, 0.008777618408203125, 0.015943527221679688, 0.02310943603515625, 0.030275344848632812, 0.037441253662109375, 0.04460716247558594, 0.0517730712890625, 0.05893898010253906, 0.06610488891601562, 0.07327079772949219, 0.08043670654296875, 0.08760261535644531, 0.09476852416992188, 0.10193443298339844, 0.109100341796875, 0.11626625061035156, 0.12343215942382812, 0.1305980682373047, 0.13776397705078125, 0.1449298858642578, 0.15209579467773438, 0.15926170349121094, 0.1664276123046875, 0.17359352111816406, 0.18075942993164062, 0.1879253387451172, 0.19509124755859375, 0.2022571563720703, 0.20942306518554688, 0.21658897399902344, 0.2237548828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 15.0, 12.0, 31.0, 38.0, 50.0, 60.0, 81.0, 126.0, 208.0, 328.0, 547.0, 912.0, 1765.0, 3688.0, 8643.0, 21244.0, 55631.0, 156396.0, 494934.0, 1772566.0, 1184726.0, 318051.0, 107297.0, 38719.0, 15371.0, 6466.0, 2879.0, 1388.0, 805.0, 428.0, 260.0, 179.0, 126.0, 83.0, 74.0, 42.0, 31.0, 28.0, 18.0, 9.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39794921875, -0.38364410400390625, -0.3693389892578125, -0.35503387451171875, -0.340728759765625, -0.32642364501953125, -0.3121185302734375, -0.29781341552734375, -0.28350830078125, -0.26920318603515625, -0.2548980712890625, -0.24059295654296875, -0.226287841796875, -0.21198272705078125, -0.1976776123046875, -0.18337249755859375, -0.1690673828125, -0.15476226806640625, -0.1404571533203125, -0.12615203857421875, -0.111846923828125, -0.09754180908203125, -0.0832366943359375, -0.06893157958984375, -0.05462646484375, -0.04032135009765625, -0.0260162353515625, -0.01171112060546875, 0.002593994140625, 0.01689910888671875, 0.0312042236328125, 0.04550933837890625, 0.059814453125, 0.07411956787109375, 0.0884246826171875, 0.10272979736328125, 0.117034912109375, 0.13134002685546875, 0.1456451416015625, 0.15995025634765625, 0.17425537109375, 0.18856048583984375, 0.2028656005859375, 0.21717071533203125, 0.231475830078125, 0.24578094482421875, 0.2600860595703125, 0.27439117431640625, 0.2886962890625, 0.30300140380859375, 0.3173065185546875, 0.33161163330078125, 0.345916748046875, 0.36022186279296875, 0.3745269775390625, 0.38883209228515625, 0.40313720703125, 0.41744232177734375, 0.4317474365234375, 0.44605255126953125, 0.460357666015625, 0.47466278076171875, 0.4889678955078125, 0.5032730102539062, 0.517578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 7.0, 21.0, 34.0, 40.0, 79.0, 136.0, 209.0, 370.0, 602.0, 850.0, 667.0, 375.0, 234.0, 129.0, 105.0, 61.0, 38.0, 39.0, 21.0, 13.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4825439453125, -0.459228515625, -0.4359130859375, -0.41259765625, -0.3892822265625, -0.365966796875, -0.3426513671875, -0.3193359375, -0.2960205078125, -0.272705078125, -0.2493896484375, -0.22607421875, -0.2027587890625, -0.179443359375, -0.1561279296875, -0.1328125, -0.1094970703125, -0.086181640625, -0.0628662109375, -0.03955078125, -0.0162353515625, 0.007080078125, 0.0303955078125, 0.0537109375, 0.0770263671875, 0.100341796875, 0.1236572265625, 0.14697265625, 0.1702880859375, 0.193603515625, 0.2169189453125, 0.240234375, 0.2635498046875, 0.286865234375, 0.3101806640625, 0.33349609375, 0.3568115234375, 0.380126953125, 0.4034423828125, 0.4267578125, 0.4500732421875, 0.473388671875, 0.4967041015625, 0.52001953125, 0.5433349609375, 0.566650390625, 0.5899658203125, 0.61328125, 0.6365966796875, 0.659912109375, 0.6832275390625, 0.70654296875, 0.7298583984375, 0.753173828125, 0.7764892578125, 0.7998046875, 0.8231201171875, 0.846435546875, 0.8697509765625, 0.89306640625, 0.9163818359375, 0.939697265625, 0.9630126953125, 0.986328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 7.0, 11.0, 15.0, 11.0, 39.0, 45.0, 55.0, 65.0, 80.0, 92.0, 93.0, 87.0, 87.0, 85.0, 50.0, 62.0, 27.0, 30.0, 12.0, 12.0, 13.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943532705307007, -2.8673970699310303, -2.791261672973633, -2.7151260375976562, -2.6389904022216797, -2.562854766845703, -2.4867191314697266, -2.410583734512329, -2.3344480991363525, -2.258312463760376, -2.1821770668029785, -2.106041431427002, -2.0299057960510254, -1.9537701606750488, -1.8776346445083618, -1.8014991283416748, -1.7253634929656982, -1.6492278575897217, -1.5730923414230347, -1.4969568252563477, -1.420821189880371, -1.3446855545043945, -1.2685500383377075, -1.1924145221710205, -1.116278886795044, -1.0401432514190674, -0.9640077352523804, -0.8878721594810486, -0.8117365837097168, -0.735601007938385, -0.6594654321670532, -0.5833298563957214, -0.5071942806243896, -0.43105870485305786, -0.3549231290817261, -0.2787875533103943, -0.2026519775390625, -0.1265164017677307, -0.050380825996398926, 0.02575474977493286, 0.10189032554626465, 0.17802590131759644, 0.2541614770889282, 0.33029705286026, 0.4064326286315918, 0.4825682044029236, 0.5587037801742554, 0.6348393559455872, 0.710974931716919, 0.7871105074882507, 0.8632460832595825, 0.9393816590309143, 1.015517234802246, 1.0916528701782227, 1.1677883863449097, 1.2439239025115967, 1.3200595378875732, 1.3961951732635498, 1.4723306894302368, 1.5484662055969238, 1.6246018409729004, 1.700737476348877, 1.776872992515564, 1.853008508682251, 1.9291441440582275]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 6.0, 7.0, 8.0, 15.0, 12.0, 11.0, 20.0, 16.0, 28.0, 28.0, 27.0, 34.0, 40.0, 37.0, 39.0, 41.0, 42.0, 49.0, 35.0, 35.0, 39.0, 34.0, 42.0, 34.0, 42.0, 44.0, 24.0, 26.0, 33.0, 23.0, 25.0, 16.0, 14.0, 8.0, 11.0, 8.0, 3.0, 5.0, 5.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6516945362091064, -1.5991718769073486, -1.5466490983963013, -1.4941264390945435, -1.4416037797927856, -1.3890810012817383, -1.3365583419799805, -1.2840356826782227, -1.2315130233764648, -1.178990364074707, -1.1264675855636597, -1.0739449262619019, -1.021422266960144, -0.9688995480537415, -0.9163768291473389, -0.863854169845581, -0.8113313913345337, -0.7588086724281311, -0.7062860131263733, -0.6537632942199707, -0.6012406349182129, -0.5487179160118103, -0.4961951971054077, -0.4436725080013275, -0.3911498188972473, -0.3386271297931671, -0.2861044406890869, -0.23358172178268433, -0.18105903267860413, -0.12853634357452393, -0.07601362466812134, -0.023490935564041138, 0.029031753540039062, 0.08155445009469986, 0.13407714664936066, 0.18659985065460205, 0.23912253975868225, 0.29164522886276245, 0.34416794776916504, 0.39669063687324524, 0.44921332597732544, 0.501736044883728, 0.5542587041854858, 0.6067814230918884, 0.659304141998291, 0.7118268013000488, 0.7643495202064514, 0.816872239112854, 0.8693948984146118, 0.9219176173210144, 0.9744402766227722, 1.0269629955291748, 1.0794856548309326, 1.1320083141326904, 1.1845310926437378, 1.2370537519454956, 1.289576530456543, 1.3420991897583008, 1.3946219682693481, 1.447144627571106, 1.4996672868728638, 1.5521900653839111, 1.604712724685669, 1.6572353839874268, 1.7097580432891846]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 24.0, 36.0, 38.0, 51.0, 92.0, 135.0, 162.0, 242.0, 336.0, 519.0, 689.0, 963.0, 1382.0, 2038.0, 2832.0, 4048.0, 5811.0, 8235.0, 11989.0, 17376.0, 26442.0, 42261.0, 75081.0, 155818.0, 259413.0, 193594.0, 94127.0, 49895.0, 30597.0, 19953.0, 13534.0, 9223.0, 6476.0, 4457.0, 3132.0, 2269.0, 1583.0, 1054.0, 781.0, 553.0, 389.0, 285.0, 162.0, 146.0, 99.0, 71.0, 40.0, 34.0, 18.0, 9.0, 10.0, 12.0, 6.0, 11.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24068832397460938, -0.23308563232421875, -0.22548294067382812, -0.2178802490234375, -0.21027755737304688, -0.20267486572265625, -0.19507217407226562, -0.187469482421875, -0.17986679077148438, -0.17226409912109375, -0.16466140747070312, -0.1570587158203125, -0.14945602416992188, -0.14185333251953125, -0.13425064086914062, -0.12664794921875, -0.11904525756835938, -0.11144256591796875, -0.10383987426757812, -0.0962371826171875, -0.08863449096679688, -0.08103179931640625, -0.07342910766601562, -0.065826416015625, -0.058223724365234375, -0.05062103271484375, -0.043018341064453125, -0.0354156494140625, -0.027812957763671875, -0.02021026611328125, -0.012607574462890625, -0.0050048828125, 0.002597808837890625, 0.01020050048828125, 0.017803192138671875, 0.0254058837890625, 0.033008575439453125, 0.04061126708984375, 0.048213958740234375, 0.055816650390625, 0.06341934204101562, 0.07102203369140625, 0.07862472534179688, 0.0862274169921875, 0.09383010864257812, 0.10143280029296875, 0.10903549194335938, 0.11663818359375, 0.12424087524414062, 0.13184356689453125, 0.13944625854492188, 0.1470489501953125, 0.15465164184570312, 0.16225433349609375, 0.16985702514648438, 0.177459716796875, 0.18506240844726562, 0.19266510009765625, 0.20026779174804688, 0.2078704833984375, 0.21547317504882812, 0.22307586669921875, 0.23067855834960938, 0.23828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 10.0, 7.0, 13.0, 11.0, 13.0, 9.0, 23.0, 14.0, 20.0, 19.0, 30.0, 26.0, 30.0, 30.0, 43.0, 34.0, 36.0, 30.0, 37.0, 37.0, 38.0, 24.0, 40.0, 36.0, 35.0, 29.0, 40.0, 36.0, 35.0, 24.0, 27.0, 26.0, 17.0, 17.0, 9.0, 18.0, 15.0, 11.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19544219970703125, -0.1891021728515625, -0.18276214599609375, -0.176422119140625, -0.17008209228515625, -0.1637420654296875, -0.15740203857421875, -0.15106201171875, -0.14472198486328125, -0.1383819580078125, -0.13204193115234375, -0.125701904296875, -0.11936187744140625, -0.1130218505859375, -0.10668182373046875, -0.100341796875, -0.09400177001953125, -0.0876617431640625, -0.08132171630859375, -0.074981689453125, -0.06864166259765625, -0.0623016357421875, -0.05596160888671875, -0.04962158203125, -0.04328155517578125, -0.0369415283203125, -0.03060150146484375, -0.024261474609375, -0.01792144775390625, -0.0115814208984375, -0.00524139404296875, 0.0010986328125, 0.00743865966796875, 0.0137786865234375, 0.02011871337890625, 0.026458740234375, 0.03279876708984375, 0.0391387939453125, 0.04547882080078125, 0.05181884765625, 0.05815887451171875, 0.0644989013671875, 0.07083892822265625, 0.077178955078125, 0.08351898193359375, 0.0898590087890625, 0.09619903564453125, 0.1025390625, 0.10887908935546875, 0.1152191162109375, 0.12155914306640625, 0.127899169921875, 0.13423919677734375, 0.1405792236328125, 0.14691925048828125, 0.15325927734375, 0.15959930419921875, 0.1659393310546875, 0.17227935791015625, 0.178619384765625, 0.18495941162109375, 0.1912994384765625, 0.19763946533203125, 0.2039794921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 11.0, 21.0, 26.0, 31.0, 39.0, 56.0, 75.0, 86.0, 183.0, 290.0, 636.0, 1530.0, 4092.0, 11298.0, 31426.0, 95737.0, 459574.0, 330922.0, 72147.0, 25302.0, 9216.0, 3275.0, 1271.0, 547.0, 277.0, 150.0, 96.0, 69.0, 45.0, 35.0, 23.0, 16.0, 10.0, 7.0, 9.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5340576171875, -0.513427734375, -0.4927978515625, -0.47216796875, -0.4515380859375, -0.430908203125, -0.4102783203125, -0.3896484375, -0.3690185546875, -0.348388671875, -0.3277587890625, -0.30712890625, -0.2864990234375, -0.265869140625, -0.2452392578125, -0.224609375, -0.2039794921875, -0.183349609375, -0.1627197265625, -0.14208984375, -0.1214599609375, -0.100830078125, -0.0802001953125, -0.0595703125, -0.0389404296875, -0.018310546875, 0.0023193359375, 0.02294921875, 0.0435791015625, 0.064208984375, 0.0848388671875, 0.10546875, 0.1260986328125, 0.146728515625, 0.1673583984375, 0.18798828125, 0.2086181640625, 0.229248046875, 0.2498779296875, 0.2705078125, 0.2911376953125, 0.311767578125, 0.3323974609375, 0.35302734375, 0.3736572265625, 0.394287109375, 0.4149169921875, 0.435546875, 0.4561767578125, 0.476806640625, 0.4974365234375, 0.51806640625, 0.5386962890625, 0.559326171875, 0.5799560546875, 0.6005859375, 0.6212158203125, 0.641845703125, 0.6624755859375, 0.68310546875, 0.7037353515625, 0.724365234375, 0.7449951171875, 0.765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 10.0, 8.0, 16.0, 9.0, 15.0, 8.0, 14.0, 14.0, 18.0, 14.0, 23.0, 29.0, 27.0, 35.0, 36.0, 31.0, 35.0, 32.0, 29.0, 45.0, 48.0, 43.0, 30.0, 38.0, 40.0, 43.0, 28.0, 29.0, 27.0, 26.0, 27.0, 19.0, 27.0, 13.0, 18.0, 12.0, 12.0, 12.0, 5.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.583984375, -0.5655059814453125, -0.547027587890625, -0.5285491943359375, -0.51007080078125, -0.4915924072265625, -0.473114013671875, -0.4546356201171875, -0.4361572265625, -0.4176788330078125, -0.399200439453125, -0.3807220458984375, -0.36224365234375, -0.3437652587890625, -0.325286865234375, -0.3068084716796875, -0.288330078125, -0.2698516845703125, -0.251373291015625, -0.2328948974609375, -0.21441650390625, -0.1959381103515625, -0.177459716796875, -0.1589813232421875, -0.1405029296875, -0.1220245361328125, -0.103546142578125, -0.0850677490234375, -0.06658935546875, -0.0481109619140625, -0.029632568359375, -0.0111541748046875, 0.00732421875, 0.0258026123046875, 0.044281005859375, 0.0627593994140625, 0.08123779296875, 0.0997161865234375, 0.118194580078125, 0.1366729736328125, 0.1551513671875, 0.1736297607421875, 0.192108154296875, 0.2105865478515625, 0.22906494140625, 0.2475433349609375, 0.266021728515625, 0.2845001220703125, 0.302978515625, 0.3214569091796875, 0.339935302734375, 0.3584136962890625, 0.37689208984375, 0.3953704833984375, 0.413848876953125, 0.4323272705078125, 0.4508056640625, 0.4692840576171875, 0.487762451171875, 0.5062408447265625, 0.52471923828125, 0.5431976318359375, 0.561676025390625, 0.5801544189453125, 0.5986328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 20.0, 24.0, 39.0, 57.0, 121.0, 180.0, 260.0, 459.0, 810.0, 1528.0, 2818.0, 5388.0, 10245.0, 20042.0, 39621.0, 79952.0, 187037.0, 360622.0, 180861.0, 78585.0, 38827.0, 19698.0, 9878.0, 5193.0, 2686.0, 1528.0, 818.0, 479.0, 298.0, 171.0, 102.0, 58.0, 43.0, 28.0, 15.0, 12.0, 11.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.1590442657470703, -0.15414810180664062, -0.14925193786621094, -0.14435577392578125, -0.13945960998535156, -0.13456344604492188, -0.1296672821044922, -0.1247711181640625, -0.11987495422363281, -0.11497879028320312, -0.11008262634277344, -0.10518646240234375, -0.10029029846191406, -0.09539413452148438, -0.09049797058105469, -0.085601806640625, -0.08070564270019531, -0.07580947875976562, -0.07091331481933594, -0.06601715087890625, -0.06112098693847656, -0.056224822998046875, -0.05132865905761719, -0.0464324951171875, -0.04153633117675781, -0.036640167236328125, -0.03174400329589844, -0.02684783935546875, -0.021951675415039062, -0.017055511474609375, -0.012159347534179688, -0.00726318359375, -0.0023670196533203125, 0.002529144287109375, 0.0074253082275390625, 0.01232147216796875, 0.017217636108398438, 0.022113800048828125, 0.027009963989257812, 0.0319061279296875, 0.03680229187011719, 0.041698455810546875, 0.04659461975097656, 0.05149078369140625, 0.05638694763183594, 0.061283111572265625, 0.06617927551269531, 0.071075439453125, 0.07597160339355469, 0.08086776733398438, 0.08576393127441406, 0.09066009521484375, 0.09555625915527344, 0.10045242309570312, 0.10534858703613281, 0.1102447509765625, 0.11514091491699219, 0.12003707885742188, 0.12493324279785156, 0.12982940673828125, 0.13472557067871094, 0.13962173461914062, 0.1445178985595703, 0.1494140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 8.0, 5.0, 4.0, 11.0, 11.0, 12.0, 8.0, 11.0, 30.0, 38.0, 45.0, 80.0, 103.0, 154.0, 155.0, 106.0, 53.0, 40.0, 27.0, 24.0, 17.0, 7.0, 7.0, 12.0, 4.0, 5.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.55055046081543e-05, -6.376765668392181e-05, -6.202980875968933e-05, -6.029196083545685e-05, -5.8554112911224365e-05, -5.681626498699188e-05, -5.50784170627594e-05, -5.3340569138526917e-05, -5.1602721214294434e-05, -4.986487329006195e-05, -4.812702536582947e-05, -4.6389177441596985e-05, -4.46513295173645e-05, -4.291348159313202e-05, -4.1175633668899536e-05, -3.943778574466705e-05, -3.769993782043457e-05, -3.596208989620209e-05, -3.4224241971969604e-05, -3.248639404773712e-05, -3.074854612350464e-05, -2.9010698199272156e-05, -2.7272850275039673e-05, -2.553500235080719e-05, -2.3797154426574707e-05, -2.2059306502342224e-05, -2.032145857810974e-05, -1.8583610653877258e-05, -1.6845762729644775e-05, -1.5107914805412292e-05, -1.337006688117981e-05, -1.1632218956947327e-05, -9.894371032714844e-06, -8.15652310848236e-06, -6.418675184249878e-06, -4.680827260017395e-06, -2.942979335784912e-06, -1.2051314115524292e-06, 5.327165126800537e-07, 2.2705644369125366e-06, 4.0084123611450195e-06, 5.7462602853775024e-06, 7.484108209609985e-06, 9.221956133842468e-06, 1.0959804058074951e-05, 1.2697651982307434e-05, 1.4435499906539917e-05, 1.61733478307724e-05, 1.7911195755004883e-05, 1.9649043679237366e-05, 2.138689160346985e-05, 2.312473952770233e-05, 2.4862587451934814e-05, 2.6600435376167297e-05, 2.833828330039978e-05, 3.0076131224632263e-05, 3.1813979148864746e-05, 3.355182707309723e-05, 3.528967499732971e-05, 3.7027522921562195e-05, 3.876537084579468e-05, 4.050321877002716e-05, 4.2241066694259644e-05, 4.3978914618492126e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 6.0, 9.0, 13.0, 22.0, 26.0, 45.0, 46.0, 87.0, 122.0, 196.0, 330.0, 619.0, 1142.0, 2881.0, 8019.0, 29385.0, 121543.0, 511979.0, 285464.0, 61898.0, 16002.0, 4943.0, 1829.0, 801.0, 404.0, 266.0, 164.0, 103.0, 58.0, 39.0, 43.0, 15.0, 16.0, 15.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.313140869140625, -0.30328369140625, -0.293426513671875, -0.2835693359375, -0.273712158203125, -0.26385498046875, -0.253997802734375, -0.244140625, -0.234283447265625, -0.22442626953125, -0.214569091796875, -0.2047119140625, -0.194854736328125, -0.18499755859375, -0.175140380859375, -0.165283203125, -0.155426025390625, -0.14556884765625, -0.135711669921875, -0.1258544921875, -0.115997314453125, -0.10614013671875, -0.096282958984375, -0.08642578125, -0.076568603515625, -0.06671142578125, -0.056854248046875, -0.0469970703125, -0.037139892578125, -0.02728271484375, -0.017425537109375, -0.007568359375, 0.002288818359375, 0.01214599609375, 0.022003173828125, 0.0318603515625, 0.041717529296875, 0.05157470703125, 0.061431884765625, 0.0712890625, 0.081146240234375, 0.09100341796875, 0.100860595703125, 0.1107177734375, 0.120574951171875, 0.13043212890625, 0.140289306640625, 0.150146484375, 0.160003662109375, 0.16986083984375, 0.179718017578125, 0.1895751953125, 0.199432373046875, 0.20928955078125, 0.219146728515625, 0.22900390625, 0.238861083984375, 0.24871826171875, 0.258575439453125, 0.2684326171875, 0.278289794921875, 0.28814697265625, 0.298004150390625, 0.307861328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 10.0, 9.0, 10.0, 18.0, 17.0, 19.0, 25.0, 51.0, 53.0, 62.0, 93.0, 95.0, 110.0, 108.0, 73.0, 52.0, 46.0, 35.0, 25.0, 28.0, 12.0, 8.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18535423278808594, -0.17698287963867188, -0.1686115264892578, -0.16024017333984375, -0.1518688201904297, -0.14349746704101562, -0.13512611389160156, -0.1267547607421875, -0.11838340759277344, -0.11001205444335938, -0.10164070129394531, -0.09326934814453125, -0.08489799499511719, -0.07652664184570312, -0.06815528869628906, -0.059783935546875, -0.05141258239746094, -0.043041229248046875, -0.03466987609863281, -0.02629852294921875, -0.017927169799804688, -0.009555816650390625, -0.0011844635009765625, 0.0071868896484375, 0.015558242797851562, 0.023929595947265625, 0.03230094909667969, 0.04067230224609375, 0.04904365539550781, 0.057415008544921875, 0.06578636169433594, 0.07415771484375, 0.08252906799316406, 0.09090042114257812, 0.09927177429199219, 0.10764312744140625, 0.11601448059082031, 0.12438583374023438, 0.13275718688964844, 0.1411285400390625, 0.14949989318847656, 0.15787124633789062, 0.1662425994873047, 0.17461395263671875, 0.1829853057861328, 0.19135665893554688, 0.19972801208496094, 0.208099365234375, 0.21647071838378906, 0.22484207153320312, 0.2332134246826172, 0.24158477783203125, 0.2499561309814453, 0.2583274841308594, 0.26669883728027344, 0.2750701904296875, 0.28344154357910156, 0.2918128967285156, 0.3001842498779297, 0.30855560302734375, 0.3169269561767578, 0.3252983093261719, 0.33366966247558594, 0.342041015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 11.0, 17.0, 24.0, 39.0, 74.0, 114.0, 132.0, 160.0, 134.0, 116.0, 76.0, 56.0, 26.0, 14.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6895956993103027, -2.5931897163391113, -2.49678373336792, -2.4003775119781494, -2.303971529006958, -2.2075655460357666, -2.111159563064575, -2.0147533416748047, -1.9183473587036133, -1.8219413757324219, -1.725535273551941, -1.6291292905807495, -1.5327231884002686, -1.4363172054290771, -1.3399112224578857, -1.2435051202774048, -1.1470991373062134, -1.050693154335022, -0.954287052154541, -0.8578810691833496, -0.7614749670028687, -0.6650689840316772, -0.5686629414558411, -0.4722568988800049, -0.3758508563041687, -0.2794448137283325, -0.18303878605365753, -0.08663275837898254, 0.009773284196853638, 0.10617932677268982, 0.2025853395462036, 0.2989913821220398, 0.395397424697876, 0.49180346727371216, 0.5882095098495483, 0.6846154928207397, 0.7810215950012207, 0.8774275779724121, 0.9738336205482483, 1.0702396631240845, 1.1666457653045654, 1.2630517482757568, 1.3594578504562378, 1.4558638334274292, 1.5522699356079102, 1.6486759185791016, 1.745081901550293, 1.841488003730774, 1.9378939867019653, 2.0343000888824463, 2.1307060718536377, 2.227112054824829, 2.3235180377960205, 2.419924259185791, 2.5163302421569824, 2.612736225128174, 2.7091422080993652, 2.8055481910705566, 2.901954174041748, 2.9983603954315186, 3.09476637840271, 3.1911723613739014, 3.2875783443450928, 3.3839845657348633, 3.4803905487060547]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 2.0, 10.0, 2.0, 14.0, 15.0, 8.0, 14.0, 14.0, 20.0, 20.0, 25.0, 28.0, 15.0, 35.0, 37.0, 29.0, 37.0, 35.0, 36.0, 33.0, 42.0, 44.0, 46.0, 40.0, 33.0, 30.0, 38.0, 35.0, 34.0, 27.0, 25.0, 31.0, 35.0, 16.0, 17.0, 13.0, 15.0, 10.0, 5.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6608526706695557, -1.6099472045898438, -1.5590416193008423, -1.5081361532211304, -1.4572306871414185, -1.406325101852417, -1.355419635772705, -1.3045141696929932, -1.2536087036132812, -1.2027032375335693, -1.1517976522445679, -1.100892186164856, -1.049986720085144, -0.9990811944007874, -0.9481756687164307, -0.8972702026367188, -0.8463646173477173, -0.7954590916633606, -0.7445536255836487, -0.693648099899292, -0.6427426338195801, -0.5918371081352234, -0.5409315824508667, -0.4900260865688324, -0.4391205906867981, -0.3882150948047638, -0.3373095989227295, -0.2864040732383728, -0.2354985773563385, -0.1845930814743042, -0.1336875557899475, -0.08278205990791321, -0.031876564025878906, 0.019028939306735992, 0.06993444263935089, 0.12083995342254639, 0.1717454493045807, 0.222650945186615, 0.2735564708709717, 0.324461966753006, 0.3753674626350403, 0.4262729585170746, 0.4771784543991089, 0.5280839800834656, 0.5789895057678223, 0.6298949718475342, 0.6808004975318909, 0.7317060232162476, 0.7826114892959595, 0.8335170149803162, 0.8844224810600281, 0.9353280067443848, 0.9862334728240967, 1.0371389389038086, 1.08804452419281, 1.138949990272522, 1.1898555755615234, 1.2407610416412354, 1.2916666269302368, 1.3425720930099487, 1.3934775590896606, 1.444383144378662, 1.495288610458374, 1.546194076538086, 1.5970995426177979]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 17.0, 39.0, 72.0, 113.0, 200.0, 353.0, 640.0, 1121.0, 2100.0, 4094.0, 7596.0, 15377.0, 31978.0, 66776.0, 155947.0, 436657.0, 1515159.0, 1320887.0, 377192.0, 138161.0, 61332.0, 28884.0, 14202.0, 7183.0, 3779.0, 1979.0, 1072.0, 587.0, 320.0, 179.0, 102.0, 58.0, 35.0, 18.0, 11.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31640625, -0.30735015869140625, -0.2982940673828125, -0.28923797607421875, -0.280181884765625, -0.27112579345703125, -0.2620697021484375, -0.25301361083984375, -0.24395751953125, -0.23490142822265625, -0.2258453369140625, -0.21678924560546875, -0.207733154296875, -0.19867706298828125, -0.1896209716796875, -0.18056488037109375, -0.1715087890625, -0.16245269775390625, -0.1533966064453125, -0.14434051513671875, -0.135284423828125, -0.12622833251953125, -0.1171722412109375, -0.10811614990234375, -0.09906005859375, -0.09000396728515625, -0.0809478759765625, -0.07189178466796875, -0.062835693359375, -0.05377960205078125, -0.0447235107421875, -0.03566741943359375, -0.026611328125, -0.01755523681640625, -0.0084991455078125, 0.00055694580078125, 0.009613037109375, 0.01866912841796875, 0.0277252197265625, 0.03678131103515625, 0.04583740234375, 0.05489349365234375, 0.0639495849609375, 0.07300567626953125, 0.082061767578125, 0.09111785888671875, 0.1001739501953125, 0.10923004150390625, 0.1182861328125, 0.12734222412109375, 0.1363983154296875, 0.14545440673828125, 0.154510498046875, 0.16356658935546875, 0.1726226806640625, 0.18167877197265625, 0.19073486328125, 0.19979095458984375, 0.2088470458984375, 0.21790313720703125, 0.226959228515625, 0.23601531982421875, 0.2450714111328125, 0.25412750244140625, 0.26318359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 7.0, 8.0, 11.0, 11.0, 12.0, 12.0, 16.0, 20.0, 25.0, 17.0, 25.0, 25.0, 40.0, 37.0, 35.0, 39.0, 44.0, 36.0, 32.0, 42.0, 40.0, 33.0, 28.0, 36.0, 45.0, 41.0, 36.0, 28.0, 28.0, 18.0, 29.0, 23.0, 16.0, 17.0, 14.0, 10.0, 10.0, 10.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2269287109375, -0.22019386291503906, -0.21345901489257812, -0.2067241668701172, -0.19998931884765625, -0.1932544708251953, -0.18651962280273438, -0.17978477478027344, -0.1730499267578125, -0.16631507873535156, -0.15958023071289062, -0.1528453826904297, -0.14611053466796875, -0.1393756866455078, -0.13264083862304688, -0.12590599060058594, -0.119171142578125, -0.11243629455566406, -0.10570144653320312, -0.09896659851074219, -0.09223175048828125, -0.08549690246582031, -0.07876205444335938, -0.07202720642089844, -0.0652923583984375, -0.05855751037597656, -0.051822662353515625, -0.04508781433105469, -0.03835296630859375, -0.03161811828613281, -0.024883270263671875, -0.018148422241210938, -0.01141357421875, -0.0046787261962890625, 0.002056121826171875, 0.008790969848632812, 0.01552581787109375, 0.022260665893554688, 0.028995513916015625, 0.03573036193847656, 0.0424652099609375, 0.04920005798339844, 0.055934906005859375, 0.06266975402832031, 0.06940460205078125, 0.07613945007324219, 0.08287429809570312, 0.08960914611816406, 0.096343994140625, 0.10307884216308594, 0.10981369018554688, 0.11654853820800781, 0.12328338623046875, 0.1300182342529297, 0.13675308227539062, 0.14348793029785156, 0.1502227783203125, 0.15695762634277344, 0.16369247436523438, 0.1704273223876953, 0.17716217041015625, 0.1838970184326172, 0.19063186645507812, 0.19736671447753906, 0.2041015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 8.0, 9.0, 9.0, 9.0, 17.0, 23.0, 44.0, 48.0, 71.0, 95.0, 122.0, 190.0, 268.0, 388.0, 625.0, 950.0, 1554.0, 2669.0, 4606.0, 8302.0, 15351.0, 29333.0, 57764.0, 121274.0, 277970.0, 800134.0, 1672764.0, 715280.0, 255389.0, 112547.0, 54770.0, 27820.0, 14615.0, 7646.0, 4430.0, 2664.0, 1543.0, 1027.0, 617.0, 424.0, 302.0, 191.0, 126.0, 92.0, 64.0, 44.0, 23.0, 30.0, 22.0, 8.0, 6.0, 8.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0], "bins": [-0.33203125, -0.32180023193359375, -0.3115692138671875, -0.30133819580078125, -0.291107177734375, -0.28087615966796875, -0.2706451416015625, -0.26041412353515625, -0.25018310546875, -0.23995208740234375, -0.2297210693359375, -0.21949005126953125, -0.209259033203125, -0.19902801513671875, -0.1887969970703125, -0.17856597900390625, -0.1683349609375, -0.15810394287109375, -0.1478729248046875, -0.13764190673828125, -0.127410888671875, -0.11717987060546875, -0.1069488525390625, -0.09671783447265625, -0.08648681640625, -0.07625579833984375, -0.0660247802734375, -0.05579376220703125, -0.045562744140625, -0.03533172607421875, -0.0251007080078125, -0.01486968994140625, -0.004638671875, 0.00559234619140625, 0.0158233642578125, 0.02605438232421875, 0.036285400390625, 0.04651641845703125, 0.0567474365234375, 0.06697845458984375, 0.07720947265625, 0.08744049072265625, 0.0976715087890625, 0.10790252685546875, 0.118133544921875, 0.12836456298828125, 0.1385955810546875, 0.14882659912109375, 0.1590576171875, 0.16928863525390625, 0.1795196533203125, 0.18975067138671875, 0.199981689453125, 0.21021270751953125, 0.2204437255859375, 0.23067474365234375, 0.24090576171875, 0.25113677978515625, 0.2613677978515625, 0.27159881591796875, 0.281829833984375, 0.29206085205078125, 0.3022918701171875, 0.31252288818359375, 0.32275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 13.0, 9.0, 8.0, 13.0, 18.0, 21.0, 47.0, 53.0, 74.0, 81.0, 107.0, 175.0, 217.0, 350.0, 492.0, 568.0, 515.0, 367.0, 247.0, 173.0, 105.0, 94.0, 71.0, 63.0, 36.0, 29.0, 24.0, 21.0, 20.0, 12.0, 5.0, 8.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4225349426269531, -0.40781402587890625, -0.3930931091308594, -0.3783721923828125, -0.3636512756347656, -0.34893035888671875, -0.3342094421386719, -0.319488525390625, -0.3047676086425781, -0.29004669189453125, -0.2753257751464844, -0.2606048583984375, -0.24588394165039062, -0.23116302490234375, -0.21644210815429688, -0.20172119140625, -0.18700027465820312, -0.17227935791015625, -0.15755844116210938, -0.1428375244140625, -0.12811660766601562, -0.11339569091796875, -0.09867477416992188, -0.083953857421875, -0.06923294067382812, -0.05451202392578125, -0.039791107177734375, -0.0250701904296875, -0.010349273681640625, 0.00437164306640625, 0.019092559814453125, 0.0338134765625, 0.048534393310546875, 0.06325531005859375, 0.07797622680664062, 0.0926971435546875, 0.10741806030273438, 0.12213897705078125, 0.13685989379882812, 0.151580810546875, 0.16630172729492188, 0.18102264404296875, 0.19574356079101562, 0.2104644775390625, 0.22518539428710938, 0.23990631103515625, 0.2546272277832031, 0.26934814453125, 0.2840690612792969, 0.29878997802734375, 0.3135108947753906, 0.3282318115234375, 0.3429527282714844, 0.35767364501953125, 0.3723945617675781, 0.387115478515625, 0.4018363952636719, 0.41655731201171875, 0.4312782287597656, 0.4459991455078125, 0.4607200622558594, 0.47544097900390625, 0.4901618957519531, 0.5048828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 17.0, 24.0, 51.0, 61.0, 96.0, 142.0, 142.0, 158.0, 134.0, 82.0, 37.0, 21.0, 17.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5983855724334717, -2.477837324142456, -2.3572890758514404, -2.236740827560425, -2.11619234085083, -1.995644211769104, -1.8750958442687988, -1.7545475959777832, -1.6339993476867676, -1.513451099395752, -1.3929028511047363, -1.2723544836044312, -1.1518062353134155, -1.0312579870224, -0.9107096791267395, -0.7901613712310791, -0.6696131229400635, -0.5490648746490479, -0.42851656675338745, -0.30796828866004944, -0.18742001056671143, -0.0668717622756958, 0.0536765456199646, 0.174224853515625, 0.2947731018066406, 0.41532137989997864, 0.5358696579933167, 0.656417965888977, 0.7769662141799927, 0.8975144624710083, 1.0180628299713135, 1.138611078262329, 1.2591590881347656, 1.3797073364257812, 1.5002555847167969, 1.620803952217102, 1.7413522005081177, 1.8619004487991333, 1.9824488162994385, 2.102997064590454, 2.2235453128814697, 2.3440935611724854, 2.464641809463501, 2.5851900577545166, 2.7057385444641113, 2.826286792755127, 2.9468350410461426, 3.067383289337158, 3.187931537628174, 3.3084797859191895, 3.429028034210205, 3.5495762825012207, 3.6701245307922363, 3.790672779083252, 3.9112212657928467, 4.031769752502441, 4.152318000793457, 4.272866249084473, 4.393414497375488, 4.513962745666504, 4.6345109939575195, 4.755059242248535, 4.875607490539551, 4.996155738830566, 5.116703987121582]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 3.0, 6.0, 6.0, 6.0, 12.0, 18.0, 32.0, 14.0, 17.0, 28.0, 20.0, 28.0, 22.0, 30.0, 34.0, 43.0, 46.0, 33.0, 41.0, 42.0, 41.0, 45.0, 21.0, 39.0, 40.0, 36.0, 36.0, 24.0, 36.0, 28.0, 25.0, 19.0, 16.0, 23.0, 10.0, 12.0, 12.0, 9.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6624364852905273, -1.6146938800811768, -1.5669512748718262, -1.5192086696624756, -1.4714659452438354, -1.4237233400344849, -1.3759807348251343, -1.3282381296157837, -1.280495524406433, -1.2327529191970825, -1.185010313987732, -1.1372675895690918, -1.0895249843597412, -1.0417823791503906, -0.99403977394104, -0.9462971687316895, -0.8985545039176941, -0.8508118987083435, -0.8030692338943481, -0.7553266286849976, -0.707584023475647, -0.6598414182662964, -0.612098753452301, -0.5643561482429504, -0.5166134834289551, -0.4688708484172821, -0.4211282432079315, -0.37338560819625854, -0.32564300298690796, -0.277900367975235, -0.230157732963562, -0.18241512775421143, -0.13467252254486084, -0.08692990243434906, -0.03918727487325668, 0.008555352687835693, 0.05629797279834747, 0.10404059290885925, 0.15178322792053223, 0.1995258331298828, 0.2472684681415558, 0.29501110315322876, 0.34275370836257935, 0.3904963433742523, 0.4382389783859253, 0.4859815835952759, 0.5337241888046265, 0.581466794013977, 0.6292094588279724, 0.676952064037323, 0.7246947288513184, 0.772437334060669, 0.8201799392700195, 0.8679225444793701, 0.9156652092933655, 0.9634078145027161, 1.0111504793167114, 1.058893084526062, 1.1066356897354126, 1.1543784141540527, 1.2021210193634033, 1.249863624572754, 1.2976062297821045, 1.345348834991455, 1.3930914402008057]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 4.0, 6.0, 11.0, 6.0, 7.0, 26.0, 28.0, 46.0, 88.0, 141.0, 193.0, 315.0, 542.0, 798.0, 1369.0, 2210.0, 3514.0, 5828.0, 9698.0, 17448.0, 34884.0, 81608.0, 210782.0, 339709.0, 192245.0, 75006.0, 32280.0, 16325.0, 9183.0, 5444.0, 3401.0, 2099.0, 1192.0, 793.0, 502.0, 308.0, 187.0, 99.0, 75.0, 44.0, 35.0, 24.0, 18.0, 4.0, 8.0, 6.0, 4.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.33544921875, -0.32511138916015625, -0.3147735595703125, -0.30443572998046875, -0.294097900390625, -0.28376007080078125, -0.2734222412109375, -0.26308441162109375, -0.25274658203125, -0.24240875244140625, -0.2320709228515625, -0.22173309326171875, -0.211395263671875, -0.20105743408203125, -0.1907196044921875, -0.18038177490234375, -0.1700439453125, -0.15970611572265625, -0.1493682861328125, -0.13903045654296875, -0.128692626953125, -0.11835479736328125, -0.1080169677734375, -0.09767913818359375, -0.08734130859375, -0.07700347900390625, -0.0666656494140625, -0.05632781982421875, -0.045989990234375, -0.03565216064453125, -0.0253143310546875, -0.01497650146484375, -0.004638671875, 0.00569915771484375, 0.0160369873046875, 0.02637481689453125, 0.036712646484375, 0.04705047607421875, 0.0573883056640625, 0.06772613525390625, 0.07806396484375, 0.08840179443359375, 0.0987396240234375, 0.10907745361328125, 0.119415283203125, 0.12975311279296875, 0.1400909423828125, 0.15042877197265625, 0.1607666015625, 0.17110443115234375, 0.1814422607421875, 0.19178009033203125, 0.202117919921875, 0.21245574951171875, 0.2227935791015625, 0.23313140869140625, 0.24346923828125, 0.25380706787109375, 0.2641448974609375, 0.27448272705078125, 0.284820556640625, 0.29515838623046875, 0.3054962158203125, 0.31583404541015625, 0.326171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 10.0, 4.0, 13.0, 10.0, 23.0, 14.0, 8.0, 21.0, 18.0, 25.0, 29.0, 35.0, 40.0, 32.0, 30.0, 29.0, 32.0, 39.0, 37.0, 41.0, 38.0, 34.0, 34.0, 45.0, 34.0, 33.0, 39.0, 25.0, 30.0, 27.0, 25.0, 14.0, 15.0, 20.0, 14.0, 8.0, 10.0, 6.0, 6.0, 7.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.22412109375, -0.2174396514892578, -0.21075820922851562, -0.20407676696777344, -0.19739532470703125, -0.19071388244628906, -0.18403244018554688, -0.1773509979248047, -0.1706695556640625, -0.1639881134033203, -0.15730667114257812, -0.15062522888183594, -0.14394378662109375, -0.13726234436035156, -0.13058090209960938, -0.12389945983886719, -0.117218017578125, -0.11053657531738281, -0.10385513305664062, -0.09717369079589844, -0.09049224853515625, -0.08381080627441406, -0.07712936401367188, -0.07044792175292969, -0.0637664794921875, -0.05708503723144531, -0.050403594970703125, -0.04372215270996094, -0.03704071044921875, -0.030359268188476562, -0.023677825927734375, -0.016996383666992188, -0.01031494140625, -0.0036334991455078125, 0.003047943115234375, 0.009729385375976562, 0.01641082763671875, 0.023092269897460938, 0.029773712158203125, 0.03645515441894531, 0.0431365966796875, 0.04981803894042969, 0.056499481201171875, 0.06318092346191406, 0.06986236572265625, 0.07654380798339844, 0.08322525024414062, 0.08990669250488281, 0.096588134765625, 0.10326957702636719, 0.10995101928710938, 0.11663246154785156, 0.12331390380859375, 0.12999534606933594, 0.13667678833007812, 0.1433582305908203, 0.1500396728515625, 0.1567211151123047, 0.16340255737304688, 0.17008399963378906, 0.17676544189453125, 0.18344688415527344, 0.19012832641601562, 0.1968097686767578, 0.2034912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 13.0, 15.0, 19.0, 20.0, 29.0, 38.0, 49.0, 90.0, 146.0, 258.0, 509.0, 1238.0, 3026.0, 8416.0, 25099.0, 96988.0, 418537.0, 375769.0, 83223.0, 22448.0, 7450.0, 2882.0, 1140.0, 505.0, 248.0, 144.0, 71.0, 56.0, 36.0, 22.0, 14.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5989303588867188, -0.5801849365234375, -0.5614395141601562, -0.542694091796875, -0.5239486694335938, -0.5052032470703125, -0.48645782470703125, -0.46771240234375, -0.44896697998046875, -0.4302215576171875, -0.41147613525390625, -0.392730712890625, -0.37398529052734375, -0.3552398681640625, -0.33649444580078125, -0.3177490234375, -0.29900360107421875, -0.2802581787109375, -0.26151275634765625, -0.242767333984375, -0.22402191162109375, -0.2052764892578125, -0.18653106689453125, -0.16778564453125, -0.14904022216796875, -0.1302947998046875, -0.11154937744140625, -0.092803955078125, -0.07405853271484375, -0.0553131103515625, -0.03656768798828125, -0.017822265625, 0.00092315673828125, 0.0196685791015625, 0.03841400146484375, 0.057159423828125, 0.07590484619140625, 0.0946502685546875, 0.11339569091796875, 0.13214111328125, 0.15088653564453125, 0.1696319580078125, 0.18837738037109375, 0.207122802734375, 0.22586822509765625, 0.2446136474609375, 0.26335906982421875, 0.2821044921875, 0.30084991455078125, 0.3195953369140625, 0.33834075927734375, 0.357086181640625, 0.37583160400390625, 0.3945770263671875, 0.41332244873046875, 0.43206787109375, 0.45081329345703125, 0.4695587158203125, 0.48830413818359375, 0.507049560546875, 0.5257949829101562, 0.5445404052734375, 0.5632858276367188, 0.58203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 10.0, 11.0, 12.0, 19.0, 25.0, 21.0, 21.0, 33.0, 34.0, 29.0, 31.0, 28.0, 38.0, 40.0, 45.0, 36.0, 41.0, 41.0, 38.0, 52.0, 42.0, 36.0, 27.0, 32.0, 29.0, 29.0, 27.0, 26.0, 26.0, 21.0, 16.0, 16.0, 12.0, 9.0, 4.0, 8.0, 5.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.673828125, -0.6527786254882812, -0.6317291259765625, -0.6106796264648438, -0.589630126953125, -0.5685806274414062, -0.5475311279296875, -0.5264816284179688, -0.50543212890625, -0.48438262939453125, -0.4633331298828125, -0.44228363037109375, -0.421234130859375, -0.40018463134765625, -0.3791351318359375, -0.35808563232421875, -0.3370361328125, -0.31598663330078125, -0.2949371337890625, -0.27388763427734375, -0.252838134765625, -0.23178863525390625, -0.2107391357421875, -0.18968963623046875, -0.16864013671875, -0.14759063720703125, -0.1265411376953125, -0.10549163818359375, -0.084442138671875, -0.06339263916015625, -0.0423431396484375, -0.02129364013671875, -0.000244140625, 0.02080535888671875, 0.0418548583984375, 0.06290435791015625, 0.083953857421875, 0.10500335693359375, 0.1260528564453125, 0.14710235595703125, 0.16815185546875, 0.18920135498046875, 0.2102508544921875, 0.23130035400390625, 0.252349853515625, 0.27339935302734375, 0.2944488525390625, 0.31549835205078125, 0.3365478515625, 0.35759735107421875, 0.3786468505859375, 0.39969635009765625, 0.420745849609375, 0.44179534912109375, 0.4628448486328125, 0.48389434814453125, 0.50494384765625, 0.5259933471679688, 0.5470428466796875, 0.5680923461914062, 0.589141845703125, 0.6101913452148438, 0.6312408447265625, 0.6522903442382812, 0.67333984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 6.0, 12.0, 15.0, 26.0, 24.0, 26.0, 66.0, 86.0, 155.0, 256.0, 420.0, 755.0, 1364.0, 2420.0, 4685.0, 8954.0, 17360.0, 35296.0, 77256.0, 189204.0, 332982.0, 211852.0, 86911.0, 38661.0, 18838.0, 9755.0, 5154.0, 2615.0, 1483.0, 746.0, 441.0, 244.0, 154.0, 94.0, 90.0, 38.0, 25.0, 24.0, 11.0, 17.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.1486339569091797, -0.14406967163085938, -0.13950538635253906, -0.13494110107421875, -0.13037681579589844, -0.12581253051757812, -0.12124824523925781, -0.1166839599609375, -0.11211967468261719, -0.10755538940429688, -0.10299110412597656, -0.09842681884765625, -0.09386253356933594, -0.08929824829101562, -0.08473396301269531, -0.080169677734375, -0.07560539245605469, -0.07104110717773438, -0.06647682189941406, -0.06191253662109375, -0.05734825134277344, -0.052783966064453125, -0.04821968078613281, -0.0436553955078125, -0.03909111022949219, -0.034526824951171875, -0.029962539672851562, -0.02539825439453125, -0.020833969116210938, -0.016269683837890625, -0.011705398559570312, -0.00714111328125, -0.0025768280029296875, 0.001987457275390625, 0.0065517425537109375, 0.01111602783203125, 0.015680313110351562, 0.020244598388671875, 0.024808883666992188, 0.0293731689453125, 0.03393745422363281, 0.038501739501953125, 0.04306602478027344, 0.04763031005859375, 0.05219459533691406, 0.056758880615234375, 0.06132316589355469, 0.065887451171875, 0.07045173645019531, 0.07501602172851562, 0.07958030700683594, 0.08414459228515625, 0.08870887756347656, 0.09327316284179688, 0.09783744812011719, 0.1024017333984375, 0.10696601867675781, 0.11153030395507812, 0.11609458923339844, 0.12065887451171875, 0.12522315979003906, 0.12978744506835938, 0.1343517303466797, 0.138916015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 9.0, 4.0, 8.0, 15.0, 22.0, 35.0, 36.0, 76.0, 107.0, 129.0, 151.0, 147.0, 88.0, 55.0, 25.0, 24.0, 22.0, 9.0, 10.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.175041198730469e-05, -5.98980113863945e-05, -5.8045610785484314e-05, -5.619321018457413e-05, -5.434080958366394e-05, -5.2488408982753754e-05, -5.063600838184357e-05, -4.878360778093338e-05, -4.693120718002319e-05, -4.5078806579113007e-05, -4.322640597820282e-05, -4.137400537729263e-05, -3.9521604776382446e-05, -3.766920417547226e-05, -3.581680357456207e-05, -3.3964402973651886e-05, -3.21120023727417e-05, -3.0259601771831512e-05, -2.8407201170921326e-05, -2.655480057001114e-05, -2.4702399969100952e-05, -2.2849999368190765e-05, -2.099759876728058e-05, -1.9145198166370392e-05, -1.7292797565460205e-05, -1.544039696455002e-05, -1.3587996363639832e-05, -1.1735595762729645e-05, -9.883195161819458e-06, -8.030794560909271e-06, -6.1783939599990845e-06, -4.325993359088898e-06, -2.473592758178711e-06, -6.211921572685242e-07, 1.2312084436416626e-06, 3.0836090445518494e-06, 4.936009645462036e-06, 6.788410246372223e-06, 8.64081084728241e-06, 1.0493211448192596e-05, 1.2345612049102783e-05, 1.419801265001297e-05, 1.6050413250923157e-05, 1.7902813851833344e-05, 1.975521445274353e-05, 2.1607615053653717e-05, 2.3460015654563904e-05, 2.531241625547409e-05, 2.7164816856384277e-05, 2.9017217457294464e-05, 3.086961805820465e-05, 3.272201865911484e-05, 3.4574419260025024e-05, 3.642681986093521e-05, 3.82792204618454e-05, 4.0131621062755585e-05, 4.198402166366577e-05, 4.383642226457596e-05, 4.5688822865486145e-05, 4.754122346639633e-05, 4.939362406730652e-05, 5.1246024668216705e-05, 5.309842526912689e-05, 5.495082587003708e-05, 5.6803226470947266e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 17.0, 21.0, 24.0, 34.0, 58.0, 82.0, 116.0, 184.0, 294.0, 591.0, 989.0, 2095.0, 4625.0, 10606.0, 24878.0, 61074.0, 159617.0, 330501.0, 268442.0, 109193.0, 42758.0, 17909.0, 7507.0, 3406.0, 1573.0, 831.0, 432.0, 266.0, 153.0, 97.0, 64.0, 37.0, 23.0, 19.0, 9.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.2047119140625, -0.1992969512939453, -0.19388198852539062, -0.18846702575683594, -0.18305206298828125, -0.17763710021972656, -0.17222213745117188, -0.1668071746826172, -0.1613922119140625, -0.1559772491455078, -0.15056228637695312, -0.14514732360839844, -0.13973236083984375, -0.13431739807128906, -0.12890243530273438, -0.12348747253417969, -0.118072509765625, -0.11265754699707031, -0.10724258422851562, -0.10182762145996094, -0.09641265869140625, -0.09099769592285156, -0.08558273315429688, -0.08016777038574219, -0.0747528076171875, -0.06933784484863281, -0.06392288208007812, -0.05850791931152344, -0.05309295654296875, -0.04767799377441406, -0.042263031005859375, -0.03684806823730469, -0.03143310546875, -0.026018142700195312, -0.020603179931640625, -0.015188217163085938, -0.00977325439453125, -0.0043582916259765625, 0.001056671142578125, 0.0064716339111328125, 0.0118865966796875, 0.017301559448242188, 0.022716522216796875, 0.028131484985351562, 0.03354644775390625, 0.03896141052246094, 0.044376373291015625, 0.04979133605957031, 0.055206298828125, 0.06062126159667969, 0.06603622436523438, 0.07145118713378906, 0.07686614990234375, 0.08228111267089844, 0.08769607543945312, 0.09311103820800781, 0.0985260009765625, 0.10394096374511719, 0.10935592651367188, 0.11477088928222656, 0.12018585205078125, 0.12560081481933594, 0.13101577758789062, 0.1364307403564453, 0.141845703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 10.0, 14.0, 14.0, 17.0, 25.0, 34.0, 35.0, 50.0, 64.0, 81.0, 96.0, 89.0, 78.0, 62.0, 71.0, 44.0, 42.0, 31.0, 19.0, 19.0, 21.0, 16.0, 10.0, 5.0, 12.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2451171875, -0.23901939392089844, -0.23292160034179688, -0.2268238067626953, -0.22072601318359375, -0.2146282196044922, -0.20853042602539062, -0.20243263244628906, -0.1963348388671875, -0.19023704528808594, -0.18413925170898438, -0.1780414581298828, -0.17194366455078125, -0.1658458709716797, -0.15974807739257812, -0.15365028381347656, -0.147552490234375, -0.14145469665527344, -0.13535690307617188, -0.1292591094970703, -0.12316131591796875, -0.11706352233886719, -0.11096572875976562, -0.10486793518066406, -0.0987701416015625, -0.09267234802246094, -0.08657455444335938, -0.08047676086425781, -0.07437896728515625, -0.06828117370605469, -0.062183380126953125, -0.05608558654785156, -0.04998779296875, -0.04388999938964844, -0.037792205810546875, -0.03169441223144531, -0.02559661865234375, -0.019498825073242188, -0.013401031494140625, -0.0073032379150390625, -0.0012054443359375, 0.0048923492431640625, 0.010990142822265625, 0.017087936401367188, 0.02318572998046875, 0.029283523559570312, 0.035381317138671875, 0.04147911071777344, 0.047576904296875, 0.05367469787597656, 0.059772491455078125, 0.06587028503417969, 0.07196807861328125, 0.07806587219238281, 0.08416366577148438, 0.09026145935058594, 0.0963592529296875, 0.10245704650878906, 0.10855484008789062, 0.11465263366699219, 0.12075042724609375, 0.1268482208251953, 0.13294601440429688, 0.13904380798339844, 0.1451416015625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 19.0, 44.0, 100.0, 123.0, 175.0, 176.0, 151.0, 82.0, 51.0, 36.0, 14.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1311469078063965, -2.034599542617798, -1.9380521774291992, -1.8415048122406006, -1.7449575662612915, -1.6484102010726929, -1.5518628358840942, -1.4553155899047852, -1.3587682247161865, -1.262220859527588, -1.1656734943389893, -1.0691261291503906, -0.9725788831710815, -0.8760315179824829, -0.7794841527938843, -0.6829368472099304, -0.586389422416687, -0.48984208703041077, -0.3932947516441345, -0.2967473864555359, -0.20020005106925964, -0.1036527156829834, -0.007105350494384766, 0.08944195508956909, 0.18598932027816772, 0.28253665566444397, 0.3790839910507202, 0.47563135623931885, 0.5721787214279175, 0.6687260270118713, 0.76527339220047, 0.8618206977844238, 0.9583680629730225, 1.054915428161621, 1.1514627933502197, 1.2480101585388184, 1.3445574045181274, 1.441104769706726, 1.5376521348953247, 1.6341993808746338, 1.7307467460632324, 1.827294111251831, 1.9238414764404297, 2.0203888416290283, 2.116936206817627, 2.2134833335876465, 2.310030937194824, 2.4065780639648438, 2.5031256675720215, 2.59967303276062, 2.6962203979492188, 2.7927677631378174, 2.889315128326416, 2.9858622550964355, 3.0824098587036133, 3.178956985473633, 3.2755043506622314, 3.37205171585083, 3.4685990810394287, 3.5651464462280273, 3.661693811416626, 3.7582411766052246, 3.854788303375244, 3.9513356685638428, 4.047883033752441]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 6.0, 9.0, 10.0, 12.0, 14.0, 17.0, 16.0, 19.0, 25.0, 27.0, 21.0, 25.0, 29.0, 35.0, 36.0, 33.0, 33.0, 44.0, 29.0, 44.0, 45.0, 51.0, 50.0, 35.0, 38.0, 35.0, 36.0, 32.0, 21.0, 28.0, 19.0, 19.0, 17.0, 8.0, 16.0, 12.0, 9.0, 9.0, 5.0, 6.0, 7.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6426702737808228, -1.5931708812713623, -1.5436713695526123, -1.4941719770431519, -1.4446724653244019, -1.3951730728149414, -1.3456735610961914, -1.296174168586731, -1.2466747760772705, -1.19717538356781, -1.14767587184906, -1.0981764793395996, -1.0486769676208496, -0.9991775751113892, -0.9496781229972839, -0.9001786708831787, -0.8506791591644287, -0.8011797070503235, -0.7516802549362183, -0.7021808624267578, -0.6526813507080078, -0.6031819581985474, -0.5536825060844421, -0.5041830539703369, -0.4546836018562317, -0.40518414974212646, -0.35568469762802124, -0.3061852753162384, -0.2566858232021332, -0.20718637108802795, -0.15768694877624512, -0.10818749666213989, -0.05868816375732422, -0.009188719093799591, 0.04031072556972504, 0.08981016278266907, 0.1393096148967743, 0.18880906701087952, 0.23830848932266235, 0.2878079414367676, 0.3373073935508728, 0.386806845664978, 0.43630629777908325, 0.4858057200908661, 0.5353051424026489, 0.5848046541213989, 0.6343040466308594, 0.6838034987449646, 0.7333029508590698, 0.782802402973175, 0.8323018550872803, 0.8818012475967407, 0.9313007593154907, 0.9808001518249512, 1.0302996635437012, 1.0797990560531616, 1.129298448562622, 1.1787978410720825, 1.2282973527908325, 1.277796745300293, 1.327296257019043, 1.3767956495285034, 1.4262950420379639, 1.4757945537567139, 1.5252940654754639]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 12.0, 12.0, 23.0, 31.0, 46.0, 55.0, 103.0, 191.0, 320.0, 603.0, 1161.0, 2327.0, 4723.0, 10117.0, 21099.0, 45593.0, 105058.0, 270214.0, 823175.0, 1658288.0, 795633.0, 265838.0, 104592.0, 45483.0, 20632.0, 9793.0, 4519.0, 2182.0, 1075.0, 546.0, 328.0, 163.0, 111.0, 73.0, 41.0, 31.0, 22.0, 12.0, 14.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.301513671875, -0.29193878173828125, -0.2823638916015625, -0.27278900146484375, -0.263214111328125, -0.25363922119140625, -0.2440643310546875, -0.23448944091796875, -0.22491455078125, -0.21533966064453125, -0.2057647705078125, -0.19618988037109375, -0.186614990234375, -0.17704010009765625, -0.1674652099609375, -0.15789031982421875, -0.1483154296875, -0.13874053955078125, -0.1291656494140625, -0.11959075927734375, -0.110015869140625, -0.10044097900390625, -0.0908660888671875, -0.08129119873046875, -0.07171630859375, -0.06214141845703125, -0.0525665283203125, -0.04299163818359375, -0.033416748046875, -0.02384185791015625, -0.0142669677734375, -0.00469207763671875, 0.0048828125, 0.01445770263671875, 0.0240325927734375, 0.03360748291015625, 0.043182373046875, 0.05275726318359375, 0.0623321533203125, 0.07190704345703125, 0.08148193359375, 0.09105682373046875, 0.1006317138671875, 0.11020660400390625, 0.119781494140625, 0.12935638427734375, 0.1389312744140625, 0.14850616455078125, 0.1580810546875, 0.16765594482421875, 0.1772308349609375, 0.18680572509765625, 0.196380615234375, 0.20595550537109375, 0.2155303955078125, 0.22510528564453125, 0.23468017578125, 0.24425506591796875, 0.2538299560546875, 0.26340484619140625, 0.272979736328125, 0.28255462646484375, 0.2921295166015625, 0.30170440673828125, 0.311279296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 2.0, 8.0, 9.0, 10.0, 9.0, 14.0, 13.0, 16.0, 16.0, 28.0, 27.0, 21.0, 21.0, 26.0, 40.0, 44.0, 30.0, 47.0, 50.0, 29.0, 52.0, 33.0, 45.0, 33.0, 24.0, 35.0, 50.0, 37.0, 32.0, 28.0, 27.0, 25.0, 15.0, 14.0, 23.0, 11.0, 11.0, 5.0, 12.0, 6.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2265625, -0.21941757202148438, -0.21227264404296875, -0.20512771606445312, -0.1979827880859375, -0.19083786010742188, -0.18369293212890625, -0.17654800415039062, -0.169403076171875, -0.16225814819335938, -0.15511322021484375, -0.14796829223632812, -0.1408233642578125, -0.13367843627929688, -0.12653350830078125, -0.11938858032226562, -0.11224365234375, -0.10509872436523438, -0.09795379638671875, -0.09080886840820312, -0.0836639404296875, -0.07651901245117188, -0.06937408447265625, -0.062229156494140625, -0.055084228515625, -0.047939300537109375, -0.04079437255859375, -0.033649444580078125, -0.0265045166015625, -0.019359588623046875, -0.01221466064453125, -0.005069732666015625, 0.0020751953125, 0.009220123291015625, 0.01636505126953125, 0.023509979248046875, 0.0306549072265625, 0.037799835205078125, 0.04494476318359375, 0.052089691162109375, 0.059234619140625, 0.06637954711914062, 0.07352447509765625, 0.08066940307617188, 0.0878143310546875, 0.09495925903320312, 0.10210418701171875, 0.10924911499023438, 0.11639404296875, 0.12353897094726562, 0.13068389892578125, 0.13782882690429688, 0.1449737548828125, 0.15211868286132812, 0.15926361083984375, 0.16640853881835938, 0.173553466796875, 0.18069839477539062, 0.18784332275390625, 0.19498825073242188, 0.2021331787109375, 0.20927810668945312, 0.21642303466796875, 0.22356796264648438, 0.230712890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 12.0, 13.0, 9.0, 24.0, 33.0, 57.0, 83.0, 124.0, 210.0, 386.0, 667.0, 1336.0, 2629.0, 5578.0, 12598.0, 29499.0, 72185.0, 191539.0, 613407.0, 1966622.0, 887494.0, 251030.0, 92150.0, 37151.0, 15932.0, 6849.0, 3253.0, 1523.0, 765.0, 421.0, 233.0, 180.0, 104.0, 61.0, 39.0, 21.0, 14.0, 21.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3874092102050781, -0.37516021728515625, -0.3629112243652344, -0.3506622314453125, -0.3384132385253906, -0.32616424560546875, -0.3139152526855469, -0.301666259765625, -0.2894172668457031, -0.27716827392578125, -0.2649192810058594, -0.2526702880859375, -0.24042129516601562, -0.22817230224609375, -0.21592330932617188, -0.20367431640625, -0.19142532348632812, -0.17917633056640625, -0.16692733764648438, -0.1546783447265625, -0.14242935180664062, -0.13018035888671875, -0.11793136596679688, -0.105682373046875, -0.09343338012695312, -0.08118438720703125, -0.06893539428710938, -0.0566864013671875, -0.044437408447265625, -0.03218841552734375, -0.019939422607421875, -0.0076904296875, 0.004558563232421875, 0.01680755615234375, 0.029056549072265625, 0.0413055419921875, 0.053554534912109375, 0.06580352783203125, 0.07805252075195312, 0.090301513671875, 0.10255050659179688, 0.11479949951171875, 0.12704849243164062, 0.1392974853515625, 0.15154647827148438, 0.16379547119140625, 0.17604446411132812, 0.18829345703125, 0.20054244995117188, 0.21279144287109375, 0.22504043579101562, 0.2372894287109375, 0.24953842163085938, 0.26178741455078125, 0.2740364074707031, 0.286285400390625, 0.2985343933105469, 0.31078338623046875, 0.3230323791503906, 0.3352813720703125, 0.3475303649902344, 0.35977935791015625, 0.3720283508300781, 0.38427734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 7.0, 11.0, 11.0, 16.0, 22.0, 26.0, 39.0, 39.0, 51.0, 84.0, 124.0, 152.0, 209.0, 329.0, 456.0, 596.0, 542.0, 365.0, 248.0, 203.0, 131.0, 96.0, 57.0, 63.0, 54.0, 34.0, 28.0, 22.0, 18.0, 9.0, 8.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.467041015625, -0.4507789611816406, -0.43451690673828125, -0.4182548522949219, -0.4019927978515625, -0.3857307434082031, -0.36946868896484375, -0.3532066345214844, -0.336944580078125, -0.3206825256347656, -0.30442047119140625, -0.2881584167480469, -0.2718963623046875, -0.2556343078613281, -0.23937225341796875, -0.22311019897460938, -0.20684814453125, -0.19058609008789062, -0.17432403564453125, -0.15806198120117188, -0.1417999267578125, -0.12553787231445312, -0.10927581787109375, -0.09301376342773438, -0.076751708984375, -0.060489654541015625, -0.04422760009765625, -0.027965545654296875, -0.0117034912109375, 0.004558563232421875, 0.02082061767578125, 0.037082672119140625, 0.0533447265625, 0.06960678100585938, 0.08586883544921875, 0.10213088989257812, 0.1183929443359375, 0.13465499877929688, 0.15091705322265625, 0.16717910766601562, 0.183441162109375, 0.19970321655273438, 0.21596527099609375, 0.23222732543945312, 0.2484893798828125, 0.2647514343261719, 0.28101348876953125, 0.2972755432128906, 0.31353759765625, 0.3297996520996094, 0.34606170654296875, 0.3623237609863281, 0.3785858154296875, 0.3948478698730469, 0.41110992431640625, 0.4273719787597656, 0.443634033203125, 0.4598960876464844, 0.47615814208984375, 0.4924201965332031, 0.5086822509765625, 0.5249443054199219, 0.5412063598632812, 0.5574684143066406, 0.57373046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 7.0, 10.0, 19.0, 16.0, 22.0, 33.0, 41.0, 50.0, 70.0, 85.0, 71.0, 95.0, 90.0, 90.0, 72.0, 53.0, 47.0, 42.0, 25.0, 15.0, 16.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7945706844329834, -1.7246588468551636, -1.6547470092773438, -1.584835171699524, -1.514923334121704, -1.4450114965438843, -1.3750996589660645, -1.3051879405975342, -1.2352759838104248, -1.165364146232605, -1.0954523086547852, -1.0255404710769653, -0.9556286334991455, -0.8857167959213257, -0.8158050179481506, -0.7458931803703308, -0.6759814023971558, -0.6060695648193359, -0.5361577272415161, -0.4662459194660187, -0.39633408188819885, -0.32642224431037903, -0.2565104365348816, -0.18659859895706177, -0.11668676137924194, -0.046774931252002716, 0.02313689887523651, 0.09304872155189514, 0.16296055912971497, 0.2328723967075348, 0.3027842044830322, 0.37269604206085205, 0.4426078796386719, 0.5125197172164917, 0.5824315547943115, 0.6523433923721313, 0.7222552299499512, 0.792167067527771, 0.862078845500946, 0.9319906830787659, 1.0019025802612305, 1.0718144178390503, 1.1417262554168701, 1.21163809299469, 1.2815499305725098, 1.3514617681503296, 1.4213736057281494, 1.4912853240966797, 1.5611971616744995, 1.6311089992523193, 1.7010208368301392, 1.770932674407959, 1.8408445119857788, 1.9107563495635986, 1.980668067932129, 2.0505800247192383, 2.1204917430877686, 2.190403461456299, 2.260315418243408, 2.3302271366119385, 2.400139093399048, 2.470050811767578, 2.5399627685546875, 2.6098744869232178, 2.679786443710327]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 8.0, 7.0, 8.0, 4.0, 9.0, 8.0, 11.0, 10.0, 20.0, 12.0, 17.0, 23.0, 21.0, 23.0, 28.0, 25.0, 34.0, 27.0, 39.0, 34.0, 31.0, 35.0, 38.0, 42.0, 34.0, 39.0, 33.0, 42.0, 39.0, 31.0, 20.0, 22.0, 32.0, 25.0, 20.0, 13.0, 9.0, 25.0, 9.0, 14.0, 17.0, 18.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0], "bins": [-1.3539042472839355, -1.3137092590332031, -1.2735143899917603, -1.2333194017410278, -1.193124532699585, -1.1529295444488525, -1.1127345561981201, -1.0725395679473877, -1.0323446989059448, -0.9921497702598572, -0.9519548416137695, -0.9117598533630371, -0.8715649247169495, -0.8313699960708618, -0.7911750078201294, -0.7509800791740417, -0.7107851505279541, -0.6705902218818665, -0.6303952932357788, -0.5902003049850464, -0.5500053763389587, -0.5098104476928711, -0.46961548924446106, -0.429420530796051, -0.3892256021499634, -0.34903067350387573, -0.3088357150554657, -0.26864075660705566, -0.22844582796096802, -0.18825088441371918, -0.14805594086647034, -0.1078609824180603, -0.06766605377197266, -0.027471110224723816, 0.012723833322525024, 0.052918776869773865, 0.0931137204170227, 0.13330866396427155, 0.17350360751152039, 0.21369856595993042, 0.25389349460601807, 0.2940884232521057, 0.33428338170051575, 0.3744783401489258, 0.4146732687950134, 0.4548681974411011, 0.4950631558895111, 0.5352581143379211, 0.5754530429840088, 0.6156479716300964, 0.6558429002761841, 0.6960378885269165, 0.7362328171730042, 0.7764277458190918, 0.8166227340698242, 0.8568176627159119, 0.8970125913619995, 0.9372075200080872, 0.9774024486541748, 1.0175974369049072, 1.0577924251556396, 1.0979872941970825, 1.138182282447815, 1.1783771514892578, 1.2185721397399902]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 7.0, 6.0, 5.0, 13.0, 12.0, 15.0, 34.0, 38.0, 60.0, 89.0, 140.0, 173.0, 333.0, 404.0, 584.0, 857.0, 1193.0, 1655.0, 2278.0, 3185.0, 4272.0, 6113.0, 8755.0, 12649.0, 19994.0, 36779.0, 84447.0, 223600.0, 326760.0, 165879.0, 63172.0, 29766.0, 16922.0, 11266.0, 7802.0, 5437.0, 4049.0, 2896.0, 2029.0, 1441.0, 1021.0, 740.0, 499.0, 371.0, 249.0, 188.0, 110.0, 86.0, 63.0, 39.0, 27.0, 24.0, 11.0, 7.0, 8.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.310302734375, -0.3000755310058594, -0.28984832763671875, -0.2796211242675781, -0.2693939208984375, -0.2591667175292969, -0.24893951416015625, -0.23871231079101562, -0.228485107421875, -0.21825790405273438, -0.20803070068359375, -0.19780349731445312, -0.1875762939453125, -0.17734909057617188, -0.16712188720703125, -0.15689468383789062, -0.14666748046875, -0.13644027709960938, -0.12621307373046875, -0.11598587036132812, -0.1057586669921875, -0.09553146362304688, -0.08530426025390625, -0.07507705688476562, -0.064849853515625, -0.054622650146484375, -0.04439544677734375, -0.034168243408203125, -0.0239410400390625, -0.013713836669921875, -0.00348663330078125, 0.006740570068359375, 0.0169677734375, 0.027194976806640625, 0.03742218017578125, 0.047649383544921875, 0.0578765869140625, 0.06810379028320312, 0.07833099365234375, 0.08855819702148438, 0.098785400390625, 0.10901260375976562, 0.11923980712890625, 0.12946701049804688, 0.1396942138671875, 0.14992141723632812, 0.16014862060546875, 0.17037582397460938, 0.18060302734375, 0.19083023071289062, 0.20105743408203125, 0.21128463745117188, 0.2215118408203125, 0.23173904418945312, 0.24196624755859375, 0.2521934509277344, 0.262420654296875, 0.2726478576660156, 0.28287506103515625, 0.2931022644042969, 0.3033294677734375, 0.3135566711425781, 0.32378387451171875, 0.3340110778808594, 0.34423828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 8.0, 10.0, 18.0, 19.0, 19.0, 23.0, 31.0, 49.0, 30.0, 40.0, 38.0, 52.0, 52.0, 55.0, 64.0, 40.0, 44.0, 44.0, 41.0, 38.0, 38.0, 45.0, 29.0, 32.0, 27.0, 17.0, 15.0, 11.0, 13.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.314453125, -0.30562591552734375, -0.2967987060546875, -0.28797149658203125, -0.279144287109375, -0.27031707763671875, -0.2614898681640625, -0.25266265869140625, -0.24383544921875, -0.23500823974609375, -0.2261810302734375, -0.21735382080078125, -0.208526611328125, -0.19969940185546875, -0.1908721923828125, -0.18204498291015625, -0.1732177734375, -0.16439056396484375, -0.1555633544921875, -0.14673614501953125, -0.137908935546875, -0.12908172607421875, -0.1202545166015625, -0.11142730712890625, -0.10260009765625, -0.09377288818359375, -0.0849456787109375, -0.07611846923828125, -0.067291259765625, -0.05846405029296875, -0.0496368408203125, -0.04080963134765625, -0.031982421875, -0.02315521240234375, -0.0143280029296875, -0.00550079345703125, 0.003326416015625, 0.01215362548828125, 0.0209808349609375, 0.02980804443359375, 0.03863525390625, 0.04746246337890625, 0.0562896728515625, 0.06511688232421875, 0.073944091796875, 0.08277130126953125, 0.0915985107421875, 0.10042572021484375, 0.1092529296875, 0.11808013916015625, 0.1269073486328125, 0.13573455810546875, 0.144561767578125, 0.15338897705078125, 0.1622161865234375, 0.17104339599609375, 0.17987060546875, 0.18869781494140625, 0.1975250244140625, 0.20635223388671875, 0.215179443359375, 0.22400665283203125, 0.2328338623046875, 0.24166107177734375, 0.25048828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 11.0, 8.0, 13.0, 10.0, 22.0, 47.0, 57.0, 80.0, 105.0, 202.0, 348.0, 756.0, 1883.0, 5592.0, 17227.0, 58934.0, 374619.0, 484684.0, 72684.0, 20806.0, 6401.0, 2255.0, 845.0, 384.0, 192.0, 155.0, 79.0, 52.0, 43.0, 21.0, 10.0, 10.0, 11.0, 5.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8169708251953125, -0.790679931640625, -0.7643890380859375, -0.73809814453125, -0.7118072509765625, -0.685516357421875, -0.6592254638671875, -0.6329345703125, -0.6066436767578125, -0.580352783203125, -0.5540618896484375, -0.52777099609375, -0.5014801025390625, -0.475189208984375, -0.4488983154296875, -0.422607421875, -0.3963165283203125, -0.370025634765625, -0.3437347412109375, -0.31744384765625, -0.2911529541015625, -0.264862060546875, -0.2385711669921875, -0.2122802734375, -0.1859893798828125, -0.159698486328125, -0.1334075927734375, -0.10711669921875, -0.0808258056640625, -0.054534912109375, -0.0282440185546875, -0.001953125, 0.0243377685546875, 0.050628662109375, 0.0769195556640625, 0.10321044921875, 0.1295013427734375, 0.155792236328125, 0.1820831298828125, 0.2083740234375, 0.2346649169921875, 0.260955810546875, 0.2872467041015625, 0.31353759765625, 0.3398284912109375, 0.366119384765625, 0.3924102783203125, 0.418701171875, 0.4449920654296875, 0.471282958984375, 0.4975738525390625, 0.52386474609375, 0.5501556396484375, 0.576446533203125, 0.6027374267578125, 0.6290283203125, 0.6553192138671875, 0.681610107421875, 0.7079010009765625, 0.73419189453125, 0.7604827880859375, 0.786773681640625, 0.8130645751953125, 0.83935546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 3.0, 11.0, 6.0, 4.0, 13.0, 11.0, 12.0, 14.0, 11.0, 19.0, 26.0, 24.0, 27.0, 32.0, 35.0, 43.0, 40.0, 41.0, 45.0, 44.0, 37.0, 36.0, 43.0, 35.0, 37.0, 37.0, 38.0, 34.0, 41.0, 24.0, 23.0, 15.0, 23.0, 23.0, 15.0, 15.0, 12.0, 7.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.6171875, -0.5970382690429688, -0.5768890380859375, -0.5567398071289062, -0.536590576171875, -0.5164413452148438, -0.4962921142578125, -0.47614288330078125, -0.45599365234375, -0.43584442138671875, -0.4156951904296875, -0.39554595947265625, -0.375396728515625, -0.35524749755859375, -0.3350982666015625, -0.31494903564453125, -0.2947998046875, -0.27465057373046875, -0.2545013427734375, -0.23435211181640625, -0.214202880859375, -0.19405364990234375, -0.1739044189453125, -0.15375518798828125, -0.13360595703125, -0.11345672607421875, -0.0933074951171875, -0.07315826416015625, -0.053009033203125, -0.03285980224609375, -0.0127105712890625, 0.00743865966796875, 0.027587890625, 0.04773712158203125, 0.0678863525390625, 0.08803558349609375, 0.108184814453125, 0.12833404541015625, 0.1484832763671875, 0.16863250732421875, 0.18878173828125, 0.20893096923828125, 0.2290802001953125, 0.24922943115234375, 0.269378662109375, 0.28952789306640625, 0.3096771240234375, 0.32982635498046875, 0.3499755859375, 0.37012481689453125, 0.3902740478515625, 0.41042327880859375, 0.430572509765625, 0.45072174072265625, 0.4708709716796875, 0.49102020263671875, 0.51116943359375, 0.5313186645507812, 0.5514678955078125, 0.5716171264648438, 0.591766357421875, 0.6119155883789062, 0.6320648193359375, 0.6522140502929688, 0.67236328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 10.0, 20.0, 28.0, 63.0, 117.0, 252.0, 550.0, 1398.0, 3355.0, 8247.0, 22126.0, 96287.0, 578931.0, 272588.0, 42205.0, 13402.0, 5209.0, 2132.0, 959.0, 350.0, 153.0, 67.0, 46.0, 22.0, 12.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.2989349365234375, -0.289520263671875, -0.2801055908203125, -0.27069091796875, -0.2612762451171875, -0.251861572265625, -0.2424468994140625, -0.2330322265625, -0.2236175537109375, -0.214202880859375, -0.2047882080078125, -0.19537353515625, -0.1859588623046875, -0.176544189453125, -0.1671295166015625, -0.15771484375, -0.1483001708984375, -0.138885498046875, -0.1294708251953125, -0.12005615234375, -0.1106414794921875, -0.101226806640625, -0.0918121337890625, -0.0823974609375, -0.0729827880859375, -0.063568115234375, -0.0541534423828125, -0.04473876953125, -0.0353240966796875, -0.025909423828125, -0.0164947509765625, -0.007080078125, 0.0023345947265625, 0.011749267578125, 0.0211639404296875, 0.03057861328125, 0.0399932861328125, 0.049407958984375, 0.0588226318359375, 0.0682373046875, 0.0776519775390625, 0.087066650390625, 0.0964813232421875, 0.10589599609375, 0.1153106689453125, 0.124725341796875, 0.1341400146484375, 0.1435546875, 0.1529693603515625, 0.162384033203125, 0.1717987060546875, 0.18121337890625, 0.1906280517578125, 0.200042724609375, 0.2094573974609375, 0.2188720703125, 0.2282867431640625, 0.237701416015625, 0.2471160888671875, 0.25653076171875, 0.2659454345703125, 0.275360107421875, 0.2847747802734375, 0.294189453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 9.0, 6.0, 14.0, 16.0, 22.0, 40.0, 62.0, 122.0, 177.0, 160.0, 137.0, 75.0, 36.0, 26.0, 15.0, 15.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.127357482910156e-05, -5.9091486036777496e-05, -5.690939724445343e-05, -5.4727308452129364e-05, -5.25452196598053e-05, -5.036313086748123e-05, -4.8181042075157166e-05, -4.59989532828331e-05, -4.381686449050903e-05, -4.163477569818497e-05, -3.94526869058609e-05, -3.7270598113536835e-05, -3.508850932121277e-05, -3.29064205288887e-05, -3.0724331736564636e-05, -2.854224294424057e-05, -2.6360154151916504e-05, -2.4178065359592438e-05, -2.199597656726837e-05, -1.9813887774944305e-05, -1.763179898262024e-05, -1.5449710190296173e-05, -1.3267621397972107e-05, -1.108553260564804e-05, -8.903443813323975e-06, -6.7213550209999084e-06, -4.539266228675842e-06, -2.357177436351776e-06, -1.7508864402770996e-07, 2.007000148296356e-06, 4.189088940620422e-06, 6.3711777329444885e-06, 8.553266525268555e-06, 1.0735355317592621e-05, 1.2917444109916687e-05, 1.5099532902240753e-05, 1.728162169456482e-05, 1.9463710486888885e-05, 2.164579927921295e-05, 2.3827888071537018e-05, 2.6009976863861084e-05, 2.819206565618515e-05, 3.0374154448509216e-05, 3.255624324083328e-05, 3.473833203315735e-05, 3.6920420825481415e-05, 3.910250961780548e-05, 4.128459841012955e-05, 4.346668720245361e-05, 4.564877599477768e-05, 4.7830864787101746e-05, 5.001295357942581e-05, 5.219504237174988e-05, 5.4377131164073944e-05, 5.655921995639801e-05, 5.8741308748722076e-05, 6.092339754104614e-05, 6.310548633337021e-05, 6.528757512569427e-05, 6.746966391801834e-05, 6.965175271034241e-05, 7.183384150266647e-05, 7.401593029499054e-05, 7.61980190873146e-05, 7.838010787963867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 7.0, 13.0, 13.0, 39.0, 37.0, 58.0, 111.0, 165.0, 314.0, 646.0, 1369.0, 2924.0, 6300.0, 14927.0, 44213.0, 187877.0, 481494.0, 224555.0, 53320.0, 17008.0, 7056.0, 3128.0, 1409.0, 694.0, 343.0, 190.0, 88.0, 70.0, 55.0, 35.0, 26.0, 13.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16382408142089844, -0.15687179565429688, -0.1499195098876953, -0.14296722412109375, -0.1360149383544922, -0.12906265258789062, -0.12211036682128906, -0.1151580810546875, -0.10820579528808594, -0.10125350952148438, -0.09430122375488281, -0.08734893798828125, -0.08039665222167969, -0.07344436645507812, -0.06649208068847656, -0.059539794921875, -0.05258750915527344, -0.045635223388671875, -0.03868293762207031, -0.03173065185546875, -0.024778366088867188, -0.017826080322265625, -0.010873794555664062, -0.0039215087890625, 0.0030307769775390625, 0.009983062744140625, 0.016935348510742188, 0.02388763427734375, 0.030839920043945312, 0.037792205810546875, 0.04474449157714844, 0.05169677734375, 0.05864906311035156, 0.06560134887695312, 0.07255363464355469, 0.07950592041015625, 0.08645820617675781, 0.09341049194335938, 0.10036277770996094, 0.1073150634765625, 0.11426734924316406, 0.12121963500976562, 0.1281719207763672, 0.13512420654296875, 0.1420764923095703, 0.14902877807617188, 0.15598106384277344, 0.162933349609375, 0.16988563537597656, 0.17683792114257812, 0.1837902069091797, 0.19074249267578125, 0.1976947784423828, 0.20464706420898438, 0.21159934997558594, 0.2185516357421875, 0.22550392150878906, 0.23245620727539062, 0.2394084930419922, 0.24636077880859375, 0.2533130645751953, 0.2602653503417969, 0.26721763610839844, 0.274169921875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 12.0, 8.0, 23.0, 21.0, 25.0, 49.0, 48.0, 64.0, 85.0, 95.0, 96.0, 76.0, 73.0, 67.0, 57.0, 40.0, 31.0, 21.0, 20.0, 12.0, 8.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.207275390625, -0.20123291015625, -0.1951904296875, -0.18914794921875, -0.18310546875, -0.17706298828125, -0.1710205078125, -0.16497802734375, -0.158935546875, -0.15289306640625, -0.1468505859375, -0.14080810546875, -0.134765625, -0.12872314453125, -0.1226806640625, -0.11663818359375, -0.110595703125, -0.10455322265625, -0.0985107421875, -0.09246826171875, -0.08642578125, -0.08038330078125, -0.0743408203125, -0.06829833984375, -0.062255859375, -0.05621337890625, -0.0501708984375, -0.04412841796875, -0.0380859375, -0.03204345703125, -0.0260009765625, -0.01995849609375, -0.013916015625, -0.00787353515625, -0.0018310546875, 0.00421142578125, 0.01025390625, 0.01629638671875, 0.0223388671875, 0.02838134765625, 0.034423828125, 0.04046630859375, 0.0465087890625, 0.05255126953125, 0.05859375, 0.06463623046875, 0.0706787109375, 0.07672119140625, 0.082763671875, 0.08880615234375, 0.0948486328125, 0.10089111328125, 0.10693359375, 0.11297607421875, 0.1190185546875, 0.12506103515625, 0.131103515625, 0.13714599609375, 0.1431884765625, 0.14923095703125, 0.1552734375, 0.16131591796875, 0.1673583984375, 0.17340087890625, 0.179443359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 24.0, 41.0, 85.0, 163.0, 205.0, 181.0, 147.0, 87.0, 33.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.264548301696777, -4.139028549194336, -4.0135087966918945, -3.887989044189453, -3.7624692916870117, -3.6369495391845703, -3.511430025100708, -3.3859102725982666, -3.260390520095825, -3.134870767593384, -3.0093510150909424, -2.883831262588501, -2.7583117485046387, -2.6327919960021973, -2.507272243499756, -2.3817524909973145, -2.256232738494873, -2.1307129859924316, -2.0051932334899902, -1.8796736001968384, -1.754153847694397, -1.6286340951919556, -1.5031144618988037, -1.3775947093963623, -1.252074956893921, -1.1265552043914795, -1.001035451889038, -0.8755158185958862, -0.7499960660934448, -0.6244763135910034, -0.4989566206932068, -0.37343692779541016, -0.24791717529296875, -0.12239745259284973, 0.003122270107269287, 0.1286419928073883, 0.2541617155075073, 0.37968146800994873, 0.5052011609077454, 0.630720853805542, 0.7562406063079834, 0.8817603588104248, 1.0072801113128662, 1.132799744606018, 1.2583194971084595, 1.3838392496109009, 1.5093588829040527, 1.6348786354064941, 1.7603983879089355, 1.885918140411377, 2.0114378929138184, 2.1369576454162598, 2.262477397918701, 2.3879971504211426, 2.513516664505005, 2.6390364170074463, 2.7645561695098877, 2.890075922012329, 3.0155956745147705, 3.141115427017212, 3.266634941101074, 3.3921546936035156, 3.517674446105957, 3.6431941986083984, 3.76871395111084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 5.0, 12.0, 14.0, 6.0, 14.0, 19.0, 14.0, 20.0, 22.0, 27.0, 15.0, 23.0, 25.0, 27.0, 29.0, 49.0, 42.0, 36.0, 41.0, 33.0, 45.0, 42.0, 38.0, 43.0, 36.0, 36.0, 40.0, 31.0, 39.0, 18.0, 25.0, 23.0, 11.0, 16.0, 9.0, 12.0, 14.0, 7.0, 6.0, 8.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4789416790008545, -1.428098201751709, -1.377254843711853, -1.3264113664627075, -1.275567889213562, -1.224724531173706, -1.1738810539245605, -1.123037576675415, -1.0721940994262695, -1.021350622177124, -0.9705072045326233, -0.9196637868881226, -0.868820309638977, -0.8179768919944763, -0.7671334743499756, -0.7162899971008301, -0.6654465794563293, -0.6146031618118286, -0.5637596845626831, -0.5129162669181824, -0.46207278966903687, -0.41122937202453613, -0.360385924577713, -0.3095424771308899, -0.2586990296840668, -0.20785558223724365, -0.15701213479042053, -0.1061687022447586, -0.055325254797935486, -0.00448182225227356, 0.04636162519454956, 0.09720507264137268, 0.1480485200881958, 0.19889196753501892, 0.24973541498184204, 0.3005788326263428, 0.3514223098754883, 0.402265727519989, 0.45310917496681213, 0.5039526224136353, 0.5547960996627808, 0.6056395173072815, 0.656482994556427, 0.7073264122009277, 0.7581698894500732, 0.809013307094574, 0.8598567247390747, 0.9107002019882202, 0.961543619632721, 1.0123870372772217, 1.0632305145263672, 1.1140739917755127, 1.1649173498153687, 1.2157608270645142, 1.2666043043136597, 1.3174476623535156, 1.3682911396026611, 1.4191346168518066, 1.4699779748916626, 1.520821452140808, 1.5716649293899536, 1.6225082874298096, 1.673351764678955, 1.7241952419281006, 1.775038719177246]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 12.0, 20.0, 23.0, 32.0, 48.0, 63.0, 120.0, 205.0, 357.0, 641.0, 1166.0, 2440.0, 4950.0, 10359.0, 22570.0, 51745.0, 139050.0, 472580.0, 1533990.0, 1368341.0, 384135.0, 116155.0, 45906.0, 20193.0, 9701.0, 4658.0, 2323.0, 1158.0, 575.0, 295.0, 186.0, 84.0, 54.0, 48.0, 25.0, 11.0, 18.0, 12.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.378173828125, -0.36734771728515625, -0.3565216064453125, -0.34569549560546875, -0.334869384765625, -0.32404327392578125, -0.3132171630859375, -0.30239105224609375, -0.29156494140625, -0.28073883056640625, -0.2699127197265625, -0.25908660888671875, -0.248260498046875, -0.23743438720703125, -0.2266082763671875, -0.21578216552734375, -0.2049560546875, -0.19412994384765625, -0.1833038330078125, -0.17247772216796875, -0.161651611328125, -0.15082550048828125, -0.1399993896484375, -0.12917327880859375, -0.11834716796875, -0.10752105712890625, -0.0966949462890625, -0.08586883544921875, -0.075042724609375, -0.06421661376953125, -0.0533905029296875, -0.04256439208984375, -0.03173828125, -0.02091217041015625, -0.0100860595703125, 0.00074005126953125, 0.011566162109375, 0.02239227294921875, 0.0332183837890625, 0.04404449462890625, 0.05487060546875, 0.06569671630859375, 0.0765228271484375, 0.08734893798828125, 0.098175048828125, 0.10900115966796875, 0.1198272705078125, 0.13065338134765625, 0.1414794921875, 0.15230560302734375, 0.1631317138671875, 0.17395782470703125, 0.184783935546875, 0.19561004638671875, 0.2064361572265625, 0.21726226806640625, 0.22808837890625, 0.23891448974609375, 0.2497406005859375, 0.26056671142578125, 0.271392822265625, 0.28221893310546875, 0.2930450439453125, 0.30387115478515625, 0.314697265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 11.0, 8.0, 14.0, 17.0, 17.0, 15.0, 21.0, 20.0, 42.0, 24.0, 31.0, 34.0, 41.0, 34.0, 42.0, 41.0, 45.0, 41.0, 38.0, 46.0, 31.0, 45.0, 34.0, 44.0, 31.0, 26.0, 30.0, 17.0, 21.0, 17.0, 18.0, 20.0, 14.0, 12.0, 12.0, 11.0, 10.0, 3.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0], "bins": [-0.305908203125, -0.2978096008300781, -0.28971099853515625, -0.2816123962402344, -0.2735137939453125, -0.2654151916503906, -0.25731658935546875, -0.24921798706054688, -0.241119384765625, -0.23302078247070312, -0.22492218017578125, -0.21682357788085938, -0.2087249755859375, -0.20062637329101562, -0.19252777099609375, -0.18442916870117188, -0.17633056640625, -0.16823196411132812, -0.16013336181640625, -0.15203475952148438, -0.1439361572265625, -0.13583755493164062, -0.12773895263671875, -0.11964035034179688, -0.111541748046875, -0.10344314575195312, -0.09534454345703125, -0.08724594116210938, -0.0791473388671875, -0.07104873657226562, -0.06295013427734375, -0.054851531982421875, -0.0467529296875, -0.038654327392578125, -0.03055572509765625, -0.022457122802734375, -0.0143585205078125, -0.006259918212890625, 0.00183868408203125, 0.009937286376953125, 0.018035888671875, 0.026134490966796875, 0.03423309326171875, 0.042331695556640625, 0.0504302978515625, 0.058528900146484375, 0.06662750244140625, 0.07472610473632812, 0.08282470703125, 0.09092330932617188, 0.09902191162109375, 0.10712051391601562, 0.1152191162109375, 0.12331771850585938, 0.13141632080078125, 0.13951492309570312, 0.147613525390625, 0.15571212768554688, 0.16381072998046875, 0.17190933227539062, 0.1800079345703125, 0.18810653686523438, 0.19620513916015625, 0.20430374145507812, 0.21240234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 15.0, 15.0, 21.0, 30.0, 41.0, 38.0, 68.0, 99.0, 149.0, 238.0, 408.0, 635.0, 1158.0, 2177.0, 4633.0, 9783.0, 22040.0, 52063.0, 132597.0, 413916.0, 1740538.0, 1318069.0, 311333.0, 106209.0, 42974.0, 18230.0, 8166.0, 3933.0, 1933.0, 1059.0, 598.0, 363.0, 229.0, 161.0, 105.0, 72.0, 51.0, 28.0, 27.0, 16.0, 15.0, 7.0, 10.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4072265625, -0.39484405517578125, -0.3824615478515625, -0.37007904052734375, -0.357696533203125, -0.34531402587890625, -0.3329315185546875, -0.32054901123046875, -0.30816650390625, -0.29578399658203125, -0.2834014892578125, -0.27101898193359375, -0.258636474609375, -0.24625396728515625, -0.2338714599609375, -0.22148895263671875, -0.2091064453125, -0.19672393798828125, -0.1843414306640625, -0.17195892333984375, -0.159576416015625, -0.14719390869140625, -0.1348114013671875, -0.12242889404296875, -0.11004638671875, -0.09766387939453125, -0.0852813720703125, -0.07289886474609375, -0.060516357421875, -0.04813385009765625, -0.0357513427734375, -0.02336883544921875, -0.010986328125, 0.00139617919921875, 0.0137786865234375, 0.02616119384765625, 0.038543701171875, 0.05092620849609375, 0.0633087158203125, 0.07569122314453125, 0.08807373046875, 0.10045623779296875, 0.1128387451171875, 0.12522125244140625, 0.137603759765625, 0.14998626708984375, 0.1623687744140625, 0.17475128173828125, 0.1871337890625, 0.19951629638671875, 0.2118988037109375, 0.22428131103515625, 0.236663818359375, 0.24904632568359375, 0.2614288330078125, 0.27381134033203125, 0.28619384765625, 0.29857635498046875, 0.3109588623046875, 0.32334136962890625, 0.335723876953125, 0.34810638427734375, 0.3604888916015625, 0.37287139892578125, 0.38525390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 26.0, 18.0, 31.0, 34.0, 57.0, 82.0, 105.0, 151.0, 250.0, 394.0, 593.0, 636.0, 573.0, 345.0, 218.0, 143.0, 113.0, 68.0, 69.0, 46.0, 26.0, 20.0, 16.0, 11.0, 4.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6142578125, -0.595306396484375, -0.57635498046875, -0.557403564453125, -0.5384521484375, -0.519500732421875, -0.50054931640625, -0.481597900390625, -0.462646484375, -0.443695068359375, -0.42474365234375, -0.405792236328125, -0.3868408203125, -0.367889404296875, -0.34893798828125, -0.329986572265625, -0.31103515625, -0.292083740234375, -0.27313232421875, -0.254180908203125, -0.2352294921875, -0.216278076171875, -0.19732666015625, -0.178375244140625, -0.159423828125, -0.140472412109375, -0.12152099609375, -0.102569580078125, -0.0836181640625, -0.064666748046875, -0.04571533203125, -0.026763916015625, -0.0078125, 0.011138916015625, 0.03009033203125, 0.049041748046875, 0.0679931640625, 0.086944580078125, 0.10589599609375, 0.124847412109375, 0.143798828125, 0.162750244140625, 0.18170166015625, 0.200653076171875, 0.2196044921875, 0.238555908203125, 0.25750732421875, 0.276458740234375, 0.29541015625, 0.314361572265625, 0.33331298828125, 0.352264404296875, 0.3712158203125, 0.390167236328125, 0.40911865234375, 0.428070068359375, 0.447021484375, 0.465972900390625, 0.48492431640625, 0.503875732421875, 0.5228271484375, 0.541778564453125, 0.56072998046875, 0.579681396484375, 0.5986328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 8.0, 23.0, 36.0, 67.0, 67.0, 113.0, 151.0, 131.0, 163.0, 92.0, 68.0, 35.0, 16.0, 11.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.871828079223633, -3.752101182937622, -3.6323742866516113, -3.5126476287841797, -3.392920732498169, -3.273193836212158, -3.1534669399261475, -3.0337400436401367, -2.914013147354126, -2.7942862510681152, -2.6745593547821045, -2.5548324584960938, -2.435105800628662, -2.3153789043426514, -2.1956520080566406, -2.07592511177063, -1.9561983346939087, -1.836471438407898, -1.7167446613311768, -1.597017765045166, -1.4772908687591553, -1.3575639724731445, -1.2378371953964233, -1.1181102991104126, -0.9983834624290466, -0.8786566257476807, -0.7589297294616699, -0.639202892780304, -0.519476056098938, -0.39974915981292725, -0.2800223231315613, -0.16029542684555054, -0.04056859016418457, 0.07915826886892319, 0.19888512790203094, 0.3186119794845581, 0.43833884596824646, 0.5580657124519348, 0.6777925491333008, 0.7975194454193115, 0.9172462821006775, 1.0369731187820435, 1.1567000150680542, 1.2764267921447754, 1.3961536884307861, 1.5158805847167969, 1.6356074810028076, 1.7553343772888184, 1.8750611543655396, 1.9947880506515503, 2.1145148277282715, 2.2342417240142822, 2.353968620300293, 2.4736955165863037, 2.5934224128723145, 2.713149070739746, 2.832875967025757, 2.9526028633117676, 3.0723297595977783, 3.192056655883789, 3.3117833137512207, 3.4315102100372314, 3.551237106323242, 3.670964002609253, 3.7906908988952637]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 2.0, 6.0, 13.0, 11.0, 16.0, 14.0, 18.0, 24.0, 21.0, 26.0, 12.0, 32.0, 35.0, 39.0, 38.0, 16.0, 38.0, 33.0, 28.0, 40.0, 36.0, 46.0, 35.0, 50.0, 37.0, 26.0, 37.0, 35.0, 29.0, 28.0, 24.0, 23.0, 14.0, 17.0, 22.0, 15.0, 9.0, 10.0, 5.0, 8.0, 12.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5893858671188354, -1.5412522554397583, -1.4931187629699707, -1.4449851512908936, -1.396851658821106, -1.3487180471420288, -1.3005845546722412, -1.252450942993164, -1.204317331314087, -1.1561837196350098, -1.1080502271652222, -1.059916615486145, -1.0117831230163574, -0.9636495113372803, -0.9155159592628479, -0.8673824071884155, -0.8192489147186279, -0.7711153626441956, -0.7229818105697632, -0.674848198890686, -0.6267147064208984, -0.5785810947418213, -0.5304475426673889, -0.48231399059295654, -0.43418043851852417, -0.3860468864440918, -0.3379133343696594, -0.28977975249290466, -0.2416462004184723, -0.19351264834403992, -0.14537906646728516, -0.09724551439285278, -0.04911184310913086, -0.0009782835841178894, 0.04715527594089508, 0.09528884291648865, 0.14342239499092102, 0.1915559470653534, 0.23968952894210815, 0.2878230810165405, 0.3359566330909729, 0.3840901851654053, 0.43222373723983765, 0.4803573191165924, 0.5284909009933472, 0.5766243934631348, 0.6247580051422119, 0.6728915572166443, 0.7210251092910767, 0.769158661365509, 0.8172922134399414, 0.8654258251190186, 0.9135593175888062, 0.9616929292678833, 1.009826421737671, 1.057960033416748, 1.1060936450958252, 1.1542272567749023, 1.20236074924469, 1.250494360923767, 1.2986278533935547, 1.3467614650726318, 1.394895076751709, 1.4430285692214966, 1.4911620616912842]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 16.0, 15.0, 18.0, 39.0, 105.0, 221.0, 479.0, 1238.0, 2791.0, 6962.0, 15666.0, 35571.0, 125298.0, 534656.0, 237812.0, 51010.0, 20628.0, 9166.0, 3964.0, 1619.0, 660.0, 303.0, 141.0, 84.0, 31.0, 28.0, 10.0, 7.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8773574829101562, -0.8557891845703125, -0.8342208862304688, -0.812652587890625, -0.7910842895507812, -0.7695159912109375, -0.7479476928710938, -0.72637939453125, -0.7048110961914062, -0.6832427978515625, -0.6616744995117188, -0.640106201171875, -0.6185379028320312, -0.5969696044921875, -0.5754013061523438, -0.5538330078125, -0.5322647094726562, -0.5106964111328125, -0.48912811279296875, -0.467559814453125, -0.44599151611328125, -0.4244232177734375, -0.40285491943359375, -0.38128662109375, -0.35971832275390625, -0.3381500244140625, -0.31658172607421875, -0.295013427734375, -0.27344512939453125, -0.2518768310546875, -0.23030853271484375, -0.208740234375, -0.18717193603515625, -0.1656036376953125, -0.14403533935546875, -0.122467041015625, -0.10089874267578125, -0.0793304443359375, -0.05776214599609375, -0.03619384765625, -0.01462554931640625, 0.0069427490234375, 0.02851104736328125, 0.050079345703125, 0.07164764404296875, 0.0932159423828125, 0.11478424072265625, 0.1363525390625, 0.15792083740234375, 0.1794891357421875, 0.20105743408203125, 0.222625732421875, 0.24419403076171875, 0.2657623291015625, 0.28733062744140625, 0.30889892578125, 0.33046722412109375, 0.3520355224609375, 0.37360382080078125, 0.395172119140625, 0.41674041748046875, 0.4383087158203125, 0.45987701416015625, 0.4814453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 11.0, 6.0, 13.0, 10.0, 13.0, 14.0, 15.0, 24.0, 11.0, 22.0, 36.0, 32.0, 38.0, 47.0, 37.0, 37.0, 53.0, 48.0, 44.0, 37.0, 42.0, 35.0, 40.0, 42.0, 32.0, 24.0, 36.0, 35.0, 32.0, 26.0, 18.0, 10.0, 17.0, 9.0, 11.0, 10.0, 9.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.29150390625, -0.28334808349609375, -0.2751922607421875, -0.26703643798828125, -0.258880615234375, -0.25072479248046875, -0.2425689697265625, -0.23441314697265625, -0.22625732421875, -0.21810150146484375, -0.2099456787109375, -0.20178985595703125, -0.193634033203125, -0.18547821044921875, -0.1773223876953125, -0.16916656494140625, -0.1610107421875, -0.15285491943359375, -0.1446990966796875, -0.13654327392578125, -0.128387451171875, -0.12023162841796875, -0.1120758056640625, -0.10391998291015625, -0.09576416015625, -0.08760833740234375, -0.0794525146484375, -0.07129669189453125, -0.063140869140625, -0.05498504638671875, -0.0468292236328125, -0.03867340087890625, -0.030517578125, -0.02236175537109375, -0.0142059326171875, -0.00605010986328125, 0.002105712890625, 0.01026153564453125, 0.0184173583984375, 0.02657318115234375, 0.03472900390625, 0.04288482666015625, 0.0510406494140625, 0.05919647216796875, 0.067352294921875, 0.07550811767578125, 0.0836639404296875, 0.09181976318359375, 0.0999755859375, 0.10813140869140625, 0.1162872314453125, 0.12444305419921875, 0.132598876953125, 0.14075469970703125, 0.1489105224609375, 0.15706634521484375, 0.16522216796875, 0.17337799072265625, 0.1815338134765625, 0.18968963623046875, 0.197845458984375, 0.20600128173828125, 0.2141571044921875, 0.22231292724609375, 0.23046875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 6.0, 12.0, 11.0, 13.0, 29.0, 49.0, 77.0, 131.0, 213.0, 407.0, 863.0, 2200.0, 7014.0, 26615.0, 142959.0, 714812.0, 119591.0, 23499.0, 6192.0, 2004.0, 856.0, 394.0, 221.0, 127.0, 88.0, 52.0, 43.0, 22.0, 11.0, 9.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2294921875, -1.195770263671875, -1.16204833984375, -1.128326416015625, -1.0946044921875, -1.060882568359375, -1.02716064453125, -0.993438720703125, -0.959716796875, -0.925994873046875, -0.89227294921875, -0.858551025390625, -0.8248291015625, -0.791107177734375, -0.75738525390625, -0.723663330078125, -0.68994140625, -0.656219482421875, -0.62249755859375, -0.588775634765625, -0.5550537109375, -0.521331787109375, -0.48760986328125, -0.453887939453125, -0.420166015625, -0.386444091796875, -0.35272216796875, -0.319000244140625, -0.2852783203125, -0.251556396484375, -0.21783447265625, -0.184112548828125, -0.150390625, -0.116668701171875, -0.08294677734375, -0.049224853515625, -0.0155029296875, 0.018218994140625, 0.05194091796875, 0.085662841796875, 0.119384765625, 0.153106689453125, 0.18682861328125, 0.220550537109375, 0.2542724609375, 0.287994384765625, 0.32171630859375, 0.355438232421875, 0.38916015625, 0.422882080078125, 0.45660400390625, 0.490325927734375, 0.5240478515625, 0.557769775390625, 0.59149169921875, 0.625213623046875, 0.658935546875, 0.692657470703125, 0.72637939453125, 0.760101318359375, 0.7938232421875, 0.827545166015625, 0.86126708984375, 0.894989013671875, 0.9287109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 7.0, 13.0, 11.0, 10.0, 16.0, 15.0, 19.0, 14.0, 35.0, 36.0, 21.0, 38.0, 45.0, 45.0, 45.0, 49.0, 47.0, 40.0, 53.0, 50.0, 43.0, 49.0, 42.0, 25.0, 35.0, 29.0, 29.0, 17.0, 22.0, 11.0, 14.0, 13.0, 8.0, 8.0, 12.0, 8.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84521484375, -0.818939208984375, -0.79266357421875, -0.766387939453125, -0.7401123046875, -0.713836669921875, -0.68756103515625, -0.661285400390625, -0.635009765625, -0.608734130859375, -0.58245849609375, -0.556182861328125, -0.5299072265625, -0.503631591796875, -0.47735595703125, -0.451080322265625, -0.4248046875, -0.398529052734375, -0.37225341796875, -0.345977783203125, -0.3197021484375, -0.293426513671875, -0.26715087890625, -0.240875244140625, -0.214599609375, -0.188323974609375, -0.16204833984375, -0.135772705078125, -0.1094970703125, -0.083221435546875, -0.05694580078125, -0.030670166015625, -0.00439453125, 0.021881103515625, 0.04815673828125, 0.074432373046875, 0.1007080078125, 0.126983642578125, 0.15325927734375, 0.179534912109375, 0.205810546875, 0.232086181640625, 0.25836181640625, 0.284637451171875, 0.3109130859375, 0.337188720703125, 0.36346435546875, 0.389739990234375, 0.416015625, 0.442291259765625, 0.46856689453125, 0.494842529296875, 0.5211181640625, 0.547393798828125, 0.57366943359375, 0.599945068359375, 0.626220703125, 0.652496337890625, 0.67877197265625, 0.705047607421875, 0.7313232421875, 0.757598876953125, 0.78387451171875, 0.810150146484375, 0.83642578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 8.0, 19.0, 32.0, 58.0, 68.0, 111.0, 215.0, 380.0, 805.0, 1636.0, 3607.0, 7840.0, 18119.0, 46695.0, 179134.0, 555360.0, 159552.0, 43863.0, 17196.0, 7361.0, 3283.0, 1566.0, 731.0, 363.0, 199.0, 124.0, 70.0, 46.0, 34.0, 18.0, 13.0, 9.0, 6.0, 4.0, 5.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2459716796875, -0.2378978729248047, -0.22982406616210938, -0.22175025939941406, -0.21367645263671875, -0.20560264587402344, -0.19752883911132812, -0.1894550323486328, -0.1813812255859375, -0.1733074188232422, -0.16523361206054688, -0.15715980529785156, -0.14908599853515625, -0.14101219177246094, -0.13293838500976562, -0.12486457824707031, -0.116790771484375, -0.10871696472167969, -0.10064315795898438, -0.09256935119628906, -0.08449554443359375, -0.07642173767089844, -0.06834793090820312, -0.06027412414550781, -0.0522003173828125, -0.04412651062011719, -0.036052703857421875, -0.027978897094726562, -0.01990509033203125, -0.011831283569335938, -0.003757476806640625, 0.0043163299560546875, 0.01239013671875, 0.020463943481445312, 0.028537750244140625, 0.03661155700683594, 0.04468536376953125, 0.05275917053222656, 0.060832977294921875, 0.06890678405761719, 0.0769805908203125, 0.08505439758300781, 0.09312820434570312, 0.10120201110839844, 0.10927581787109375, 0.11734962463378906, 0.12542343139648438, 0.1334972381591797, 0.141571044921875, 0.1496448516845703, 0.15771865844726562, 0.16579246520996094, 0.17386627197265625, 0.18194007873535156, 0.19001388549804688, 0.1980876922607422, 0.2061614990234375, 0.2142353057861328, 0.22230911254882812, 0.23038291931152344, 0.23845672607421875, 0.24653053283691406, 0.2546043395996094, 0.2626781463623047, 0.270751953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 2.0, 7.0, 7.0, 7.0, 5.0, 10.0, 14.0, 21.0, 30.0, 22.0, 53.0, 107.0, 144.0, 162.0, 124.0, 71.0, 52.0, 33.0, 25.0, 14.0, 11.0, 9.0, 9.0, 5.0, 2.0, 7.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.604194641113281e-05, -6.392784416675568e-05, -6.181374192237854e-05, -5.9699639678001404e-05, -5.758553743362427e-05, -5.547143518924713e-05, -5.3357332944869995e-05, -5.124323070049286e-05, -4.912912845611572e-05, -4.7015026211738586e-05, -4.490092396736145e-05, -4.2786821722984314e-05, -4.067271947860718e-05, -3.855861723423004e-05, -3.6444514989852905e-05, -3.433041274547577e-05, -3.221631050109863e-05, -3.0102208256721497e-05, -2.798810601234436e-05, -2.5874003767967224e-05, -2.3759901523590088e-05, -2.164579927921295e-05, -1.9531697034835815e-05, -1.741759479045868e-05, -1.5303492546081543e-05, -1.3189390301704407e-05, -1.107528805732727e-05, -8.961185812950134e-06, -6.847083568572998e-06, -4.732981324195862e-06, -2.6188790798187256e-06, -5.047768354415894e-07, 1.6093254089355469e-06, 3.723427653312683e-06, 5.837529897689819e-06, 7.951632142066956e-06, 1.0065734386444092e-05, 1.2179836630821228e-05, 1.4293938875198364e-05, 1.64080411195755e-05, 1.8522143363952637e-05, 2.0636245608329773e-05, 2.275034785270691e-05, 2.4864450097084045e-05, 2.697855234146118e-05, 2.9092654585838318e-05, 3.1206756830215454e-05, 3.332085907459259e-05, 3.5434961318969727e-05, 3.754906356334686e-05, 3.9663165807724e-05, 4.1777268052101135e-05, 4.389137029647827e-05, 4.600547254085541e-05, 4.8119574785232544e-05, 5.023367702960968e-05, 5.2347779273986816e-05, 5.446188151836395e-05, 5.657598376274109e-05, 5.8690086007118225e-05, 6.080418825149536e-05, 6.29182904958725e-05, 6.503239274024963e-05, 6.714649498462677e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 12.0, 19.0, 35.0, 41.0, 68.0, 102.0, 176.0, 253.0, 473.0, 819.0, 1726.0, 3966.0, 10024.0, 26977.0, 82620.0, 353066.0, 418598.0, 98339.0, 31178.0, 11323.0, 4486.0, 1941.0, 931.0, 478.0, 318.0, 202.0, 110.0, 74.0, 70.0, 32.0, 23.0, 13.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.244873046875, -0.23699188232421875, -0.2291107177734375, -0.22122955322265625, -0.213348388671875, -0.20546722412109375, -0.1975860595703125, -0.18970489501953125, -0.18182373046875, -0.17394256591796875, -0.1660614013671875, -0.15818023681640625, -0.150299072265625, -0.14241790771484375, -0.1345367431640625, -0.12665557861328125, -0.1187744140625, -0.11089324951171875, -0.1030120849609375, -0.09513092041015625, -0.087249755859375, -0.07936859130859375, -0.0714874267578125, -0.06360626220703125, -0.05572509765625, -0.04784393310546875, -0.0399627685546875, -0.03208160400390625, -0.024200439453125, -0.01631927490234375, -0.0084381103515625, -0.00055694580078125, 0.00732421875, 0.01520538330078125, 0.0230865478515625, 0.03096771240234375, 0.038848876953125, 0.04673004150390625, 0.0546112060546875, 0.06249237060546875, 0.07037353515625, 0.07825469970703125, 0.0861358642578125, 0.09401702880859375, 0.101898193359375, 0.10977935791015625, 0.1176605224609375, 0.12554168701171875, 0.1334228515625, 0.14130401611328125, 0.1491851806640625, 0.15706634521484375, 0.164947509765625, 0.17282867431640625, 0.1807098388671875, 0.18859100341796875, 0.19647216796875, 0.20435333251953125, 0.2122344970703125, 0.22011566162109375, 0.227996826171875, 0.23587799072265625, 0.2437591552734375, 0.25164031982421875, 0.259521484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 9.0, 8.0, 11.0, 7.0, 17.0, 24.0, 26.0, 41.0, 46.0, 75.0, 82.0, 98.0, 119.0, 98.0, 80.0, 51.0, 49.0, 29.0, 23.0, 13.0, 10.0, 12.0, 11.0, 10.0, 7.0, 4.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.1789073944091797, -0.17116928100585938, -0.16343116760253906, -0.15569305419921875, -0.14795494079589844, -0.14021682739257812, -0.1324787139892578, -0.1247406005859375, -0.11700248718261719, -0.10926437377929688, -0.10152626037597656, -0.09378814697265625, -0.08605003356933594, -0.07831192016601562, -0.07057380676269531, -0.062835693359375, -0.05509757995605469, -0.047359466552734375, -0.03962135314941406, -0.03188323974609375, -0.024145126342773438, -0.016407012939453125, -0.008668899536132812, -0.0009307861328125, 0.0068073272705078125, 0.014545440673828125, 0.022283554077148438, 0.03002166748046875, 0.03775978088378906, 0.045497894287109375, 0.05323600769042969, 0.06097412109375, 0.06871223449707031, 0.07645034790039062, 0.08418846130371094, 0.09192657470703125, 0.09966468811035156, 0.10740280151367188, 0.11514091491699219, 0.1228790283203125, 0.1306171417236328, 0.13835525512695312, 0.14609336853027344, 0.15383148193359375, 0.16156959533691406, 0.16930770874023438, 0.1770458221435547, 0.184783935546875, 0.1925220489501953, 0.20026016235351562, 0.20799827575683594, 0.21573638916015625, 0.22347450256347656, 0.23121261596679688, 0.2389507293701172, 0.2466888427734375, 0.2544269561767578, 0.2621650695800781, 0.26990318298339844, 0.27764129638671875, 0.28537940979003906, 0.2931175231933594, 0.3008556365966797, 0.30859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 24.0, 38.0, 132.0, 189.0, 230.0, 186.0, 103.0, 53.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.537570953369141, -5.381424427032471, -5.225278377532959, -5.069131851196289, -4.912985801696777, -4.756839275360107, -4.600693225860596, -4.444546699523926, -4.288400650024414, -4.132254123687744, -3.9761080741882324, -3.8199617862701416, -3.663815498352051, -3.50766921043396, -3.351522922515869, -3.195376396179199, -3.0392301082611084, -2.8830838203430176, -2.7269375324249268, -2.570791244506836, -2.414644956588745, -2.2584986686706543, -2.1023521423339844, -1.946205973625183, -1.7900596857070923, -1.6339133977890015, -1.4777671098709106, -1.3216207027435303, -1.1654744148254395, -1.0093281269073486, -0.8531818389892578, -0.697035551071167, -0.5408892631530762, -0.38474297523498535, -0.22859665751457214, -0.07245033979415894, 0.08369594812393188, 0.2398422360420227, 0.3959885835647583, 0.5521348714828491, 0.7082811594009399, 0.8644274473190308, 1.0205737352371216, 1.176720142364502, 1.3328664302825928, 1.4890127182006836, 1.6451590061187744, 1.8013052940368652, 1.957451581954956, 2.113597869873047, 2.2697441577911377, 2.4258904457092285, 2.5820367336273193, 2.73818302154541, 2.89432954788208, 3.050475597381592, 3.2066221237182617, 3.3627684116363525, 3.5189146995544434, 3.675060987472534, 3.831207275390625, 3.987353563308716, 4.143499851226807, 4.299646377563477, 4.455792427062988]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 7.0, 12.0, 20.0, 18.0, 19.0, 27.0, 16.0, 21.0, 27.0, 28.0, 54.0, 29.0, 42.0, 40.0, 44.0, 35.0, 39.0, 38.0, 41.0, 41.0, 36.0, 40.0, 30.0, 32.0, 29.0, 32.0, 33.0, 18.0, 22.0, 20.0, 20.0, 13.0, 12.0, 8.0, 2.0, 10.0, 6.0, 3.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5388506650924683, -1.4822354316711426, -1.4256203174591064, -1.3690050840377808, -1.312389850616455, -1.255774736404419, -1.1991595029830933, -1.1425442695617676, -1.0859291553497314, -1.0293139219284058, -0.9726987481117249, -0.916083574295044, -0.8594683408737183, -0.8028531670570374, -0.7462379932403564, -0.6896227598190308, -0.6330075263977051, -0.5763923525810242, -0.5197771191596985, -0.4631619453430176, -0.4065467417240143, -0.349931538105011, -0.2933163642883301, -0.23670116066932678, -0.1800859570503235, -0.12347076088190079, -0.06685556471347809, -0.010240375995635986, 0.04637482762336731, 0.1029900312423706, 0.1596052050590515, 0.2162204086780548, 0.27283573150634766, 0.32945093512535095, 0.38606613874435425, 0.44268131256103516, 0.49929651618003845, 0.5559117197990417, 0.6125268936157227, 0.6691421270370483, 0.7257573008537292, 0.7823724746704102, 0.8389877080917358, 0.8956028819084167, 0.9522180557250977, 1.0088332891464233, 1.065448522567749, 1.1220636367797852, 1.1786788702011108, 1.2352941036224365, 1.2919092178344727, 1.3485244512557983, 1.405139684677124, 1.4617547988891602, 1.5183700323104858, 1.5749852657318115, 1.6316003799438477, 1.6882156133651733, 1.7448307275772095, 1.8014459609985352, 1.8580611944198608, 1.9146764278411865, 1.9712915420532227, 2.027906656265259, 2.084522008895874]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 12.0, 16.0, 20.0, 28.0, 44.0, 81.0, 113.0, 178.0, 327.0, 546.0, 906.0, 1558.0, 2733.0, 4722.0, 8590.0, 16061.0, 29598.0, 59428.0, 131670.0, 321897.0, 736628.0, 1182341.0, 922017.0, 432536.0, 182520.0, 78986.0, 37573.0, 19375.0, 10481.0, 5808.0, 3250.0, 1819.0, 1040.0, 549.0, 305.0, 201.0, 111.0, 77.0, 46.0, 25.0, 14.0, 16.0, 9.0, 9.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-0.281005859375, -0.2733421325683594, -0.26567840576171875, -0.2580146789550781, -0.2503509521484375, -0.24268722534179688, -0.23502349853515625, -0.22735977172851562, -0.219696044921875, -0.21203231811523438, -0.20436859130859375, -0.19670486450195312, -0.1890411376953125, -0.18137741088867188, -0.17371368408203125, -0.16604995727539062, -0.15838623046875, -0.15072250366210938, -0.14305877685546875, -0.13539505004882812, -0.1277313232421875, -0.12006759643554688, -0.11240386962890625, -0.10474014282226562, -0.097076416015625, -0.08941268920898438, -0.08174896240234375, -0.07408523559570312, -0.0664215087890625, -0.058757781982421875, -0.05109405517578125, -0.043430328369140625, -0.0357666015625, -0.028102874755859375, -0.02043914794921875, -0.012775421142578125, -0.0051116943359375, 0.002552032470703125, 0.01021575927734375, 0.017879486083984375, 0.025543212890625, 0.033206939697265625, 0.04087066650390625, 0.048534393310546875, 0.0561981201171875, 0.06386184692382812, 0.07152557373046875, 0.07918930053710938, 0.08685302734375, 0.09451675415039062, 0.10218048095703125, 0.10984420776367188, 0.1175079345703125, 0.12517166137695312, 0.13283538818359375, 0.14049911499023438, 0.148162841796875, 0.15582656860351562, 0.16349029541015625, 0.17115402221679688, 0.1788177490234375, 0.18648147583007812, 0.19414520263671875, 0.20180892944335938, 0.20947265625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 6.0, 8.0, 10.0, 8.0, 8.0, 12.0, 17.0, 14.0, 19.0, 20.0, 20.0, 27.0, 35.0, 36.0, 37.0, 31.0, 40.0, 52.0, 44.0, 28.0, 41.0, 54.0, 35.0, 37.0, 28.0, 28.0, 24.0, 32.0, 36.0, 22.0, 30.0, 22.0, 24.0, 17.0, 16.0, 14.0, 9.0, 7.0, 7.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.2267131805419922, -0.21868515014648438, -0.21065711975097656, -0.20262908935546875, -0.19460105895996094, -0.18657302856445312, -0.1785449981689453, -0.1705169677734375, -0.1624889373779297, -0.15446090698242188, -0.14643287658691406, -0.13840484619140625, -0.13037681579589844, -0.12234878540039062, -0.11432075500488281, -0.106292724609375, -0.09826469421386719, -0.09023666381835938, -0.08220863342285156, -0.07418060302734375, -0.06615257263183594, -0.058124542236328125, -0.05009651184082031, -0.0420684814453125, -0.03404045104980469, -0.026012420654296875, -0.017984390258789062, -0.00995635986328125, -0.0019283294677734375, 0.006099700927734375, 0.014127731323242188, 0.02215576171875, 0.030183792114257812, 0.038211822509765625, 0.04623985290527344, 0.05426788330078125, 0.06229591369628906, 0.07032394409179688, 0.07835197448730469, 0.0863800048828125, 0.09440803527832031, 0.10243606567382812, 0.11046409606933594, 0.11849212646484375, 0.12652015686035156, 0.13454818725585938, 0.1425762176513672, 0.150604248046875, 0.1586322784423828, 0.16666030883789062, 0.17468833923339844, 0.18271636962890625, 0.19074440002441406, 0.19877243041992188, 0.2068004608154297, 0.2148284912109375, 0.2228565216064453, 0.23088455200195312, 0.23891258239746094, 0.24694061279296875, 0.25496864318847656, 0.2629966735839844, 0.2710247039794922, 0.279052734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 4.0, 9.0, 14.0, 21.0, 29.0, 45.0, 66.0, 102.0, 157.0, 283.0, 505.0, 877.0, 1775.0, 3912.0, 9921.0, 27868.0, 82291.0, 276525.0, 1303155.0, 1889642.0, 419073.0, 116491.0, 38371.0, 13353.0, 5175.0, 2149.0, 1065.0, 523.0, 321.0, 195.0, 116.0, 79.0, 58.0, 44.0, 27.0, 11.0, 8.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.55517578125, -0.5398178100585938, -0.5244598388671875, -0.5091018676757812, -0.493743896484375, -0.47838592529296875, -0.4630279541015625, -0.44766998291015625, -0.43231201171875, -0.41695404052734375, -0.4015960693359375, -0.38623809814453125, -0.370880126953125, -0.35552215576171875, -0.3401641845703125, -0.32480621337890625, -0.3094482421875, -0.29409027099609375, -0.2787322998046875, -0.26337432861328125, -0.248016357421875, -0.23265838623046875, -0.2173004150390625, -0.20194244384765625, -0.18658447265625, -0.17122650146484375, -0.1558685302734375, -0.14051055908203125, -0.125152587890625, -0.10979461669921875, -0.0944366455078125, -0.07907867431640625, -0.063720703125, -0.04836273193359375, -0.0330047607421875, -0.01764678955078125, -0.002288818359375, 0.01306915283203125, 0.0284271240234375, 0.04378509521484375, 0.05914306640625, 0.07450103759765625, 0.0898590087890625, 0.10521697998046875, 0.120574951171875, 0.13593292236328125, 0.1512908935546875, 0.16664886474609375, 0.1820068359375, 0.19736480712890625, 0.2127227783203125, 0.22808074951171875, 0.243438720703125, 0.25879669189453125, 0.2741546630859375, 0.28951263427734375, 0.30487060546875, 0.32022857666015625, 0.3355865478515625, 0.35094451904296875, 0.366302490234375, 0.38166046142578125, 0.3970184326171875, 0.41237640380859375, 0.427734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 8.0, 7.0, 4.0, 11.0, 13.0, 20.0, 15.0, 39.0, 33.0, 51.0, 67.0, 88.0, 119.0, 156.0, 214.0, 320.0, 418.0, 451.0, 474.0, 403.0, 288.0, 223.0, 148.0, 113.0, 69.0, 64.0, 58.0, 52.0, 36.0, 31.0, 18.0, 20.0, 11.0, 9.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4546546936035156, -0.43787384033203125, -0.4210929870605469, -0.4043121337890625, -0.3875312805175781, -0.37075042724609375, -0.3539695739746094, -0.337188720703125, -0.3204078674316406, -0.30362701416015625, -0.2868461608886719, -0.2700653076171875, -0.2532844543457031, -0.23650360107421875, -0.21972274780273438, -0.20294189453125, -0.18616104125976562, -0.16938018798828125, -0.15259933471679688, -0.1358184814453125, -0.11903762817382812, -0.10225677490234375, -0.08547592163085938, -0.068695068359375, -0.051914215087890625, -0.03513336181640625, -0.018352508544921875, -0.0015716552734375, 0.015209197998046875, 0.03199005126953125, 0.048770904541015625, 0.0655517578125, 0.08233261108398438, 0.09911346435546875, 0.11589431762695312, 0.1326751708984375, 0.14945602416992188, 0.16623687744140625, 0.18301773071289062, 0.199798583984375, 0.21657943725585938, 0.23336029052734375, 0.2501411437988281, 0.2669219970703125, 0.2837028503417969, 0.30048370361328125, 0.3172645568847656, 0.33404541015625, 0.3508262634277344, 0.36760711669921875, 0.3843879699707031, 0.4011688232421875, 0.4179496765136719, 0.43473052978515625, 0.4515113830566406, 0.468292236328125, 0.4850730895996094, 0.5018539428710938, 0.5186347961425781, 0.5354156494140625, 0.5521965026855469, 0.5689773559570312, 0.5857582092285156, 0.6025390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 9.0, 30.0, 74.0, 131.0, 163.0, 198.0, 176.0, 114.0, 44.0, 23.0, 11.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0295021533966064, -2.8640270233154297, -2.698552131652832, -2.5330770015716553, -2.3676018714904785, -2.2021267414093018, -2.036651611328125, -1.8711767196655273, -1.7057015895843506, -1.5402264595031738, -1.3747514486312866, -1.2092764377593994, -1.0438013076782227, -0.8783262372016907, -0.7128511667251587, -0.5473761558532715, -0.3819010257720947, -0.21642595529556274, -0.05095088481903076, 0.11452418565750122, 0.2799992561340332, 0.4454743266105652, 0.6109493970870972, 0.7764244079589844, 0.9418995380401611, 1.107374668121338, 1.272849678993225, 1.4383246898651123, 1.603799819946289, 1.7692749500274658, 1.934749960899353, 2.1002249717712402, 2.265699863433838, 2.4311749935150146, 2.5966501235961914, 2.762125015258789, 2.927600145339966, 3.0930752754211426, 3.2585501670837402, 3.424025297164917, 3.5895004272460938, 3.7549755573272705, 3.9204506874084473, 4.085925579071045, 4.251400947570801, 4.416875839233398, 4.582350730895996, 4.747825622558594, 4.91330099105835, 5.078775882720947, 5.244251251220703, 5.409726142883301, 5.575201034545898, 5.740676403045654, 5.906151294708252, 6.071626663208008, 6.2371015548706055, 6.402576446533203, 6.568051815032959, 6.733526706695557, 6.8990020751953125, 7.06447696685791, 7.229951858520508, 7.3954267501831055, 7.560902118682861]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 3.0, 8.0, 5.0, 10.0, 21.0, 14.0, 12.0, 10.0, 21.0, 16.0, 21.0, 25.0, 33.0, 34.0, 29.0, 32.0, 28.0, 39.0, 32.0, 40.0, 42.0, 46.0, 34.0, 40.0, 38.0, 32.0, 45.0, 26.0, 22.0, 26.0, 25.0, 24.0, 17.0, 17.0, 11.0, 10.0, 16.0, 12.0, 10.0, 9.0, 18.0, 11.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6110713481903076, -1.5594319105148315, -1.5077924728393555, -1.4561530351638794, -1.4045135974884033, -1.3528741598129272, -1.3012347221374512, -1.2495954036712646, -1.197955846786499, -1.146316409111023, -1.0946769714355469, -1.0430375337600708, -0.9913980960845947, -0.9397586584091187, -0.8881192803382874, -0.8364798426628113, -0.78484046459198, -0.7332010269165039, -0.6815615892410278, -0.6299221515655518, -0.5782827138900757, -0.5266432762145996, -0.4750038981437683, -0.42336446046829224, -0.37172502279281616, -0.3200855851173401, -0.268446147441864, -0.21680673956871033, -0.16516730189323425, -0.11352786421775818, -0.06188845634460449, -0.010249018669128418, 0.041390299797058105, 0.09302973002195358, 0.14466916024684906, 0.19630858302116394, 0.24794802069664001, 0.2995874583721161, 0.3512268662452698, 0.40286630392074585, 0.4545057415962219, 0.506145179271698, 0.5577846169471741, 0.6094239950180054, 0.6610634326934814, 0.7127028703689575, 0.7643423080444336, 0.8159817457199097, 0.8676211833953857, 0.9192606210708618, 0.9709000587463379, 1.022539496421814, 1.07417893409729, 1.1258183717727661, 1.1774578094482422, 1.2290971279144287, 1.2807366847991943, 1.3323761224746704, 1.3840155601501465, 1.4356549978256226, 1.4872944355010986, 1.5389338731765747, 1.5905733108520508, 1.6422126293182373, 1.6938520669937134]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 7.0, 8.0, 6.0, 18.0, 10.0, 21.0, 48.0, 58.0, 86.0, 143.0, 223.0, 349.0, 592.0, 1077.0, 1928.0, 3418.0, 6447.0, 11062.0, 19964.0, 35873.0, 75183.0, 183643.0, 324494.0, 209768.0, 84988.0, 39988.0, 21505.0, 12227.0, 6914.0, 3693.0, 2041.0, 1114.0, 645.0, 377.0, 205.0, 139.0, 106.0, 57.0, 47.0, 29.0, 16.0, 13.0, 14.0, 1.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3312492370605469, -0.31923675537109375, -0.3072242736816406, -0.2952117919921875, -0.2831993103027344, -0.27118682861328125, -0.2591743469238281, -0.247161865234375, -0.23514938354492188, -0.22313690185546875, -0.21112442016601562, -0.1991119384765625, -0.18709945678710938, -0.17508697509765625, -0.16307449340820312, -0.15106201171875, -0.13904953002929688, -0.12703704833984375, -0.11502456665039062, -0.1030120849609375, -0.09099960327148438, -0.07898712158203125, -0.06697463989257812, -0.054962158203125, -0.042949676513671875, -0.03093719482421875, -0.018924713134765625, -0.0069122314453125, 0.005100250244140625, 0.01711273193359375, 0.029125213623046875, 0.0411376953125, 0.053150177001953125, 0.06516265869140625, 0.07717514038085938, 0.0891876220703125, 0.10120010375976562, 0.11321258544921875, 0.12522506713867188, 0.137237548828125, 0.14925003051757812, 0.16126251220703125, 0.17327499389648438, 0.1852874755859375, 0.19729995727539062, 0.20931243896484375, 0.22132492065429688, 0.23333740234375, 0.24534988403320312, 0.25736236572265625, 0.2693748474121094, 0.2813873291015625, 0.2933998107910156, 0.30541229248046875, 0.3174247741699219, 0.329437255859375, 0.3414497375488281, 0.35346221923828125, 0.3654747009277344, 0.3774871826171875, 0.3894996643066406, 0.40151214599609375, 0.4135246276855469, 0.425537109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 6.0, 6.0, 8.0, 11.0, 6.0, 13.0, 18.0, 13.0, 13.0, 21.0, 23.0, 31.0, 21.0, 25.0, 35.0, 26.0, 39.0, 44.0, 36.0, 35.0, 45.0, 40.0, 39.0, 39.0, 30.0, 42.0, 34.0, 35.0, 41.0, 29.0, 24.0, 21.0, 25.0, 28.0, 21.0, 14.0, 10.0, 8.0, 14.0, 9.0, 7.0, 7.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.2169036865234375, -0.209197998046875, -0.2014923095703125, -0.19378662109375, -0.1860809326171875, -0.178375244140625, -0.1706695556640625, -0.1629638671875, -0.1552581787109375, -0.147552490234375, -0.1398468017578125, -0.13214111328125, -0.1244354248046875, -0.116729736328125, -0.1090240478515625, -0.101318359375, -0.0936126708984375, -0.085906982421875, -0.0782012939453125, -0.07049560546875, -0.0627899169921875, -0.055084228515625, -0.0473785400390625, -0.0396728515625, -0.0319671630859375, -0.024261474609375, -0.0165557861328125, -0.00885009765625, -0.0011444091796875, 0.006561279296875, 0.0142669677734375, 0.02197265625, 0.0296783447265625, 0.037384033203125, 0.0450897216796875, 0.05279541015625, 0.0605010986328125, 0.068206787109375, 0.0759124755859375, 0.0836181640625, 0.0913238525390625, 0.099029541015625, 0.1067352294921875, 0.11444091796875, 0.1221466064453125, 0.129852294921875, 0.1375579833984375, 0.145263671875, 0.1529693603515625, 0.160675048828125, 0.1683807373046875, 0.17608642578125, 0.1837921142578125, 0.191497802734375, 0.1992034912109375, 0.2069091796875, 0.2146148681640625, 0.222320556640625, 0.2300262451171875, 0.23773193359375, 0.2454376220703125, 0.253143310546875, 0.2608489990234375, 0.2685546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 13.0, 20.0, 24.0, 35.0, 66.0, 93.0, 130.0, 211.0, 337.0, 620.0, 1176.0, 3064.0, 8602.0, 27214.0, 96886.0, 447677.0, 353052.0, 75235.0, 21748.0, 7237.0, 2526.0, 1105.0, 597.0, 319.0, 200.0, 112.0, 82.0, 49.0, 39.0, 16.0, 14.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.6050643920898438, -0.5797576904296875, -0.5544509887695312, -0.529144287109375, -0.5038375854492188, -0.4785308837890625, -0.45322418212890625, -0.42791748046875, -0.40261077880859375, -0.3773040771484375, -0.35199737548828125, -0.326690673828125, -0.30138397216796875, -0.2760772705078125, -0.25077056884765625, -0.2254638671875, -0.20015716552734375, -0.1748504638671875, -0.14954376220703125, -0.124237060546875, -0.09893035888671875, -0.0736236572265625, -0.04831695556640625, -0.02301025390625, 0.00229644775390625, 0.0276031494140625, 0.05290985107421875, 0.078216552734375, 0.10352325439453125, 0.1288299560546875, 0.15413665771484375, 0.179443359375, 0.20475006103515625, 0.2300567626953125, 0.25536346435546875, 0.280670166015625, 0.30597686767578125, 0.3312835693359375, 0.35659027099609375, 0.38189697265625, 0.40720367431640625, 0.4325103759765625, 0.45781707763671875, 0.483123779296875, 0.5084304809570312, 0.5337371826171875, 0.5590438842773438, 0.5843505859375, 0.6096572875976562, 0.6349639892578125, 0.6602706909179688, 0.685577392578125, 0.7108840942382812, 0.7361907958984375, 0.7614974975585938, 0.78680419921875, 0.8121109008789062, 0.8374176025390625, 0.8627243041992188, 0.888031005859375, 0.9133377075195312, 0.9386444091796875, 0.9639511108398438, 0.9892578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 8.0, 3.0, 3.0, 7.0, 15.0, 5.0, 8.0, 13.0, 21.0, 23.0, 36.0, 29.0, 25.0, 29.0, 26.0, 40.0, 49.0, 49.0, 36.0, 50.0, 56.0, 45.0, 30.0, 39.0, 32.0, 28.0, 45.0, 34.0, 42.0, 26.0, 19.0, 24.0, 17.0, 12.0, 14.0, 15.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87890625, -0.8538818359375, -0.828857421875, -0.8038330078125, -0.77880859375, -0.7537841796875, -0.728759765625, -0.7037353515625, -0.6787109375, -0.6536865234375, -0.628662109375, -0.6036376953125, -0.57861328125, -0.5535888671875, -0.528564453125, -0.5035400390625, -0.478515625, -0.4534912109375, -0.428466796875, -0.4034423828125, -0.37841796875, -0.3533935546875, -0.328369140625, -0.3033447265625, -0.2783203125, -0.2532958984375, -0.228271484375, -0.2032470703125, -0.17822265625, -0.1531982421875, -0.128173828125, -0.1031494140625, -0.078125, -0.0531005859375, -0.028076171875, -0.0030517578125, 0.02197265625, 0.0469970703125, 0.072021484375, 0.0970458984375, 0.1220703125, 0.1470947265625, 0.172119140625, 0.1971435546875, 0.22216796875, 0.2471923828125, 0.272216796875, 0.2972412109375, 0.322265625, 0.3472900390625, 0.372314453125, 0.3973388671875, 0.42236328125, 0.4473876953125, 0.472412109375, 0.4974365234375, 0.5224609375, 0.5474853515625, 0.572509765625, 0.5975341796875, 0.62255859375, 0.6475830078125, 0.672607421875, 0.6976318359375, 0.72265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 7.0, 25.0, 38.0, 40.0, 75.0, 127.0, 164.0, 249.0, 453.0, 768.0, 1452.0, 2654.0, 4900.0, 9494.0, 19177.0, 44054.0, 118558.0, 315669.0, 322440.0, 122402.0, 45191.0, 19709.0, 9678.0, 4881.0, 2756.0, 1478.0, 834.0, 489.0, 287.0, 165.0, 101.0, 76.0, 45.0, 33.0, 15.0, 13.0, 14.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17897987365722656, -0.17338943481445312, -0.1677989959716797, -0.16220855712890625, -0.1566181182861328, -0.15102767944335938, -0.14543724060058594, -0.1398468017578125, -0.13425636291503906, -0.12866592407226562, -0.12307548522949219, -0.11748504638671875, -0.11189460754394531, -0.10630416870117188, -0.10071372985839844, -0.095123291015625, -0.08953285217285156, -0.08394241333007812, -0.07835197448730469, -0.07276153564453125, -0.06717109680175781, -0.061580657958984375, -0.05599021911621094, -0.0503997802734375, -0.04480934143066406, -0.039218902587890625, -0.03362846374511719, -0.02803802490234375, -0.022447586059570312, -0.016857147216796875, -0.011266708374023438, -0.00567626953125, -8.58306884765625e-05, 0.005504608154296875, 0.011095046997070312, 0.01668548583984375, 0.022275924682617188, 0.027866363525390625, 0.03345680236816406, 0.0390472412109375, 0.04463768005371094, 0.050228118896484375, 0.05581855773925781, 0.06140899658203125, 0.06699943542480469, 0.07258987426757812, 0.07818031311035156, 0.083770751953125, 0.08936119079589844, 0.09495162963867188, 0.10054206848144531, 0.10613250732421875, 0.11172294616699219, 0.11731338500976562, 0.12290382385253906, 0.1284942626953125, 0.13408470153808594, 0.13967514038085938, 0.1452655792236328, 0.15085601806640625, 0.1564464569091797, 0.16203689575195312, 0.16762733459472656, 0.1732177734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 11.0, 10.0, 13.0, 16.0, 29.0, 27.0, 39.0, 54.0, 87.0, 127.0, 160.0, 136.0, 78.0, 60.0, 35.0, 17.0, 19.0, 16.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.900331497192383e-05, -9.66126099228859e-05, -9.422190487384796e-05, -9.183119982481003e-05, -8.94404947757721e-05, -8.704978972673416e-05, -8.465908467769623e-05, -8.22683796286583e-05, -7.987767457962036e-05, -7.748696953058243e-05, -7.50962644815445e-05, -7.270555943250656e-05, -7.031485438346863e-05, -6.79241493344307e-05, -6.553344428539276e-05, -6.314273923635483e-05, -6.0752034187316895e-05, -5.836132913827896e-05, -5.597062408924103e-05, -5.3579919040203094e-05, -5.118921399116516e-05, -4.879850894212723e-05, -4.6407803893089294e-05, -4.401709884405136e-05, -4.162639379501343e-05, -3.9235688745975494e-05, -3.684498369693756e-05, -3.445427864789963e-05, -3.2063573598861694e-05, -2.967286854982376e-05, -2.7282163500785828e-05, -2.4891458451747894e-05, -2.250075340270996e-05, -2.0110048353672028e-05, -1.7719343304634094e-05, -1.532863825559616e-05, -1.2937933206558228e-05, -1.0547228157520294e-05, -8.15652310848236e-06, -5.7658180594444275e-06, -3.375113010406494e-06, -9.844079613685608e-07, 1.4062970876693726e-06, 3.797002136707306e-06, 6.187707185745239e-06, 8.578412234783173e-06, 1.0969117283821106e-05, 1.335982233285904e-05, 1.5750527381896973e-05, 1.8141232430934906e-05, 2.053193747997284e-05, 2.2922642529010773e-05, 2.5313347578048706e-05, 2.770405262708664e-05, 3.0094757676124573e-05, 3.2485462725162506e-05, 3.487616777420044e-05, 3.726687282323837e-05, 3.9657577872276306e-05, 4.204828292131424e-05, 4.443898797035217e-05, 4.6829693019390106e-05, 4.922039806842804e-05, 5.161110311746597e-05, 5.4001808166503906e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 10.0, 23.0, 25.0, 34.0, 42.0, 53.0, 79.0, 116.0, 162.0, 261.0, 445.0, 833.0, 1518.0, 2993.0, 6322.0, 13882.0, 34152.0, 95058.0, 253053.0, 353626.0, 178279.0, 63362.0, 23961.0, 10389.0, 4641.0, 2326.0, 1173.0, 626.0, 407.0, 199.0, 137.0, 100.0, 66.0, 47.0, 38.0, 18.0, 24.0, 16.0, 17.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17333984375, -0.16797447204589844, -0.16260910034179688, -0.1572437286376953, -0.15187835693359375, -0.1465129852294922, -0.14114761352539062, -0.13578224182128906, -0.1304168701171875, -0.12505149841308594, -0.11968612670898438, -0.11432075500488281, -0.10895538330078125, -0.10359001159667969, -0.09822463989257812, -0.09285926818847656, -0.087493896484375, -0.08212852478027344, -0.07676315307617188, -0.07139778137207031, -0.06603240966796875, -0.06066703796386719, -0.055301666259765625, -0.04993629455566406, -0.0445709228515625, -0.03920555114746094, -0.033840179443359375, -0.028474807739257812, -0.02310943603515625, -0.017744064331054688, -0.012378692626953125, -0.0070133209228515625, -0.00164794921875, 0.0037174224853515625, 0.009082794189453125, 0.014448165893554688, 0.01981353759765625, 0.025178909301757812, 0.030544281005859375, 0.03590965270996094, 0.0412750244140625, 0.04664039611816406, 0.052005767822265625, 0.05737113952636719, 0.06273651123046875, 0.06810188293457031, 0.07346725463867188, 0.07883262634277344, 0.084197998046875, 0.08956336975097656, 0.09492874145507812, 0.10029411315917969, 0.10565948486328125, 0.11102485656738281, 0.11639022827148438, 0.12175559997558594, 0.1271209716796875, 0.13248634338378906, 0.13785171508789062, 0.1432170867919922, 0.14858245849609375, 0.1539478302001953, 0.15931320190429688, 0.16467857360839844, 0.1700439453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 10.0, 12.0, 9.0, 24.0, 28.0, 30.0, 41.0, 32.0, 49.0, 54.0, 74.0, 78.0, 84.0, 70.0, 65.0, 64.0, 44.0, 57.0, 39.0, 36.0, 18.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.22997093200683594, -0.22312545776367188, -0.2162799835205078, -0.20943450927734375, -0.2025890350341797, -0.19574356079101562, -0.18889808654785156, -0.1820526123046875, -0.17520713806152344, -0.16836166381835938, -0.1615161895751953, -0.15467071533203125, -0.1478252410888672, -0.14097976684570312, -0.13413429260253906, -0.127288818359375, -0.12044334411621094, -0.11359786987304688, -0.10675239562988281, -0.09990692138671875, -0.09306144714355469, -0.08621597290039062, -0.07937049865722656, -0.0725250244140625, -0.06567955017089844, -0.058834075927734375, -0.05198860168457031, -0.04514312744140625, -0.03829765319824219, -0.031452178955078125, -0.024606704711914062, -0.01776123046875, -0.010915756225585938, -0.004070281982421875, 0.0027751922607421875, 0.00962066650390625, 0.016466140747070312, 0.023311614990234375, 0.030157089233398438, 0.0370025634765625, 0.04384803771972656, 0.050693511962890625, 0.05753898620605469, 0.06438446044921875, 0.07122993469238281, 0.07807540893554688, 0.08492088317871094, 0.091766357421875, 0.09861183166503906, 0.10545730590820312, 0.11230278015136719, 0.11914825439453125, 0.1259937286376953, 0.13283920288085938, 0.13968467712402344, 0.1465301513671875, 0.15337562561035156, 0.16022109985351562, 0.1670665740966797, 0.17391204833984375, 0.1807575225830078, 0.18760299682617188, 0.19444847106933594, 0.2012939453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 17.0, 29.0, 96.0, 180.0, 220.0, 202.0, 147.0, 64.0, 22.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.009251117706299, -4.861154556274414, -4.713057994842529, -4.5649614334106445, -4.416865348815918, -4.268768787384033, -4.120672225952148, -3.9725756645202637, -3.824479103088379, -3.676382541656494, -3.5282859802246094, -3.3801896572113037, -3.232093095779419, -3.083996534347534, -2.9359002113342285, -2.7878036499023438, -2.639707088470459, -2.491610527038574, -2.3435139656066895, -2.195417642593384, -2.047321081161499, -1.8992245197296143, -1.751128077507019, -1.6030316352844238, -1.454935073852539, -1.3068385124206543, -1.158742070198059, -1.0106456279754639, -0.8625490665435791, -0.7144525647163391, -0.5663560628890991, -0.4182596206665039, -0.27016353607177734, -0.12206703424453735, 0.026029467582702637, 0.17412596940994263, 0.3222224712371826, 0.4703189730644226, 0.6184154748916626, 0.7665119171142578, 0.9146084785461426, 1.0627050399780273, 1.2108014822006226, 1.3588979244232178, 1.5069944858551025, 1.6550910472869873, 1.8031874895095825, 1.9512839317321777, 2.0993804931640625, 2.2474770545959473, 2.395573616027832, 2.5436699390411377, 2.6917665004730225, 2.8398630619049072, 2.987959384918213, 3.1360559463500977, 3.2841525077819824, 3.432249069213867, 3.580345630645752, 3.7284419536590576, 3.8765385150909424, 4.024634838104248, 4.172731399536133, 4.320827960968018, 4.468924522399902]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 4.0, 10.0, 3.0, 12.0, 8.0, 17.0, 19.0, 24.0, 19.0, 21.0, 30.0, 27.0, 30.0, 25.0, 34.0, 29.0, 43.0, 38.0, 55.0, 39.0, 26.0, 56.0, 51.0, 34.0, 49.0, 44.0, 38.0, 27.0, 29.0, 21.0, 17.0, 24.0, 13.0, 17.0, 11.0, 7.0, 6.0, 14.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8780732154846191, -1.820070743560791, -1.762068271636963, -1.7040657997131348, -1.6460633277893066, -1.5880608558654785, -1.5300583839416504, -1.4720559120178223, -1.4140534400939941, -1.356050968170166, -1.298048496246338, -1.2400460243225098, -1.1820435523986816, -1.1240410804748535, -1.0660386085510254, -1.0080361366271973, -0.9500337243080139, -0.8920312523841858, -0.8340287804603577, -0.7760263085365295, -0.7180238366127014, -0.6600214242935181, -0.6020189523696899, -0.5440164804458618, -0.4860139787197113, -0.4280115067958832, -0.37000903487205505, -0.3120065927505493, -0.2540041208267212, -0.19600164890289307, -0.13799917697906494, -0.07999670505523682, -0.02199423313140869, 0.036008235067129135, 0.09401070326566696, 0.1520131677389145, 0.21001563966274261, 0.26801809668540955, 0.32602056860923767, 0.3840230405330658, 0.4420255124568939, 0.5000279545783997, 0.5580304265022278, 0.6160328984260559, 0.674035370349884, 0.7320378422737122, 0.7900403141975403, 0.8480427861213684, 0.9060452580451965, 0.9640477299690247, 1.022050142288208, 1.0800526142120361, 1.1380550861358643, 1.1960575580596924, 1.2540600299835205, 1.3120625019073486, 1.3700649738311768, 1.4280674457550049, 1.486069917678833, 1.5440723896026611, 1.6020748615264893, 1.6600773334503174, 1.7180798053741455, 1.7760822772979736, 1.8340847492218018]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 10.0, 7.0, 10.0, 13.0, 17.0, 22.0, 31.0, 45.0, 52.0, 100.0, 184.0, 393.0, 879.0, 2265.0, 5808.0, 15325.0, 42805.0, 137936.0, 561904.0, 1693543.0, 1269216.0, 329915.0, 87188.0, 29235.0, 10619.0, 3875.0, 1527.0, 630.0, 300.0, 143.0, 100.0, 36.0, 36.0, 33.0, 24.0, 7.0, 12.0, 9.0, 8.0, 1.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.37841796875, -0.36652374267578125, -0.3546295166015625, -0.34273529052734375, -0.330841064453125, -0.31894683837890625, -0.3070526123046875, -0.29515838623046875, -0.28326416015625, -0.27136993408203125, -0.2594757080078125, -0.24758148193359375, -0.235687255859375, -0.22379302978515625, -0.2118988037109375, -0.20000457763671875, -0.1881103515625, -0.17621612548828125, -0.1643218994140625, -0.15242767333984375, -0.140533447265625, -0.12863922119140625, -0.1167449951171875, -0.10485076904296875, -0.09295654296875, -0.08106231689453125, -0.0691680908203125, -0.05727386474609375, -0.045379638671875, -0.03348541259765625, -0.0215911865234375, -0.00969696044921875, 0.002197265625, 0.01409149169921875, 0.0259857177734375, 0.03787994384765625, 0.049774169921875, 0.06166839599609375, 0.0735626220703125, 0.08545684814453125, 0.09735107421875, 0.10924530029296875, 0.1211395263671875, 0.13303375244140625, 0.144927978515625, 0.15682220458984375, 0.1687164306640625, 0.18061065673828125, 0.1925048828125, 0.20439910888671875, 0.2162933349609375, 0.22818756103515625, 0.240081787109375, 0.25197601318359375, 0.2638702392578125, 0.27576446533203125, 0.28765869140625, 0.29955291748046875, 0.3114471435546875, 0.32334136962890625, 0.335235595703125, 0.34712982177734375, 0.3590240478515625, 0.37091827392578125, 0.3828125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 1.0, 5.0, 2.0, 7.0, 9.0, 5.0, 9.0, 11.0, 9.0, 13.0, 16.0, 20.0, 17.0, 24.0, 22.0, 19.0, 29.0, 38.0, 39.0, 35.0, 35.0, 39.0, 29.0, 45.0, 42.0, 39.0, 35.0, 39.0, 38.0, 35.0, 31.0, 31.0, 24.0, 20.0, 28.0, 21.0, 19.0, 21.0, 13.0, 14.0, 18.0, 16.0, 2.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2186279296875, -0.211456298828125, -0.20428466796875, -0.197113037109375, -0.18994140625, -0.182769775390625, -0.17559814453125, -0.168426513671875, -0.1612548828125, -0.154083251953125, -0.14691162109375, -0.139739990234375, -0.132568359375, -0.125396728515625, -0.11822509765625, -0.111053466796875, -0.1038818359375, -0.096710205078125, -0.08953857421875, -0.082366943359375, -0.0751953125, -0.068023681640625, -0.06085205078125, -0.053680419921875, -0.0465087890625, -0.039337158203125, -0.03216552734375, -0.024993896484375, -0.017822265625, -0.010650634765625, -0.00347900390625, 0.003692626953125, 0.0108642578125, 0.018035888671875, 0.02520751953125, 0.032379150390625, 0.03955078125, 0.046722412109375, 0.05389404296875, 0.061065673828125, 0.0682373046875, 0.075408935546875, 0.08258056640625, 0.089752197265625, 0.096923828125, 0.104095458984375, 0.11126708984375, 0.118438720703125, 0.1256103515625, 0.132781982421875, 0.13995361328125, 0.147125244140625, 0.154296875, 0.161468505859375, 0.16864013671875, 0.175811767578125, 0.1829833984375, 0.190155029296875, 0.19732666015625, 0.204498291015625, 0.211669921875, 0.218841552734375, 0.22601318359375, 0.233184814453125, 0.2403564453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 18.0, 22.0, 54.0, 58.0, 121.0, 199.0, 378.0, 662.0, 1335.0, 2962.0, 7414.0, 23105.0, 85013.0, 398170.0, 2389776.0, 1052696.0, 169273.0, 42078.0, 12422.0, 4410.0, 1929.0, 957.0, 503.0, 278.0, 137.0, 89.0, 68.0, 41.0, 27.0, 20.0, 7.0, 13.0, 10.0, 5.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5774078369140625, -0.558624267578125, -0.5398406982421875, -0.52105712890625, -0.5022735595703125, -0.483489990234375, -0.4647064208984375, -0.4459228515625, -0.4271392822265625, -0.408355712890625, -0.3895721435546875, -0.37078857421875, -0.3520050048828125, -0.333221435546875, -0.3144378662109375, -0.295654296875, -0.2768707275390625, -0.258087158203125, -0.2393035888671875, -0.22052001953125, -0.2017364501953125, -0.182952880859375, -0.1641693115234375, -0.1453857421875, -0.1266021728515625, -0.107818603515625, -0.0890350341796875, -0.07025146484375, -0.0514678955078125, -0.032684326171875, -0.0139007568359375, 0.0048828125, 0.0236663818359375, 0.042449951171875, 0.0612335205078125, 0.08001708984375, 0.0988006591796875, 0.117584228515625, 0.1363677978515625, 0.1551513671875, 0.1739349365234375, 0.192718505859375, 0.2115020751953125, 0.23028564453125, 0.2490692138671875, 0.267852783203125, 0.2866363525390625, 0.305419921875, 0.3242034912109375, 0.342987060546875, 0.3617706298828125, 0.38055419921875, 0.3993377685546875, 0.418121337890625, 0.4369049072265625, 0.4556884765625, 0.4744720458984375, 0.493255615234375, 0.5120391845703125, 0.53082275390625, 0.5496063232421875, 0.568389892578125, 0.5871734619140625, 0.60595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 14.0, 3.0, 14.0, 13.0, 18.0, 22.0, 32.0, 54.0, 57.0, 66.0, 92.0, 143.0, 211.0, 291.0, 420.0, 528.0, 546.0, 450.0, 309.0, 223.0, 133.0, 101.0, 68.0, 59.0, 60.0, 28.0, 29.0, 20.0, 14.0, 10.0, 13.0, 3.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.459564208984375, -0.44256591796875, -0.425567626953125, -0.4085693359375, -0.391571044921875, -0.37457275390625, -0.357574462890625, -0.340576171875, -0.323577880859375, -0.30657958984375, -0.289581298828125, -0.2725830078125, -0.255584716796875, -0.23858642578125, -0.221588134765625, -0.20458984375, -0.187591552734375, -0.17059326171875, -0.153594970703125, -0.1365966796875, -0.119598388671875, -0.10260009765625, -0.085601806640625, -0.068603515625, -0.051605224609375, -0.03460693359375, -0.017608642578125, -0.0006103515625, 0.016387939453125, 0.03338623046875, 0.050384521484375, 0.0673828125, 0.084381103515625, 0.10137939453125, 0.118377685546875, 0.1353759765625, 0.152374267578125, 0.16937255859375, 0.186370849609375, 0.203369140625, 0.220367431640625, 0.23736572265625, 0.254364013671875, 0.2713623046875, 0.288360595703125, 0.30535888671875, 0.322357177734375, 0.33935546875, 0.356353759765625, 0.37335205078125, 0.390350341796875, 0.4073486328125, 0.424346923828125, 0.44134521484375, 0.458343505859375, 0.475341796875, 0.492340087890625, 0.50933837890625, 0.526336669921875, 0.5433349609375, 0.560333251953125, 0.57733154296875, 0.594329833984375, 0.611328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 18.0, 25.0, 51.0, 91.0, 154.0, 173.0, 188.0, 145.0, 83.0, 33.0, 17.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9025442600250244, -2.7388224601745605, -2.5751004219055176, -2.4113783836364746, -2.2476565837860107, -2.083934783935547, -1.920212745666504, -1.7564908266067505, -1.592768907546997, -1.4290469884872437, -1.2653250694274902, -1.1016031503677368, -0.9378812313079834, -0.77415931224823, -0.6104373931884766, -0.44671547412872314, -0.2829935550689697, -0.11927163600921631, 0.04445028305053711, 0.20817220211029053, 0.37189412117004395, 0.5356160402297974, 0.6993379592895508, 0.8630598783493042, 1.0267817974090576, 1.190503716468811, 1.3542256355285645, 1.5179475545883179, 1.6816694736480713, 1.8453913927078247, 2.009113311767578, 2.172835350036621, 2.336557388305664, 2.500279426574707, 2.664001226425171, 2.8277230262756348, 2.9914450645446777, 3.1551671028137207, 3.3188889026641846, 3.4826107025146484, 3.6463327407836914, 3.8100547790527344, 3.9737765789031982, 4.137498378753662, 4.301220417022705, 4.464942455291748, 4.628664016723633, 4.792386054992676, 4.956108093261719, 5.119830131530762, 5.283552169799805, 5.4472737312316895, 5.610995769500732, 5.774717807769775, 5.93843936920166, 6.102161407470703, 6.265883445739746, 6.429605484008789, 6.593327522277832, 6.757049083709717, 6.92077112197876, 7.084493160247803, 7.2482147216796875, 7.4119367599487305, 7.575658798217773]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 5.0, 10.0, 14.0, 18.0, 20.0, 29.0, 29.0, 45.0, 38.0, 42.0, 57.0, 31.0, 43.0, 47.0, 50.0, 45.0, 58.0, 48.0, 59.0, 33.0, 35.0, 34.0, 35.0, 35.0, 17.0, 18.0, 16.0, 16.0, 11.0, 10.0, 10.0, 2.0, 3.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0], "bins": [-2.575913429260254, -2.5085458755493164, -2.441178321838379, -2.3738107681274414, -2.306443214416504, -2.2390758991241455, -2.171708345413208, -2.1043407917022705, -2.036973237991333, -1.9696056842803955, -1.902238130569458, -1.83487069606781, -1.7675031423568726, -1.700135588645935, -1.632768154144287, -1.5654006004333496, -1.498033046722412, -1.4306654930114746, -1.363297939300537, -1.2959305047988892, -1.2285629510879517, -1.1611953973770142, -1.0938279628753662, -1.0264604091644287, -0.9590928554534912, -0.8917253017425537, -0.824357807636261, -0.7569903135299683, -0.6896227598190308, -0.6222552061080933, -0.5548877120018005, -0.4875201880931854, -0.4201526641845703, -0.3527851402759552, -0.2854176163673401, -0.21805009245872498, -0.15068256855010986, -0.08331504464149475, -0.01594752073287964, 0.051420003175735474, 0.11878752708435059, 0.1861550509929657, 0.2535225749015808, 0.3208900988101959, 0.38825762271881104, 0.45562514662742615, 0.5229926705360413, 0.590360164642334, 0.6577277183532715, 0.725095272064209, 0.7924627661705017, 0.8598302602767944, 0.9271978139877319, 0.9945653676986694, 1.0619328022003174, 1.1293003559112549, 1.1966679096221924, 1.2640354633331299, 1.3314030170440674, 1.3987704515457153, 1.4661380052566528, 1.5335055589675903, 1.6008729934692383, 1.6682405471801758, 1.7356081008911133]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 12.0, 13.0, 18.0, 30.0, 39.0, 66.0, 91.0, 164.0, 323.0, 570.0, 1118.0, 2231.0, 4623.0, 10036.0, 23311.0, 56035.0, 129886.0, 233217.0, 265266.0, 175900.0, 83218.0, 34849.0, 14583.0, 6671.0, 3031.0, 1520.0, 779.0, 398.0, 208.0, 140.0, 76.0, 36.0, 41.0, 20.0, 17.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3187751770019531, -0.30918121337890625, -0.2995872497558594, -0.2899932861328125, -0.2803993225097656, -0.27080535888671875, -0.2612113952636719, -0.251617431640625, -0.24202346801757812, -0.23242950439453125, -0.22283554077148438, -0.2132415771484375, -0.20364761352539062, -0.19405364990234375, -0.18445968627929688, -0.17486572265625, -0.16527175903320312, -0.15567779541015625, -0.14608383178710938, -0.1364898681640625, -0.12689590454101562, -0.11730194091796875, -0.10770797729492188, -0.098114013671875, -0.08852005004882812, -0.07892608642578125, -0.06933212280273438, -0.0597381591796875, -0.050144195556640625, -0.04055023193359375, -0.030956268310546875, -0.0213623046875, -0.011768341064453125, -0.00217437744140625, 0.007419586181640625, 0.0170135498046875, 0.026607513427734375, 0.03620147705078125, 0.045795440673828125, 0.055389404296875, 0.06498336791992188, 0.07457733154296875, 0.08417129516601562, 0.0937652587890625, 0.10335922241210938, 0.11295318603515625, 0.12254714965820312, 0.13214111328125, 0.14173507690429688, 0.15132904052734375, 0.16092300415039062, 0.1705169677734375, 0.18011093139648438, 0.18970489501953125, 0.19929885864257812, 0.208892822265625, 0.21848678588867188, 0.22808074951171875, 0.23767471313476562, 0.2472686767578125, 0.2568626403808594, 0.26645660400390625, 0.2760505676269531, 0.28564453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 7.0, 11.0, 6.0, 8.0, 18.0, 23.0, 14.0, 29.0, 31.0, 29.0, 29.0, 30.0, 39.0, 31.0, 32.0, 50.0, 38.0, 28.0, 29.0, 37.0, 44.0, 35.0, 34.0, 40.0, 31.0, 25.0, 31.0, 33.0, 29.0, 21.0, 17.0, 15.0, 25.0, 19.0, 11.0, 9.0, 11.0, 5.0, 5.0, 8.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19067001342773438, -0.18370819091796875, -0.17674636840820312, -0.1697845458984375, -0.16282272338867188, -0.15586090087890625, -0.14889907836914062, -0.141937255859375, -0.13497543334960938, -0.12801361083984375, -0.12105178833007812, -0.1140899658203125, -0.10712814331054688, -0.10016632080078125, -0.09320449829101562, -0.08624267578125, -0.07928085327148438, -0.07231903076171875, -0.06535720825195312, -0.0583953857421875, -0.051433563232421875, -0.04447174072265625, -0.037509918212890625, -0.030548095703125, -0.023586273193359375, -0.01662445068359375, -0.009662628173828125, -0.0027008056640625, 0.004261016845703125, 0.01122283935546875, 0.018184661865234375, 0.025146484375, 0.032108306884765625, 0.03907012939453125, 0.046031951904296875, 0.0529937744140625, 0.059955596923828125, 0.06691741943359375, 0.07387924194335938, 0.080841064453125, 0.08780288696289062, 0.09476470947265625, 0.10172653198242188, 0.1086883544921875, 0.11565017700195312, 0.12261199951171875, 0.12957382202148438, 0.13653564453125, 0.14349746704101562, 0.15045928955078125, 0.15742111206054688, 0.1643829345703125, 0.17134475708007812, 0.17830657958984375, 0.18526840209960938, 0.192230224609375, 0.19919204711914062, 0.20615386962890625, 0.21311569213867188, 0.2200775146484375, 0.22703933715820312, 0.23400115966796875, 0.24096298217773438, 0.2479248046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 18.0, 21.0, 23.0, 43.0, 62.0, 78.0, 125.0, 219.0, 408.0, 787.0, 1723.0, 3919.0, 9232.0, 23914.0, 69961.0, 196517.0, 348962.0, 245736.0, 93648.0, 32215.0, 11884.0, 4796.0, 2054.0, 964.0, 508.0, 254.0, 149.0, 88.0, 66.0, 43.0, 27.0, 22.0, 11.0, 15.0, 11.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.44287109375, -0.430084228515625, -0.41729736328125, -0.404510498046875, -0.3917236328125, -0.378936767578125, -0.36614990234375, -0.353363037109375, -0.340576171875, -0.327789306640625, -0.31500244140625, -0.302215576171875, -0.2894287109375, -0.276641845703125, -0.26385498046875, -0.251068115234375, -0.23828125, -0.225494384765625, -0.21270751953125, -0.199920654296875, -0.1871337890625, -0.174346923828125, -0.16156005859375, -0.148773193359375, -0.135986328125, -0.123199462890625, -0.11041259765625, -0.097625732421875, -0.0848388671875, -0.072052001953125, -0.05926513671875, -0.046478271484375, -0.03369140625, -0.020904541015625, -0.00811767578125, 0.004669189453125, 0.0174560546875, 0.030242919921875, 0.04302978515625, 0.055816650390625, 0.068603515625, 0.081390380859375, 0.09417724609375, 0.106964111328125, 0.1197509765625, 0.132537841796875, 0.14532470703125, 0.158111572265625, 0.1708984375, 0.183685302734375, 0.19647216796875, 0.209259033203125, 0.2220458984375, 0.234832763671875, 0.24761962890625, 0.260406494140625, 0.273193359375, 0.285980224609375, 0.29876708984375, 0.311553955078125, 0.3243408203125, 0.337127685546875, 0.34991455078125, 0.362701416015625, 0.37548828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 8.0, 9.0, 17.0, 19.0, 17.0, 24.0, 25.0, 24.0, 26.0, 29.0, 34.0, 34.0, 34.0, 35.0, 30.0, 32.0, 46.0, 54.0, 35.0, 31.0, 37.0, 39.0, 32.0, 31.0, 30.0, 36.0, 22.0, 29.0, 20.0, 21.0, 16.0, 19.0, 14.0, 16.0, 7.0, 3.0, 12.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.6552734375, -0.6363677978515625, -0.617462158203125, -0.5985565185546875, -0.57965087890625, -0.5607452392578125, -0.541839599609375, -0.5229339599609375, -0.5040283203125, -0.4851226806640625, -0.466217041015625, -0.4473114013671875, -0.42840576171875, -0.4095001220703125, -0.390594482421875, -0.3716888427734375, -0.352783203125, -0.3338775634765625, -0.314971923828125, -0.2960662841796875, -0.27716064453125, -0.2582550048828125, -0.239349365234375, -0.2204437255859375, -0.2015380859375, -0.1826324462890625, -0.163726806640625, -0.1448211669921875, -0.12591552734375, -0.1070098876953125, -0.088104248046875, -0.0691986083984375, -0.05029296875, -0.0313873291015625, -0.012481689453125, 0.0064239501953125, 0.02532958984375, 0.0442352294921875, 0.063140869140625, 0.0820465087890625, 0.1009521484375, 0.1198577880859375, 0.138763427734375, 0.1576690673828125, 0.17657470703125, 0.1954803466796875, 0.214385986328125, 0.2332916259765625, 0.252197265625, 0.2711029052734375, 0.290008544921875, 0.3089141845703125, 0.32781982421875, 0.3467254638671875, 0.365631103515625, 0.3845367431640625, 0.4034423828125, 0.4223480224609375, 0.441253662109375, 0.4601593017578125, 0.47906494140625, 0.4979705810546875, 0.516876220703125, 0.5357818603515625, 0.5546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 11.0, 8.0, 17.0, 28.0, 29.0, 56.0, 78.0, 155.0, 217.0, 387.0, 734.0, 1417.0, 3037.0, 6742.0, 15578.0, 38777.0, 98407.0, 232189.0, 322014.0, 194739.0, 78806.0, 31234.0, 12981.0, 5645.0, 2562.0, 1246.0, 604.0, 327.0, 201.0, 96.0, 68.0, 49.0, 36.0, 12.0, 17.0, 9.0, 10.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1580810546875, -0.1528778076171875, -0.147674560546875, -0.1424713134765625, -0.13726806640625, -0.1320648193359375, -0.126861572265625, -0.1216583251953125, -0.116455078125, -0.1112518310546875, -0.106048583984375, -0.1008453369140625, -0.09564208984375, -0.0904388427734375, -0.085235595703125, -0.0800323486328125, -0.0748291015625, -0.0696258544921875, -0.064422607421875, -0.0592193603515625, -0.05401611328125, -0.0488128662109375, -0.043609619140625, -0.0384063720703125, -0.033203125, -0.0279998779296875, -0.022796630859375, -0.0175933837890625, -0.01239013671875, -0.0071868896484375, -0.001983642578125, 0.0032196044921875, 0.0084228515625, 0.0136260986328125, 0.018829345703125, 0.0240325927734375, 0.02923583984375, 0.0344390869140625, 0.039642333984375, 0.0448455810546875, 0.050048828125, 0.0552520751953125, 0.060455322265625, 0.0656585693359375, 0.07086181640625, 0.0760650634765625, 0.081268310546875, 0.0864715576171875, 0.0916748046875, 0.0968780517578125, 0.102081298828125, 0.1072845458984375, 0.11248779296875, 0.1176910400390625, 0.122894287109375, 0.1280975341796875, 0.13330078125, 0.1385040283203125, 0.143707275390625, 0.1489105224609375, 0.15411376953125, 0.1593170166015625, 0.164520263671875, 0.1697235107421875, 0.1749267578125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 17.0, 12.0, 26.0, 27.0, 34.0, 27.0, 53.0, 57.0, 54.0, 76.0, 83.0, 91.0, 65.0, 66.0, 44.0, 46.0, 44.0, 29.0, 28.0, 15.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.07099723815918e-05, -3.935955464839935e-05, -3.800913691520691e-05, -3.6658719182014465e-05, -3.530830144882202e-05, -3.395788371562958e-05, -3.2607465982437134e-05, -3.125704824924469e-05, -2.9906630516052246e-05, -2.8556212782859802e-05, -2.720579504966736e-05, -2.5855377316474915e-05, -2.450495958328247e-05, -2.3154541850090027e-05, -2.1804124116897583e-05, -2.045370638370514e-05, -1.9103288650512695e-05, -1.775287091732025e-05, -1.6402453184127808e-05, -1.5052035450935364e-05, -1.370161771774292e-05, -1.2351199984550476e-05, -1.1000782251358032e-05, -9.650364518165588e-06, -8.299946784973145e-06, -6.949529051780701e-06, -5.599111318588257e-06, -4.248693585395813e-06, -2.898275852203369e-06, -1.5478581190109253e-06, -1.9744038581848145e-07, 1.1529773473739624e-06, 2.5033950805664062e-06, 3.85381281375885e-06, 5.204230546951294e-06, 6.554648280143738e-06, 7.905066013336182e-06, 9.255483746528625e-06, 1.060590147972107e-05, 1.1956319212913513e-05, 1.3306736946105957e-05, 1.4657154679298401e-05, 1.6007572412490845e-05, 1.735799014568329e-05, 1.8708407878875732e-05, 2.0058825612068176e-05, 2.140924334526062e-05, 2.2759661078453064e-05, 2.4110078811645508e-05, 2.546049654483795e-05, 2.6810914278030396e-05, 2.816133201122284e-05, 2.9511749744415283e-05, 3.086216747760773e-05, 3.221258521080017e-05, 3.3563002943992615e-05, 3.491342067718506e-05, 3.62638384103775e-05, 3.7614256143569946e-05, 3.896467387676239e-05, 4.0315091609954834e-05, 4.166550934314728e-05, 4.301592707633972e-05, 4.4366344809532166e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 9.0, 16.0, 17.0, 37.0, 55.0, 98.0, 177.0, 233.0, 471.0, 883.0, 1594.0, 3696.0, 8788.0, 21493.0, 54856.0, 135787.0, 272025.0, 288124.0, 154521.0, 62881.0, 24512.0, 10089.0, 4110.0, 1844.0, 934.0, 535.0, 280.0, 155.0, 93.0, 77.0, 53.0, 29.0, 16.0, 21.0, 7.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.183837890625, -0.17859649658203125, -0.1733551025390625, -0.16811370849609375, -0.162872314453125, -0.15763092041015625, -0.1523895263671875, -0.14714813232421875, -0.14190673828125, -0.13666534423828125, -0.1314239501953125, -0.12618255615234375, -0.120941162109375, -0.11569976806640625, -0.1104583740234375, -0.10521697998046875, -0.0999755859375, -0.09473419189453125, -0.0894927978515625, -0.08425140380859375, -0.079010009765625, -0.07376861572265625, -0.0685272216796875, -0.06328582763671875, -0.05804443359375, -0.05280303955078125, -0.0475616455078125, -0.04232025146484375, -0.037078857421875, -0.03183746337890625, -0.0265960693359375, -0.02135467529296875, -0.01611328125, -0.01087188720703125, -0.0056304931640625, -0.00038909912109375, 0.004852294921875, 0.01009368896484375, 0.0153350830078125, 0.02057647705078125, 0.02581787109375, 0.03105926513671875, 0.0363006591796875, 0.04154205322265625, 0.046783447265625, 0.05202484130859375, 0.0572662353515625, 0.06250762939453125, 0.0677490234375, 0.07299041748046875, 0.0782318115234375, 0.08347320556640625, 0.088714599609375, 0.09395599365234375, 0.0991973876953125, 0.10443878173828125, 0.10968017578125, 0.11492156982421875, 0.1201629638671875, 0.12540435791015625, 0.130645751953125, 0.13588714599609375, 0.1411285400390625, 0.14636993408203125, 0.151611328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 6.0, 12.0, 16.0, 12.0, 20.0, 17.0, 39.0, 38.0, 35.0, 45.0, 58.0, 44.0, 62.0, 70.0, 67.0, 48.0, 52.0, 56.0, 49.0, 32.0, 32.0, 27.0, 21.0, 17.0, 24.0, 16.0, 6.0, 6.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.147705078125, -0.1431713104248047, -0.13863754272460938, -0.13410377502441406, -0.12957000732421875, -0.12503623962402344, -0.12050247192382812, -0.11596870422363281, -0.1114349365234375, -0.10690116882324219, -0.10236740112304688, -0.09783363342285156, -0.09329986572265625, -0.08876609802246094, -0.08423233032226562, -0.07969856262207031, -0.075164794921875, -0.07063102722167969, -0.06609725952148438, -0.06156349182128906, -0.05702972412109375, -0.05249595642089844, -0.047962188720703125, -0.04342842102050781, -0.0388946533203125, -0.03436088562011719, -0.029827117919921875, -0.025293350219726562, -0.02075958251953125, -0.016225814819335938, -0.011692047119140625, -0.0071582794189453125, -0.00262451171875, 0.0019092559814453125, 0.006443023681640625, 0.010976791381835938, 0.01551055908203125, 0.020044326782226562, 0.024578094482421875, 0.029111862182617188, 0.0336456298828125, 0.03817939758300781, 0.042713165283203125, 0.04724693298339844, 0.05178070068359375, 0.05631446838378906, 0.060848236083984375, 0.06538200378417969, 0.069915771484375, 0.07444953918457031, 0.07898330688476562, 0.08351707458496094, 0.08805084228515625, 0.09258460998535156, 0.09711837768554688, 0.10165214538574219, 0.1061859130859375, 0.11071968078613281, 0.11525344848632812, 0.11978721618652344, 0.12432098388671875, 0.12885475158691406, 0.13338851928710938, 0.1379222869873047, 0.1424560546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 13.0, 31.0, 133.0, 303.0, 325.0, 136.0, 49.0, 13.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125173568725586, -2.9417195320129395, -2.758265256881714, -2.5748112201690674, -2.391356945037842, -2.2079029083251953, -2.024448871612549, -1.8409947156906128, -1.6575405597686768, -1.4740864038467407, -1.2906322479248047, -1.1071782112121582, -0.9237240552902222, -0.7402698993682861, -0.5568158626556396, -0.3733617067337036, -0.18990755081176758, -0.006453424692153931, 0.17700070142745972, 0.360454797744751, 0.543908953666687, 0.727363109588623, 0.9108171463012695, 1.0942713022232056, 1.2777254581451416, 1.4611796140670776, 1.6446337699890137, 1.8280878067016602, 2.0115418434143066, 2.1949961185455322, 2.3784501552581787, 2.5619044303894043, 2.745358467102051, 2.9288125038146973, 3.112266778945923, 3.2957208156585693, 3.479175090789795, 3.6626291275024414, 3.846083164215088, 4.029537200927734, 4.212991714477539, 4.3964457511901855, 4.579899787902832, 4.763354301452637, 4.946808338165283, 5.13026237487793, 5.313716411590576, 5.497170448303223, 5.680624485015869, 5.864078521728516, 6.047532558441162, 6.230986595153809, 6.414441108703613, 6.59789514541626, 6.781349182128906, 6.964803218841553, 7.148257255554199, 7.331711292266846, 7.515165328979492, 7.698619842529297, 7.882073879241943, 8.06552791595459, 8.248981475830078, 8.432435989379883, 8.615890502929688]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 15.0, 6.0, 16.0, 21.0, 27.0, 22.0, 34.0, 26.0, 26.0, 32.0, 35.0, 37.0, 31.0, 38.0, 41.0, 46.0, 28.0, 49.0, 42.0, 48.0, 41.0, 39.0, 34.0, 31.0, 27.0, 24.0, 27.0, 31.0, 12.0, 19.0, 13.0, 12.0, 7.0, 12.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.80169677734375, -1.7469565868377686, -1.6922165155410767, -1.6374764442443848, -1.5827362537384033, -1.5279960632324219, -1.47325599193573, -1.418515920639038, -1.3637757301330566, -1.3090355396270752, -1.2542954683303833, -1.1995553970336914, -1.14481520652771, -1.0900750160217285, -1.0353349447250366, -0.9805948138237, -0.9258546829223633, -0.8711145520210266, -0.8163744211196899, -0.7616342902183533, -0.7068941593170166, -0.6521540284156799, -0.5974138975143433, -0.5426737666130066, -0.4879336357116699, -0.43319350481033325, -0.3784533739089966, -0.3237132430076599, -0.26897311210632324, -0.21423298120498657, -0.1594928503036499, -0.10475271940231323, -0.05001258850097656, 0.004727542400360107, 0.05946767330169678, 0.11420780420303345, 0.16894793510437012, 0.2236880660057068, 0.27842819690704346, 0.3331683278083801, 0.3879084587097168, 0.44264858961105347, 0.49738872051239014, 0.5521288514137268, 0.6068689823150635, 0.6616091132164001, 0.7163492441177368, 0.7710893750190735, 0.8258295059204102, 0.8805696368217468, 0.9353097677230835, 0.9900498986244202, 1.0447900295257568, 1.0995302200317383, 1.1542702913284302, 1.209010362625122, 1.2637505531311035, 1.318490743637085, 1.3732308149337769, 1.4279708862304688, 1.4827110767364502, 1.5374512672424316, 1.5921913385391235, 1.6469314098358154, 1.7016716003417969]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 10.0, 11.0, 24.0, 17.0, 38.0, 36.0, 48.0, 89.0, 117.0, 184.0, 395.0, 846.0, 2288.0, 7613.0, 33460.0, 194052.0, 1238050.0, 2105048.0, 511361.0, 78762.0, 15502.0, 3909.0, 1239.0, 516.0, 241.0, 126.0, 81.0, 48.0, 50.0, 23.0, 22.0, 10.0, 12.0, 9.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.4792366027832031, -0.46482086181640625, -0.4504051208496094, -0.4359893798828125, -0.4215736389160156, -0.40715789794921875, -0.3927421569824219, -0.378326416015625, -0.3639106750488281, -0.34949493408203125, -0.3350791931152344, -0.3206634521484375, -0.3062477111816406, -0.29183197021484375, -0.2774162292480469, -0.26300048828125, -0.24858474731445312, -0.23416900634765625, -0.21975326538085938, -0.2053375244140625, -0.19092178344726562, -0.17650604248046875, -0.16209030151367188, -0.147674560546875, -0.13325881958007812, -0.11884307861328125, -0.10442733764648438, -0.0900115966796875, -0.07559585571289062, -0.06118011474609375, -0.046764373779296875, -0.0323486328125, -0.017932891845703125, -0.00351715087890625, 0.010898590087890625, 0.0253143310546875, 0.039730072021484375, 0.05414581298828125, 0.06856155395507812, 0.082977294921875, 0.09739303588867188, 0.11180877685546875, 0.12622451782226562, 0.1406402587890625, 0.15505599975585938, 0.16947174072265625, 0.18388748168945312, 0.19830322265625, 0.21271896362304688, 0.22713470458984375, 0.24155044555664062, 0.2559661865234375, 0.2703819274902344, 0.28479766845703125, 0.2992134094238281, 0.313629150390625, 0.3280448913574219, 0.34246063232421875, 0.3568763732910156, 0.3712921142578125, 0.3857078552246094, 0.40012359619140625, 0.4145393371582031, 0.428955078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 13.0, 7.0, 22.0, 17.0, 19.0, 18.0, 23.0, 29.0, 31.0, 28.0, 30.0, 35.0, 43.0, 34.0, 67.0, 44.0, 47.0, 42.0, 37.0, 43.0, 42.0, 34.0, 39.0, 43.0, 23.0, 27.0, 28.0, 26.0, 19.0, 14.0, 7.0, 10.0, 6.0, 7.0, 4.0, 1.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.26827239990234375, -0.2596893310546875, -0.25110626220703125, -0.242523193359375, -0.23394012451171875, -0.2253570556640625, -0.21677398681640625, -0.20819091796875, -0.19960784912109375, -0.1910247802734375, -0.18244171142578125, -0.173858642578125, -0.16527557373046875, -0.1566925048828125, -0.14810943603515625, -0.1395263671875, -0.13094329833984375, -0.1223602294921875, -0.11377716064453125, -0.105194091796875, -0.09661102294921875, -0.0880279541015625, -0.07944488525390625, -0.07086181640625, -0.06227874755859375, -0.0536956787109375, -0.04511260986328125, -0.036529541015625, -0.02794647216796875, -0.0193634033203125, -0.01078033447265625, -0.002197265625, 0.00638580322265625, 0.0149688720703125, 0.02355194091796875, 0.032135009765625, 0.04071807861328125, 0.0493011474609375, 0.05788421630859375, 0.06646728515625, 0.07505035400390625, 0.0836334228515625, 0.09221649169921875, 0.100799560546875, 0.10938262939453125, 0.1179656982421875, 0.12654876708984375, 0.1351318359375, 0.14371490478515625, 0.1522979736328125, 0.16088104248046875, 0.169464111328125, 0.17804718017578125, 0.1866302490234375, 0.19521331787109375, 0.20379638671875, 0.21237945556640625, 0.2209625244140625, 0.22954559326171875, 0.238128662109375, 0.24671173095703125, 0.2552947998046875, 0.26387786865234375, 0.2724609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 12.0, 24.0, 42.0, 47.0, 78.0, 118.0, 179.0, 302.0, 569.0, 1021.0, 2117.0, 5606.0, 16735.0, 60251.0, 294149.0, 2053007.0, 1487028.0, 205467.0, 45712.0, 13099.0, 4692.0, 1893.0, 907.0, 492.0, 280.0, 148.0, 88.0, 58.0, 44.0, 37.0, 15.0, 11.0, 9.0, 8.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4817237854003906, -0.46613311767578125, -0.4505424499511719, -0.4349517822265625, -0.4193611145019531, -0.40377044677734375, -0.3881797790527344, -0.372589111328125, -0.3569984436035156, -0.34140777587890625, -0.3258171081542969, -0.3102264404296875, -0.2946357727050781, -0.27904510498046875, -0.2634544372558594, -0.24786376953125, -0.23227310180664062, -0.21668243408203125, -0.20109176635742188, -0.1855010986328125, -0.16991043090820312, -0.15431976318359375, -0.13872909545898438, -0.123138427734375, -0.10754776000976562, -0.09195709228515625, -0.07636642456054688, -0.0607757568359375, -0.045185089111328125, -0.02959442138671875, -0.014003753662109375, 0.0015869140625, 0.017177581787109375, 0.03276824951171875, 0.048358917236328125, 0.0639495849609375, 0.07954025268554688, 0.09513092041015625, 0.11072158813476562, 0.126312255859375, 0.14190292358398438, 0.15749359130859375, 0.17308425903320312, 0.1886749267578125, 0.20426559448242188, 0.21985626220703125, 0.23544692993164062, 0.25103759765625, 0.2666282653808594, 0.28221893310546875, 0.2978096008300781, 0.3134002685546875, 0.3289909362792969, 0.34458160400390625, 0.3601722717285156, 0.375762939453125, 0.3913536071777344, 0.40694427490234375, 0.4225349426269531, 0.4381256103515625, 0.4537162780761719, 0.46930694580078125, 0.4848976135253906, 0.50048828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 26.0, 29.0, 43.0, 60.0, 95.0, 138.0, 213.0, 388.0, 531.0, 672.0, 652.0, 428.0, 291.0, 158.0, 98.0, 63.0, 32.0, 35.0, 23.0, 15.0, 15.0, 13.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5504684448242188, -0.5330657958984375, -0.5156631469726562, -0.498260498046875, -0.48085784912109375, -0.4634552001953125, -0.44605255126953125, -0.42864990234375, -0.41124725341796875, -0.3938446044921875, -0.37644195556640625, -0.359039306640625, -0.34163665771484375, -0.3242340087890625, -0.30683135986328125, -0.2894287109375, -0.27202606201171875, -0.2546234130859375, -0.23722076416015625, -0.219818115234375, -0.20241546630859375, -0.1850128173828125, -0.16761016845703125, -0.15020751953125, -0.13280487060546875, -0.1154022216796875, -0.09799957275390625, -0.080596923828125, -0.06319427490234375, -0.0457916259765625, -0.02838897705078125, -0.010986328125, 0.00641632080078125, 0.0238189697265625, 0.04122161865234375, 0.058624267578125, 0.07602691650390625, 0.0934295654296875, 0.11083221435546875, 0.12823486328125, 0.14563751220703125, 0.1630401611328125, 0.18044281005859375, 0.197845458984375, 0.21524810791015625, 0.2326507568359375, 0.25005340576171875, 0.2674560546875, 0.28485870361328125, 0.3022613525390625, 0.31966400146484375, 0.337066650390625, 0.35446929931640625, 0.3718719482421875, 0.38927459716796875, 0.40667724609375, 0.42407989501953125, 0.4414825439453125, 0.45888519287109375, 0.476287841796875, 0.49369049072265625, 0.5110931396484375, 0.5284957885742188, 0.5458984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 7.0, 13.0, 30.0, 57.0, 85.0, 146.0, 129.0, 158.0, 152.0, 90.0, 57.0, 34.0, 16.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4671103954315186, -3.3625025749206543, -3.257894992828369, -3.153287172317505, -3.0486793518066406, -2.9440717697143555, -2.839463949203491, -2.734856128692627, -2.630248546600342, -2.5256407260894775, -2.4210331439971924, -2.316425323486328, -2.211817502975464, -2.1072096824645996, -2.0026021003723145, -1.8979942798614502, -1.793386459350586, -1.6887787580490112, -1.584170937538147, -1.4795632362365723, -1.374955415725708, -1.2703477144241333, -1.1657400131225586, -1.0611321926116943, -0.9565244913101196, -0.8519167304039001, -0.7473089694976807, -0.642701268196106, -0.5380935072898865, -0.433485746383667, -0.3288780450820923, -0.2242702841758728, -0.11966228485107422, -0.01505453884601593, 0.08955320715904236, 0.19416093826293945, 0.29876869916915894, 0.4033764600753784, 0.5079841613769531, 0.6125919222831726, 0.7171996831893921, 0.8218074440956116, 0.926415205001831, 1.0310229063034058, 1.1356306076049805, 1.2402384281158447, 1.3448461294174194, 1.4494538307189941, 1.5540616512298584, 1.658669352531433, 1.7632771730422974, 1.867884874343872, 1.9724926948547363, 2.0771002769470215, 2.1817080974578857, 2.28631591796875, 2.390923500061035, 2.4955313205718994, 2.6001389026641846, 2.704746723175049, 2.809354543685913, 2.9139623641967773, 3.0185699462890625, 3.1231777667999268, 3.227785587310791]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 10.0, 17.0, 15.0, 21.0, 24.0, 24.0, 32.0, 26.0, 23.0, 29.0, 43.0, 41.0, 37.0, 43.0, 38.0, 46.0, 37.0, 43.0, 27.0, 40.0, 42.0, 26.0, 29.0, 33.0, 30.0, 29.0, 28.0, 30.0, 15.0, 19.0, 14.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.4681293964385986, -1.4269018173217773, -1.3856743574142456, -1.3444467782974243, -1.3032193183898926, -1.2619917392730713, -1.2207642793655396, -1.1795367002487183, -1.1383092403411865, -1.0970816612243652, -1.0558542013168335, -1.0146266222000122, -0.9733991622924805, -0.9321715831756592, -0.8909440636634827, -0.8497165441513062, -0.8084889650344849, -0.7672614455223083, -0.7260339260101318, -0.6848064064979553, -0.6435788869857788, -0.6023513078689575, -0.561123788356781, -0.5198962688446045, -0.478668749332428, -0.43744122982025146, -0.39621371030807495, -0.35498616099357605, -0.31375864148139954, -0.272531121969223, -0.23130358755588531, -0.1900760531425476, -0.1488485336303711, -0.10762100666761398, -0.06639347970485687, -0.025165952742099762, 0.01606157422065735, 0.05728909373283386, 0.09851662814617157, 0.13974416255950928, 0.1809716820716858, 0.2221992015838623, 0.2634267210960388, 0.3046542704105377, 0.34588178992271423, 0.38710930943489075, 0.42833685874938965, 0.46956437826156616, 0.5107918977737427, 0.5520194172859192, 0.5932469367980957, 0.6344744563102722, 0.6757019758224487, 0.71692955493927, 0.7581570744514465, 0.799384593963623, 0.8406121134757996, 0.8818396329879761, 0.9230671525001526, 0.9642946720123291, 1.0055222511291504, 1.0467497110366821, 1.0879772901535034, 1.1292047500610352, 1.1704323291778564]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 12.0, 16.0, 27.0, 25.0, 31.0, 48.0, 64.0, 117.0, 170.0, 270.0, 445.0, 712.0, 1135.0, 2105.0, 3597.0, 6349.0, 11993.0, 24709.0, 58479.0, 145657.0, 284903.0, 272446.0, 133199.0, 53508.0, 22964.0, 11125.0, 6155.0, 3426.0, 1918.0, 1114.0, 644.0, 401.0, 256.0, 151.0, 102.0, 67.0, 56.0, 26.0, 32.0, 25.0, 19.0, 12.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.38671875, -0.3759613037109375, -0.365203857421875, -0.3544464111328125, -0.34368896484375, -0.3329315185546875, -0.322174072265625, -0.3114166259765625, -0.3006591796875, -0.2899017333984375, -0.279144287109375, -0.2683868408203125, -0.25762939453125, -0.2468719482421875, -0.236114501953125, -0.2253570556640625, -0.214599609375, -0.2038421630859375, -0.193084716796875, -0.1823272705078125, -0.17156982421875, -0.1608123779296875, -0.150054931640625, -0.1392974853515625, -0.1285400390625, -0.1177825927734375, -0.107025146484375, -0.0962677001953125, -0.08551025390625, -0.0747528076171875, -0.063995361328125, -0.0532379150390625, -0.04248046875, -0.0317230224609375, -0.020965576171875, -0.0102081298828125, 0.00054931640625, 0.0113067626953125, 0.022064208984375, 0.0328216552734375, 0.0435791015625, 0.0543365478515625, 0.065093994140625, 0.0758514404296875, 0.08660888671875, 0.0973663330078125, 0.108123779296875, 0.1188812255859375, 0.129638671875, 0.1403961181640625, 0.151153564453125, 0.1619110107421875, 0.17266845703125, 0.1834259033203125, 0.194183349609375, 0.2049407958984375, 0.2156982421875, 0.2264556884765625, 0.237213134765625, 0.2479705810546875, 0.25872802734375, 0.2694854736328125, 0.280242919921875, 0.2910003662109375, 0.3017578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 14.0, 19.0, 4.0, 16.0, 17.0, 18.0, 18.0, 22.0, 23.0, 27.0, 29.0, 43.0, 41.0, 30.0, 41.0, 31.0, 47.0, 38.0, 44.0, 56.0, 35.0, 47.0, 36.0, 36.0, 35.0, 27.0, 35.0, 28.0, 24.0, 25.0, 20.0, 14.0, 11.0, 7.0, 11.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.281982421875, -0.2738456726074219, -0.26570892333984375, -0.2575721740722656, -0.2494354248046875, -0.24129867553710938, -0.23316192626953125, -0.22502517700195312, -0.216888427734375, -0.20875167846679688, -0.20061492919921875, -0.19247817993164062, -0.1843414306640625, -0.17620468139648438, -0.16806793212890625, -0.15993118286132812, -0.15179443359375, -0.14365768432617188, -0.13552093505859375, -0.12738418579101562, -0.1192474365234375, -0.11111068725585938, -0.10297393798828125, -0.09483718872070312, -0.086700439453125, -0.07856369018554688, -0.07042694091796875, -0.062290191650390625, -0.0541534423828125, -0.046016693115234375, -0.03787994384765625, -0.029743194580078125, -0.0216064453125, -0.013469696044921875, -0.00533294677734375, 0.002803802490234375, 0.0109405517578125, 0.019077301025390625, 0.02721405029296875, 0.035350799560546875, 0.043487548828125, 0.051624298095703125, 0.05976104736328125, 0.06789779663085938, 0.0760345458984375, 0.08417129516601562, 0.09230804443359375, 0.10044479370117188, 0.10858154296875, 0.11671829223632812, 0.12485504150390625, 0.13299179077148438, 0.1411285400390625, 0.14926528930664062, 0.15740203857421875, 0.16553878784179688, 0.173675537109375, 0.18181228637695312, 0.18994903564453125, 0.19808578491210938, 0.2062225341796875, 0.21435928344726562, 0.22249603271484375, 0.23063278198242188, 0.23876953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 2.0, 10.0, 10.0, 9.0, 24.0, 26.0, 37.0, 47.0, 62.0, 128.0, 203.0, 348.0, 614.0, 1310.0, 2861.0, 6690.0, 16551.0, 47702.0, 166776.0, 416963.0, 268812.0, 77250.0, 24788.0, 9446.0, 4056.0, 1861.0, 858.0, 436.0, 264.0, 154.0, 81.0, 57.0, 40.0, 23.0, 18.0, 10.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.50732421875, -0.4918098449707031, -0.47629547119140625, -0.4607810974121094, -0.4452667236328125, -0.4297523498535156, -0.41423797607421875, -0.3987236022949219, -0.383209228515625, -0.3676948547363281, -0.35218048095703125, -0.3366661071777344, -0.3211517333984375, -0.3056373596191406, -0.29012298583984375, -0.2746086120605469, -0.25909423828125, -0.24357986450195312, -0.22806549072265625, -0.21255111694335938, -0.1970367431640625, -0.18152236938476562, -0.16600799560546875, -0.15049362182617188, -0.134979248046875, -0.11946487426757812, -0.10395050048828125, -0.08843612670898438, -0.0729217529296875, -0.057407379150390625, -0.04189300537109375, -0.026378631591796875, -0.0108642578125, 0.004650115966796875, 0.02016448974609375, 0.035678863525390625, 0.0511932373046875, 0.06670761108398438, 0.08222198486328125, 0.09773635864257812, 0.113250732421875, 0.12876510620117188, 0.14427947998046875, 0.15979385375976562, 0.1753082275390625, 0.19082260131835938, 0.20633697509765625, 0.22185134887695312, 0.23736572265625, 0.2528800964355469, 0.26839447021484375, 0.2839088439941406, 0.2994232177734375, 0.3149375915527344, 0.33045196533203125, 0.3459663391113281, 0.361480712890625, 0.3769950866699219, 0.39250946044921875, 0.4080238342285156, 0.4235382080078125, 0.4390525817871094, 0.45456695556640625, 0.4700813293457031, 0.485595703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 9.0, 12.0, 17.0, 20.0, 25.0, 22.0, 14.0, 34.0, 29.0, 37.0, 40.0, 33.0, 44.0, 49.0, 38.0, 37.0, 43.0, 40.0, 41.0, 47.0, 38.0, 31.0, 25.0, 30.0, 35.0, 29.0, 16.0, 26.0, 16.0, 22.0, 11.0, 12.0, 15.0, 8.0, 6.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.7685546875, -0.7467498779296875, -0.724945068359375, -0.7031402587890625, -0.68133544921875, -0.6595306396484375, -0.637725830078125, -0.6159210205078125, -0.5941162109375, -0.5723114013671875, -0.550506591796875, -0.5287017822265625, -0.50689697265625, -0.4850921630859375, -0.463287353515625, -0.4414825439453125, -0.419677734375, -0.3978729248046875, -0.376068115234375, -0.3542633056640625, -0.33245849609375, -0.3106536865234375, -0.288848876953125, -0.2670440673828125, -0.2452392578125, -0.2234344482421875, -0.201629638671875, -0.1798248291015625, -0.15802001953125, -0.1362152099609375, -0.114410400390625, -0.0926055908203125, -0.07080078125, -0.0489959716796875, -0.027191162109375, -0.0053863525390625, 0.01641845703125, 0.0382232666015625, 0.060028076171875, 0.0818328857421875, 0.1036376953125, 0.1254425048828125, 0.147247314453125, 0.1690521240234375, 0.19085693359375, 0.2126617431640625, 0.234466552734375, 0.2562713623046875, 0.278076171875, 0.2998809814453125, 0.321685791015625, 0.3434906005859375, 0.36529541015625, 0.3871002197265625, 0.408905029296875, 0.4307098388671875, 0.4525146484375, 0.4743194580078125, 0.496124267578125, 0.5179290771484375, 0.53973388671875, 0.5615386962890625, 0.583343505859375, 0.6051483154296875, 0.626953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 12.0, 23.0, 24.0, 50.0, 120.0, 188.0, 406.0, 819.0, 1643.0, 3486.0, 7504.0, 16670.0, 42278.0, 127163.0, 345550.0, 323122.0, 112650.0, 38301.0, 15361.0, 6870.0, 3187.0, 1533.0, 795.0, 388.0, 179.0, 109.0, 56.0, 28.0, 15.0, 13.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143310546875, -0.13799285888671875, -0.1326751708984375, -0.12735748291015625, -0.122039794921875, -0.11672210693359375, -0.1114044189453125, -0.10608673095703125, -0.10076904296875, -0.09545135498046875, -0.0901336669921875, -0.08481597900390625, -0.079498291015625, -0.07418060302734375, -0.0688629150390625, -0.06354522705078125, -0.0582275390625, -0.05290985107421875, -0.0475921630859375, -0.04227447509765625, -0.036956787109375, -0.03163909912109375, -0.0263214111328125, -0.02100372314453125, -0.01568603515625, -0.01036834716796875, -0.0050506591796875, 0.00026702880859375, 0.005584716796875, 0.01090240478515625, 0.0162200927734375, 0.02153778076171875, 0.02685546875, 0.03217315673828125, 0.0374908447265625, 0.04280853271484375, 0.048126220703125, 0.05344390869140625, 0.0587615966796875, 0.06407928466796875, 0.06939697265625, 0.07471466064453125, 0.0800323486328125, 0.08535003662109375, 0.090667724609375, 0.09598541259765625, 0.1013031005859375, 0.10662078857421875, 0.1119384765625, 0.11725616455078125, 0.1225738525390625, 0.12789154052734375, 0.133209228515625, 0.13852691650390625, 0.1438446044921875, 0.14916229248046875, 0.15447998046875, 0.15979766845703125, 0.1651153564453125, 0.17043304443359375, 0.175750732421875, 0.18106842041015625, 0.1863861083984375, 0.19170379638671875, 0.197021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 5.0, 6.0, 10.0, 10.0, 11.0, 13.0, 32.0, 34.0, 47.0, 60.0, 91.0, 110.0, 127.0, 92.0, 79.0, 56.0, 43.0, 33.0, 20.0, 16.0, 17.0, 14.0, 13.0, 6.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-6.109476089477539e-05, -5.951337516307831e-05, -5.7931989431381226e-05, -5.635060369968414e-05, -5.476921796798706e-05, -5.318783223628998e-05, -5.1606446504592896e-05, -5.002506077289581e-05, -4.844367504119873e-05, -4.686228930950165e-05, -4.5280903577804565e-05, -4.369951784610748e-05, -4.21181321144104e-05, -4.053674638271332e-05, -3.8955360651016235e-05, -3.737397491931915e-05, -3.579258918762207e-05, -3.421120345592499e-05, -3.2629817724227905e-05, -3.104843199253082e-05, -2.946704626083374e-05, -2.7885660529136658e-05, -2.6304274797439575e-05, -2.4722889065742493e-05, -2.314150333404541e-05, -2.1560117602348328e-05, -1.9978731870651245e-05, -1.8397346138954163e-05, -1.681596040725708e-05, -1.5234574675559998e-05, -1.3653188943862915e-05, -1.2071803212165833e-05, -1.049041748046875e-05, -8.909031748771667e-06, -7.327646017074585e-06, -5.7462602853775024e-06, -4.16487455368042e-06, -2.5834888219833374e-06, -1.0021030902862549e-06, 5.792826414108276e-07, 2.16066837310791e-06, 3.7420541048049927e-06, 5.323439836502075e-06, 6.904825568199158e-06, 8.48621129989624e-06, 1.0067597031593323e-05, 1.1648982763290405e-05, 1.3230368494987488e-05, 1.481175422668457e-05, 1.6393139958381653e-05, 1.7974525690078735e-05, 1.9555911421775818e-05, 2.11372971534729e-05, 2.2718682885169983e-05, 2.4300068616867065e-05, 2.5881454348564148e-05, 2.746284008026123e-05, 2.9044225811958313e-05, 3.0625611543655396e-05, 3.220699727535248e-05, 3.378838300704956e-05, 3.536976873874664e-05, 3.6951154470443726e-05, 3.853254020214081e-05, 4.011392593383789e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 8.0, 15.0, 15.0, 35.0, 48.0, 75.0, 150.0, 288.0, 683.0, 1916.0, 5530.0, 17513.0, 56996.0, 195989.0, 416114.0, 246387.0, 73542.0, 22216.0, 6996.0, 2455.0, 837.0, 338.0, 166.0, 92.0, 52.0, 27.0, 21.0, 20.0, 8.0, 5.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1708984375, -0.16470718383789062, -0.15851593017578125, -0.15232467651367188, -0.1461334228515625, -0.13994216918945312, -0.13375091552734375, -0.12755966186523438, -0.121368408203125, -0.11517715454101562, -0.10898590087890625, -0.10279464721679688, -0.0966033935546875, -0.09041213989257812, -0.08422088623046875, -0.07802963256835938, -0.07183837890625, -0.06564712524414062, -0.05945587158203125, -0.053264617919921875, -0.0470733642578125, -0.040882110595703125, -0.03469085693359375, -0.028499603271484375, -0.022308349609375, -0.016117095947265625, -0.00992584228515625, -0.003734588623046875, 0.0024566650390625, 0.008647918701171875, 0.01483917236328125, 0.021030426025390625, 0.0272216796875, 0.033412933349609375, 0.03960418701171875, 0.045795440673828125, 0.0519866943359375, 0.058177947998046875, 0.06436920166015625, 0.07056045532226562, 0.076751708984375, 0.08294296264648438, 0.08913421630859375, 0.09532546997070312, 0.1015167236328125, 0.10770797729492188, 0.11389923095703125, 0.12009048461914062, 0.12628173828125, 0.13247299194335938, 0.13866424560546875, 0.14485549926757812, 0.1510467529296875, 0.15723800659179688, 0.16342926025390625, 0.16962051391601562, 0.175811767578125, 0.18200302124023438, 0.18819427490234375, 0.19438552856445312, 0.2005767822265625, 0.20676803588867188, 0.21295928955078125, 0.21915054321289062, 0.225341796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 2.0, 9.0, 8.0, 19.0, 19.0, 16.0, 48.0, 45.0, 54.0, 62.0, 74.0, 80.0, 93.0, 72.0, 80.0, 63.0, 51.0, 34.0, 30.0, 20.0, 24.0, 24.0, 10.0, 13.0, 8.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17490768432617188, -0.16951751708984375, -0.16412734985351562, -0.1587371826171875, -0.15334701538085938, -0.14795684814453125, -0.14256668090820312, -0.137176513671875, -0.13178634643554688, -0.12639617919921875, -0.12100601196289062, -0.1156158447265625, -0.11022567749023438, -0.10483551025390625, -0.09944534301757812, -0.09405517578125, -0.08866500854492188, -0.08327484130859375, -0.07788467407226562, -0.0724945068359375, -0.06710433959960938, -0.06171417236328125, -0.056324005126953125, -0.050933837890625, -0.045543670654296875, -0.04015350341796875, -0.034763336181640625, -0.0293731689453125, -0.023983001708984375, -0.01859283447265625, -0.013202667236328125, -0.0078125, -0.002422332763671875, 0.00296783447265625, 0.008358001708984375, 0.0137481689453125, 0.019138336181640625, 0.02452850341796875, 0.029918670654296875, 0.035308837890625, 0.040699005126953125, 0.04608917236328125, 0.051479339599609375, 0.0568695068359375, 0.062259674072265625, 0.06764984130859375, 0.07304000854492188, 0.07843017578125, 0.08382034301757812, 0.08921051025390625, 0.09460067749023438, 0.0999908447265625, 0.10538101196289062, 0.11077117919921875, 0.11616134643554688, 0.121551513671875, 0.12694168090820312, 0.13233184814453125, 0.13772201538085938, 0.1431121826171875, 0.14850234985351562, 0.15389251708984375, 0.15928268432617188, 0.1646728515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 14.0, 18.0, 36.0, 42.0, 83.0, 119.0, 113.0, 142.0, 119.0, 103.0, 74.0, 49.0, 17.0, 21.0, 11.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8853745460510254, -1.8137964010238647, -1.742218255996704, -1.670640230178833, -1.5990620851516724, -1.5274839401245117, -1.4559059143066406, -1.38432776927948, -1.3127496242523193, -1.2411714792251587, -1.169593334197998, -1.098015308380127, -1.0264371633529663, -0.9548590183258057, -0.8832809329032898, -0.8117028474807739, -0.7401247024536133, -0.6685465574264526, -0.5969684720039368, -0.5253903865814209, -0.45381224155426025, -0.382234126329422, -0.31065601110458374, -0.23907792568206787, -0.16749978065490723, -0.09592166543006897, -0.024343550205230713, 0.047234565019607544, 0.1188126802444458, 0.19039079546928406, 0.2619689106941223, 0.3335469961166382, 0.40512537956237793, 0.4767034947872162, 0.5482816100120544, 0.6198596954345703, 0.691437840461731, 0.7630159854888916, 0.8345940709114075, 0.9061721563339233, 0.977750301361084, 1.0493284463882446, 1.1209065914154053, 1.1924846172332764, 1.264062762260437, 1.3356409072875977, 1.4072189331054688, 1.4787970781326294, 1.55037522315979, 1.6219533681869507, 1.6935315132141113, 1.7651095390319824, 1.836687684059143, 1.9082658290863037, 1.9798438549041748, 2.051422119140625, 2.123000144958496, 2.194578170776367, 2.2661564350128174, 2.3377344608306885, 2.4093127250671387, 2.4808907508850098, 2.552468776702881, 2.624046802520752, 2.695625066757202]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 17.0, 5.0, 8.0, 8.0, 11.0, 22.0, 25.0, 18.0, 20.0, 28.0, 33.0, 35.0, 33.0, 44.0, 37.0, 35.0, 42.0, 48.0, 44.0, 38.0, 42.0, 40.0, 38.0, 37.0, 33.0, 36.0, 32.0, 29.0, 30.0, 24.0, 23.0, 11.0, 11.0, 14.0, 8.0, 12.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6571247577667236, -1.5989245176315308, -1.540724277496338, -1.4825239181518555, -1.4243236780166626, -1.3661234378814697, -1.3079230785369873, -1.2497228384017944, -1.1915225982666016, -1.1333223581314087, -1.0751221179962158, -1.0169217586517334, -0.9587215185165405, -0.9005212783813477, -0.84232097864151, -0.7841206789016724, -0.7259204387664795, -0.6677201986312866, -0.609519898891449, -0.5513195991516113, -0.49311935901641846, -0.4349190890789032, -0.37671881914138794, -0.3185185492038727, -0.2603182792663574, -0.20211800932884216, -0.1439177393913269, -0.08571746945381165, -0.027517199516296387, 0.030683070421218872, 0.08888334035873413, 0.1470836102962494, 0.20528388023376465, 0.2634841501712799, 0.32168442010879517, 0.3798846900463104, 0.4380849599838257, 0.49628522992134094, 0.5544854998588562, 0.6126857995986938, 0.6708860397338867, 0.7290862798690796, 0.7872865796089172, 0.8454868793487549, 0.9036871194839478, 0.9618873596191406, 1.020087718963623, 1.078287959098816, 1.1364881992340088, 1.1946884393692017, 1.2528886795043945, 1.311089038848877, 1.3692892789840698, 1.4274895191192627, 1.4856898784637451, 1.543890118598938, 1.6020903587341309, 1.6602905988693237, 1.7184908390045166, 1.776691198348999, 1.834891438484192, 1.8930916786193848, 1.9512920379638672, 2.0094921588897705, 2.067692518234253]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 13.0, 15.0, 13.0, 18.0, 33.0, 46.0, 62.0, 92.0, 125.0, 224.0, 358.0, 536.0, 895.0, 1501.0, 2437.0, 4345.0, 7687.0, 14211.0, 27013.0, 52089.0, 100668.0, 187164.0, 328147.0, 527203.0, 718974.0, 755633.0, 598379.0, 387061.0, 220718.0, 119877.0, 64072.0, 33792.0, 18126.0, 9887.0, 5233.0, 2998.0, 1774.0, 1117.0, 624.0, 392.0, 264.0, 155.0, 107.0, 67.0, 49.0, 29.0, 21.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1498546600341797, -0.14504623413085938, -0.14023780822753906, -0.13542938232421875, -0.13062095642089844, -0.12581253051757812, -0.12100410461425781, -0.1161956787109375, -0.11138725280761719, -0.10657882690429688, -0.10177040100097656, -0.09696197509765625, -0.09215354919433594, -0.08734512329101562, -0.08253669738769531, -0.077728271484375, -0.07291984558105469, -0.06811141967773438, -0.06330299377441406, -0.05849456787109375, -0.05368614196777344, -0.048877716064453125, -0.04406929016113281, -0.0392608642578125, -0.03445243835449219, -0.029644012451171875, -0.024835586547851562, -0.02002716064453125, -0.015218734741210938, -0.010410308837890625, -0.0056018829345703125, -0.00079345703125, 0.0040149688720703125, 0.008823394775390625, 0.013631820678710938, 0.01844024658203125, 0.023248672485351562, 0.028057098388671875, 0.03286552429199219, 0.0376739501953125, 0.04248237609863281, 0.047290802001953125, 0.05209922790527344, 0.05690765380859375, 0.06171607971191406, 0.06652450561523438, 0.07133293151855469, 0.076141357421875, 0.08094978332519531, 0.08575820922851562, 0.09056663513183594, 0.09537506103515625, 0.10018348693847656, 0.10499191284179688, 0.10980033874511719, 0.1146087646484375, 0.11941719055175781, 0.12422561645507812, 0.12903404235839844, 0.13384246826171875, 0.13865089416503906, 0.14345932006835938, 0.1482677459716797, 0.153076171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 9.0, 11.0, 12.0, 18.0, 19.0, 23.0, 25.0, 26.0, 42.0, 39.0, 44.0, 47.0, 49.0, 44.0, 34.0, 37.0, 51.0, 37.0, 45.0, 40.0, 48.0, 39.0, 34.0, 33.0, 27.0, 24.0, 16.0, 18.0, 12.0, 11.0, 9.0, 13.0, 7.0, 9.0, 6.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.293212890625, -0.2842674255371094, -0.27532196044921875, -0.2663764953613281, -0.2574310302734375, -0.24848556518554688, -0.23954010009765625, -0.23059463500976562, -0.221649169921875, -0.21270370483398438, -0.20375823974609375, -0.19481277465820312, -0.1858673095703125, -0.17692184448242188, -0.16797637939453125, -0.15903091430664062, -0.15008544921875, -0.14113998413085938, -0.13219451904296875, -0.12324905395507812, -0.1143035888671875, -0.10535812377929688, -0.09641265869140625, -0.08746719360351562, -0.078521728515625, -0.06957626342773438, -0.06063079833984375, -0.051685333251953125, -0.0427398681640625, -0.033794403076171875, -0.02484893798828125, -0.015903472900390625, -0.0069580078125, 0.001987457275390625, 0.01093292236328125, 0.019878387451171875, 0.0288238525390625, 0.037769317626953125, 0.04671478271484375, 0.055660247802734375, 0.064605712890625, 0.07355117797851562, 0.08249664306640625, 0.09144210815429688, 0.1003875732421875, 0.10933303833007812, 0.11827850341796875, 0.12722396850585938, 0.13616943359375, 0.14511489868164062, 0.15406036376953125, 0.16300582885742188, 0.1719512939453125, 0.18089675903320312, 0.18984222412109375, 0.19878768920898438, 0.207733154296875, 0.21667861938476562, 0.22562408447265625, 0.23456954956054688, 0.2435150146484375, 0.2524604797363281, 0.26140594482421875, 0.2703514099121094, 0.279296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 11.0, 20.0, 35.0, 51.0, 68.0, 119.0, 248.0, 495.0, 1028.0, 2596.0, 7517.0, 28384.0, 141288.0, 1026129.0, 2440387.0, 449078.0, 72327.0, 16421.0, 4771.0, 1693.0, 750.0, 391.0, 174.0, 116.0, 70.0, 36.0, 23.0, 15.0, 15.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3539886474609375, -0.337371826171875, -0.3207550048828125, -0.30413818359375, -0.2875213623046875, -0.270904541015625, -0.2542877197265625, -0.2376708984375, -0.2210540771484375, -0.204437255859375, -0.1878204345703125, -0.17120361328125, -0.1545867919921875, -0.137969970703125, -0.1213531494140625, -0.104736328125, -0.0881195068359375, -0.071502685546875, -0.0548858642578125, -0.03826904296875, -0.0216522216796875, -0.005035400390625, 0.0115814208984375, 0.0281982421875, 0.0448150634765625, 0.061431884765625, 0.0780487060546875, 0.09466552734375, 0.1112823486328125, 0.127899169921875, 0.1445159912109375, 0.1611328125, 0.1777496337890625, 0.194366455078125, 0.2109832763671875, 0.22760009765625, 0.2442169189453125, 0.260833740234375, 0.2774505615234375, 0.2940673828125, 0.3106842041015625, 0.327301025390625, 0.3439178466796875, 0.36053466796875, 0.3771514892578125, 0.393768310546875, 0.4103851318359375, 0.427001953125, 0.4436187744140625, 0.460235595703125, 0.4768524169921875, 0.49346923828125, 0.5100860595703125, 0.526702880859375, 0.5433197021484375, 0.5599365234375, 0.5765533447265625, 0.593170166015625, 0.6097869873046875, 0.62640380859375, 0.6430206298828125, 0.659637451171875, 0.6762542724609375, 0.69287109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 10.0, 13.0, 23.0, 26.0, 38.0, 64.0, 70.0, 130.0, 183.0, 278.0, 405.0, 502.0, 573.0, 526.0, 399.0, 261.0, 190.0, 120.0, 74.0, 54.0, 42.0, 18.0, 23.0, 16.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.4609870910644531, -0.44419097900390625, -0.4273948669433594, -0.4105987548828125, -0.3938026428222656, -0.37700653076171875, -0.3602104187011719, -0.343414306640625, -0.3266181945800781, -0.30982208251953125, -0.2930259704589844, -0.2762298583984375, -0.2594337463378906, -0.24263763427734375, -0.22584152221679688, -0.20904541015625, -0.19224929809570312, -0.17545318603515625, -0.15865707397460938, -0.1418609619140625, -0.12506484985351562, -0.10826873779296875, -0.09147262573242188, -0.074676513671875, -0.057880401611328125, -0.04108428955078125, -0.024288177490234375, -0.0074920654296875, 0.009304046630859375, 0.02610015869140625, 0.042896270751953125, 0.0596923828125, 0.07648849487304688, 0.09328460693359375, 0.11008071899414062, 0.1268768310546875, 0.14367294311523438, 0.16046905517578125, 0.17726516723632812, 0.194061279296875, 0.21085739135742188, 0.22765350341796875, 0.24444961547851562, 0.2612457275390625, 0.2780418395996094, 0.29483795166015625, 0.3116340637207031, 0.32843017578125, 0.3452262878417969, 0.36202239990234375, 0.3788185119628906, 0.3956146240234375, 0.4124107360839844, 0.42920684814453125, 0.4460029602050781, 0.462799072265625, 0.4795951843261719, 0.49639129638671875, 0.5131874084472656, 0.5299835205078125, 0.5467796325683594, 0.5635757446289062, 0.5803718566894531, 0.59716796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 12.0, 11.0, 27.0, 34.0, 58.0, 84.0, 125.0, 163.0, 168.0, 123.0, 90.0, 52.0, 21.0, 17.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3478312492370605, -3.2429308891296387, -3.138030529022217, -3.033130168914795, -2.928229808807373, -2.823329448699951, -2.71842885017395, -2.6135284900665283, -2.5086281299591064, -2.4037277698516846, -2.2988274097442627, -2.193927049636841, -2.08902645111084, -1.9841262102127075, -1.879225730895996, -1.7743253707885742, -1.6694250106811523, -1.5645246505737305, -1.4596242904663086, -1.3547238111495972, -1.2498234510421753, -1.1449230909347534, -1.040022611618042, -0.9351222515106201, -0.8302218914031982, -0.7253215312957764, -0.6204211115837097, -0.5155206918716431, -0.4106203317642212, -0.3057199716567993, -0.20081955194473267, -0.09591913223266602, 0.00898122787475586, 0.11388161778450012, 0.21878200769424438, 0.32368239760398865, 0.4285827875137329, 0.5334831476211548, 0.6383835673332214, 0.7432839870452881, 0.84818434715271, 0.9530847072601318, 1.0579850673675537, 1.1628855466842651, 1.267785906791687, 1.3726862668991089, 1.4775867462158203, 1.5824871063232422, 1.687387466430664, 1.792287826538086, 1.8971881866455078, 2.0020885467529297, 2.1069889068603516, 2.2118892669677734, 2.3167898654937744, 2.4216902256011963, 2.526590585708618, 2.63149094581604, 2.736391305923462, 2.841291666030884, 2.9461922645568848, 3.0510926246643066, 3.1559929847717285, 3.2608933448791504, 3.3657937049865723]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 6.0, 10.0, 11.0, 11.0, 19.0, 19.0, 21.0, 23.0, 41.0, 33.0, 37.0, 25.0, 32.0, 35.0, 39.0, 50.0, 51.0, 43.0, 51.0, 44.0, 52.0, 37.0, 34.0, 35.0, 36.0, 28.0, 24.0, 29.0, 16.0, 22.0, 11.0, 17.0, 12.0, 13.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5104460716247559, -1.4645224809646606, -1.4185988903045654, -1.3726751804351807, -1.3267515897750854, -1.2808279991149902, -1.234904408454895, -1.1889808177947998, -1.143057107925415, -1.0971335172653198, -1.0512099266052246, -1.0052862167358398, -0.9593626260757446, -0.9134390354156494, -0.8675154447555542, -0.8215917944908142, -0.775668203830719, -0.7297446131706238, -0.6838209629058838, -0.6378973722457886, -0.5919737219810486, -0.5460501313209534, -0.5001264810562134, -0.45420289039611816, -0.40827926993370056, -0.36235564947128296, -0.31643202900886536, -0.27050840854644775, -0.22458480298519135, -0.17866118252277374, -0.13273757696151733, -0.08681395649909973, -0.04089033603668213, 0.005033280700445175, 0.05095689743757248, 0.09688051044940948, 0.1428041309118271, 0.1887277513742447, 0.2346513569355011, 0.2805749773979187, 0.3264985978603363, 0.3724222183227539, 0.4183458387851715, 0.4642694592475891, 0.5101930499076843, 0.5561167001724243, 0.6020402908325195, 0.6479638814926147, 0.6938875317573547, 0.73981112241745, 0.7857347726821899, 0.8316583633422852, 0.8775820136070251, 0.9235056042671204, 0.9694292545318604, 1.0153528451919556, 1.0612764358520508, 1.107200026512146, 1.1531236171722412, 1.199047327041626, 1.2449709177017212, 1.2908945083618164, 1.3368180990219116, 1.3827416896820068, 1.4286653995513916]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 12.0, 14.0, 22.0, 26.0, 34.0, 64.0, 68.0, 111.0, 156.0, 264.0, 372.0, 548.0, 894.0, 1423.0, 2395.0, 3858.0, 6015.0, 10329.0, 18778.0, 39944.0, 92291.0, 190668.0, 264150.0, 210255.0, 108484.0, 46834.0, 21245.0, 11313.0, 6827.0, 4031.0, 2654.0, 1738.0, 1028.0, 598.0, 375.0, 239.0, 146.0, 111.0, 79.0, 43.0, 37.0, 21.0, 22.0, 16.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3301277160644531, -0.31967926025390625, -0.3092308044433594, -0.2987823486328125, -0.2883338928222656, -0.27788543701171875, -0.2674369812011719, -0.256988525390625, -0.24654006958007812, -0.23609161376953125, -0.22564315795898438, -0.2151947021484375, -0.20474624633789062, -0.19429779052734375, -0.18384933471679688, -0.17340087890625, -0.16295242309570312, -0.15250396728515625, -0.14205551147460938, -0.1316070556640625, -0.12115859985351562, -0.11071014404296875, -0.10026168823242188, -0.089813232421875, -0.07936477661132812, -0.06891632080078125, -0.058467864990234375, -0.0480194091796875, -0.037570953369140625, -0.02712249755859375, -0.016674041748046875, -0.0062255859375, 0.004222869873046875, 0.01467132568359375, 0.025119781494140625, 0.0355682373046875, 0.046016693115234375, 0.05646514892578125, 0.06691360473632812, 0.077362060546875, 0.08781051635742188, 0.09825897216796875, 0.10870742797851562, 0.1191558837890625, 0.12960433959960938, 0.14005279541015625, 0.15050125122070312, 0.16094970703125, 0.17139816284179688, 0.18184661865234375, 0.19229507446289062, 0.2027435302734375, 0.21319198608398438, 0.22364044189453125, 0.23408889770507812, 0.244537353515625, 0.2549858093261719, 0.26543426513671875, 0.2758827209472656, 0.2863311767578125, 0.2967796325683594, 0.30722808837890625, 0.3176765441894531, 0.328125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 7.0, 9.0, 16.0, 14.0, 14.0, 13.0, 28.0, 26.0, 30.0, 36.0, 32.0, 35.0, 45.0, 52.0, 46.0, 36.0, 40.0, 40.0, 41.0, 40.0, 38.0, 39.0, 42.0, 29.0, 35.0, 32.0, 27.0, 16.0, 24.0, 18.0, 18.0, 4.0, 15.0, 14.0, 11.0, 13.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.319580078125, -0.3108234405517578, -0.3020668029785156, -0.29331016540527344, -0.28455352783203125, -0.27579689025878906, -0.2670402526855469, -0.2582836151123047, -0.2495269775390625, -0.2407703399658203, -0.23201370239257812, -0.22325706481933594, -0.21450042724609375, -0.20574378967285156, -0.19698715209960938, -0.1882305145263672, -0.179473876953125, -0.1707172393798828, -0.16196060180664062, -0.15320396423339844, -0.14444732666015625, -0.13569068908691406, -0.12693405151367188, -0.11817741394042969, -0.1094207763671875, -0.10066413879394531, -0.09190750122070312, -0.08315086364746094, -0.07439422607421875, -0.06563758850097656, -0.056880950927734375, -0.04812431335449219, -0.03936767578125, -0.030611038208007812, -0.021854400634765625, -0.013097763061523438, -0.00434112548828125, 0.0044155120849609375, 0.013172149658203125, 0.021928787231445312, 0.0306854248046875, 0.03944206237792969, 0.048198699951171875, 0.05695533752441406, 0.06571197509765625, 0.07446861267089844, 0.08322525024414062, 0.09198188781738281, 0.100738525390625, 0.10949516296386719, 0.11825180053710938, 0.12700843811035156, 0.13576507568359375, 0.14452171325683594, 0.15327835083007812, 0.1620349884033203, 0.1707916259765625, 0.1795482635498047, 0.18830490112304688, 0.19706153869628906, 0.20581817626953125, 0.21457481384277344, 0.22333145141601562, 0.2320880889892578, 0.2408447265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 6.0, 11.0, 15.0, 17.0, 30.0, 42.0, 52.0, 109.0, 160.0, 283.0, 564.0, 1150.0, 2498.0, 5723.0, 13389.0, 35867.0, 119190.0, 369761.0, 341657.0, 103946.0, 31906.0, 12361.0, 5182.0, 2253.0, 1077.0, 522.0, 291.0, 175.0, 93.0, 61.0, 50.0, 26.0, 24.0, 19.0, 9.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56005859375, -0.541961669921875, -0.52386474609375, -0.505767822265625, -0.4876708984375, -0.469573974609375, -0.45147705078125, -0.433380126953125, -0.415283203125, -0.397186279296875, -0.37908935546875, -0.360992431640625, -0.3428955078125, -0.324798583984375, -0.30670166015625, -0.288604736328125, -0.2705078125, -0.252410888671875, -0.23431396484375, -0.216217041015625, -0.1981201171875, -0.180023193359375, -0.16192626953125, -0.143829345703125, -0.125732421875, -0.107635498046875, -0.08953857421875, -0.071441650390625, -0.0533447265625, -0.035247802734375, -0.01715087890625, 0.000946044921875, 0.01904296875, 0.037139892578125, 0.05523681640625, 0.073333740234375, 0.0914306640625, 0.109527587890625, 0.12762451171875, 0.145721435546875, 0.163818359375, 0.181915283203125, 0.20001220703125, 0.218109130859375, 0.2362060546875, 0.254302978515625, 0.27239990234375, 0.290496826171875, 0.30859375, 0.326690673828125, 0.34478759765625, 0.362884521484375, 0.3809814453125, 0.399078369140625, 0.41717529296875, 0.435272216796875, 0.453369140625, 0.471466064453125, 0.48956298828125, 0.507659912109375, 0.5257568359375, 0.543853759765625, 0.56195068359375, 0.580047607421875, 0.59814453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 17.0, 13.0, 16.0, 16.0, 25.0, 23.0, 29.0, 30.0, 33.0, 30.0, 49.0, 37.0, 44.0, 52.0, 30.0, 46.0, 44.0, 38.0, 42.0, 37.0, 28.0, 30.0, 34.0, 32.0, 21.0, 27.0, 24.0, 30.0, 18.0, 16.0, 14.0, 10.0, 7.0, 8.0, 6.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.84521484375, -0.8201141357421875, -0.795013427734375, -0.7699127197265625, -0.74481201171875, -0.7197113037109375, -0.694610595703125, -0.6695098876953125, -0.6444091796875, -0.6193084716796875, -0.594207763671875, -0.5691070556640625, -0.54400634765625, -0.5189056396484375, -0.493804931640625, -0.4687042236328125, -0.443603515625, -0.4185028076171875, -0.393402099609375, -0.3683013916015625, -0.34320068359375, -0.3180999755859375, -0.292999267578125, -0.2678985595703125, -0.2427978515625, -0.2176971435546875, -0.192596435546875, -0.1674957275390625, -0.14239501953125, -0.1172943115234375, -0.092193603515625, -0.0670928955078125, -0.0419921875, -0.0168914794921875, 0.008209228515625, 0.0333099365234375, 0.05841064453125, 0.0835113525390625, 0.108612060546875, 0.1337127685546875, 0.1588134765625, 0.1839141845703125, 0.209014892578125, 0.2341156005859375, 0.25921630859375, 0.2843170166015625, 0.309417724609375, 0.3345184326171875, 0.359619140625, 0.3847198486328125, 0.409820556640625, 0.4349212646484375, 0.46002197265625, 0.4851226806640625, 0.510223388671875, 0.5353240966796875, 0.5604248046875, 0.5855255126953125, 0.610626220703125, 0.6357269287109375, 0.66082763671875, 0.6859283447265625, 0.711029052734375, 0.7361297607421875, 0.76123046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 6.0, 14.0, 31.0, 28.0, 25.0, 49.0, 73.0, 95.0, 129.0, 167.0, 280.0, 352.0, 475.0, 705.0, 1058.0, 1538.0, 2536.0, 4797.0, 12578.0, 56408.0, 542132.0, 366295.0, 37994.0, 9815.0, 3959.0, 2173.0, 1483.0, 1003.0, 672.0, 455.0, 349.0, 228.0, 187.0, 121.0, 104.0, 60.0, 45.0, 32.0, 19.0, 20.0, 14.0, 11.0, 13.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3623046875, -0.3497657775878906, -0.33722686767578125, -0.3246879577636719, -0.3121490478515625, -0.2996101379394531, -0.28707122802734375, -0.2745323181152344, -0.261993408203125, -0.24945449829101562, -0.23691558837890625, -0.22437667846679688, -0.2118377685546875, -0.19929885864257812, -0.18675994873046875, -0.17422103881835938, -0.16168212890625, -0.14914321899414062, -0.13660430908203125, -0.12406539916992188, -0.1115264892578125, -0.09898757934570312, -0.08644866943359375, -0.07390975952148438, -0.061370849609375, -0.048831939697265625, -0.03629302978515625, -0.023754119873046875, -0.0112152099609375, 0.001323699951171875, 0.01386260986328125, 0.026401519775390625, 0.0389404296875, 0.051479339599609375, 0.06401824951171875, 0.07655715942382812, 0.0890960693359375, 0.10163497924804688, 0.11417388916015625, 0.12671279907226562, 0.139251708984375, 0.15179061889648438, 0.16432952880859375, 0.17686843872070312, 0.1894073486328125, 0.20194625854492188, 0.21448516845703125, 0.22702407836914062, 0.23956298828125, 0.2521018981933594, 0.26464080810546875, 0.2771797180175781, 0.2897186279296875, 0.3022575378417969, 0.31479644775390625, 0.3273353576660156, 0.339874267578125, 0.3524131774902344, 0.36495208740234375, 0.3774909973144531, 0.3900299072265625, 0.4025688171386719, 0.41510772705078125, 0.4276466369628906, 0.440185546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 10.0, 17.0, 55.0, 179.0, 340.0, 236.0, 80.0, 32.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019919872283935547, -0.00019289925694465637, -0.00018659979104995728, -0.00018030032515525818, -0.00017400085926055908, -0.00016770139336585999, -0.0001614019274711609, -0.0001551024615764618, -0.0001488029956817627, -0.0001425035297870636, -0.0001362040638923645, -0.0001299045979976654, -0.0001236051321029663, -0.00011730566620826721, -0.00011100620031356812, -0.00010470673441886902, -9.840726852416992e-05, -9.210780262947083e-05, -8.580833673477173e-05, -7.950887084007263e-05, -7.320940494537354e-05, -6.690993905067444e-05, -6.061047315597534e-05, -5.4311007261276245e-05, -4.801154136657715e-05, -4.171207547187805e-05, -3.5412609577178955e-05, -2.911314368247986e-05, -2.2813677787780762e-05, -1.6514211893081665e-05, -1.0214745998382568e-05, -3.915280103683472e-06, 2.384185791015625e-06, 8.683651685714722e-06, 1.4983117580413818e-05, 2.1282583475112915e-05, 2.7582049369812012e-05, 3.388151526451111e-05, 4.0180981159210205e-05, 4.64804470539093e-05, 5.27799129486084e-05, 5.9079378843307495e-05, 6.537884473800659e-05, 7.167831063270569e-05, 7.797777652740479e-05, 8.427724242210388e-05, 9.057670831680298e-05, 9.687617421150208e-05, 0.00010317564010620117, 0.00010947510600090027, 0.00011577457189559937, 0.00012207403779029846, 0.00012837350368499756, 0.00013467296957969666, 0.00014097243547439575, 0.00014727190136909485, 0.00015357136726379395, 0.00015987083315849304, 0.00016617029905319214, 0.00017246976494789124, 0.00017876923084259033, 0.00018506869673728943, 0.00019136816263198853, 0.00019766762852668762, 0.00020396709442138672]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 12.0, 14.0, 9.0, 21.0, 25.0, 41.0, 64.0, 132.0, 216.0, 321.0, 500.0, 832.0, 1457.0, 2904.0, 8540.0, 51444.0, 546223.0, 389462.0, 33754.0, 6634.0, 2590.0, 1284.0, 768.0, 475.0, 312.0, 179.0, 108.0, 62.0, 41.0, 28.0, 25.0, 14.0, 9.0, 10.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.451904296875, -0.43857574462890625, -0.4252471923828125, -0.41191864013671875, -0.398590087890625, -0.38526153564453125, -0.3719329833984375, -0.35860443115234375, -0.34527587890625, -0.33194732666015625, -0.3186187744140625, -0.30529022216796875, -0.291961669921875, -0.27863311767578125, -0.2653045654296875, -0.25197601318359375, -0.2386474609375, -0.22531890869140625, -0.2119903564453125, -0.19866180419921875, -0.185333251953125, -0.17200469970703125, -0.1586761474609375, -0.14534759521484375, -0.13201904296875, -0.11869049072265625, -0.1053619384765625, -0.09203338623046875, -0.078704833984375, -0.06537628173828125, -0.0520477294921875, -0.03871917724609375, -0.025390625, -0.01206207275390625, 0.0012664794921875, 0.01459503173828125, 0.027923583984375, 0.04125213623046875, 0.0545806884765625, 0.06790924072265625, 0.08123779296875, 0.09456634521484375, 0.1078948974609375, 0.12122344970703125, 0.134552001953125, 0.14788055419921875, 0.1612091064453125, 0.17453765869140625, 0.1878662109375, 0.20119476318359375, 0.2145233154296875, 0.22785186767578125, 0.241180419921875, 0.25450897216796875, 0.2678375244140625, 0.28116607666015625, 0.29449462890625, 0.30782318115234375, 0.3211517333984375, 0.33448028564453125, 0.347808837890625, 0.36113739013671875, 0.3744659423828125, 0.38779449462890625, 0.401123046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 12.0, 23.0, 33.0, 58.0, 95.0, 137.0, 161.0, 134.0, 112.0, 79.0, 49.0, 37.0, 15.0, 7.0, 12.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.35039520263671875, -0.3382415771484375, -0.32608795166015625, -0.313934326171875, -0.30178070068359375, -0.2896270751953125, -0.27747344970703125, -0.26531982421875, -0.25316619873046875, -0.2410125732421875, -0.22885894775390625, -0.216705322265625, -0.20455169677734375, -0.1923980712890625, -0.18024444580078125, -0.1680908203125, -0.15593719482421875, -0.1437835693359375, -0.13162994384765625, -0.119476318359375, -0.10732269287109375, -0.0951690673828125, -0.08301544189453125, -0.07086181640625, -0.05870819091796875, -0.0465545654296875, -0.03440093994140625, -0.022247314453125, -0.01009368896484375, 0.0020599365234375, 0.01421356201171875, 0.0263671875, 0.03852081298828125, 0.0506744384765625, 0.06282806396484375, 0.074981689453125, 0.08713531494140625, 0.0992889404296875, 0.11144256591796875, 0.12359619140625, 0.13574981689453125, 0.1479034423828125, 0.16005706787109375, 0.172210693359375, 0.18436431884765625, 0.1965179443359375, 0.20867156982421875, 0.2208251953125, 0.23297882080078125, 0.2451324462890625, 0.25728607177734375, 0.269439697265625, 0.28159332275390625, 0.2937469482421875, 0.30590057373046875, 0.31805419921875, 0.33020782470703125, 0.3423614501953125, 0.35451507568359375, 0.366668701171875, 0.37882232666015625, 0.3909759521484375, 0.40312957763671875, 0.415283203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 13.0, 23.0, 33.0, 64.0, 109.0, 189.0, 183.0, 165.0, 108.0, 49.0, 18.0, 10.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.606661319732666, -4.471972942352295, -4.337285041809082, -4.202596664428711, -4.06790828704834, -3.933220386505127, -3.798532009124756, -3.663843870162964, -3.529155731201172, -3.39446759223938, -3.259779453277588, -3.125091075897217, -2.990402936935425, -2.855714797973633, -2.7210264205932617, -2.5863382816314697, -2.4516501426696777, -2.3169620037078857, -2.1822738647460938, -2.0475854873657227, -1.9128973484039307, -1.7782092094421387, -1.6435209512710571, -1.5088326930999756, -1.3741445541381836, -1.2394564151763916, -1.10476815700531, -0.9700799584388733, -0.8353917598724365, -0.7007035613059998, -0.566015362739563, -0.4313271641731262, -0.29663896560668945, -0.16195076704025269, -0.027262568473815918, 0.10742563009262085, 0.24211382865905762, 0.3768020272254944, 0.5114902257919312, 0.6461784243583679, 0.7808666229248047, 0.9155548214912415, 1.0502430200576782, 1.1849312782287598, 1.3196194171905518, 1.4543075561523438, 1.5889958143234253, 1.7236840724945068, 1.8583722114562988, 1.9930603504180908, 2.127748489379883, 2.262436866760254, 2.397125005722046, 2.531813144683838, 2.666501522064209, 2.801189661026001, 2.935877799987793, 3.070565938949585, 3.205254077911377, 3.339942455291748, 3.47463059425354, 3.609318733215332, 3.744007110595703, 3.878695249557495, 4.013383388519287]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 8.0, 11.0, 11.0, 7.0, 11.0, 13.0, 22.0, 26.0, 31.0, 20.0, 36.0, 31.0, 47.0, 37.0, 44.0, 34.0, 38.0, 55.0, 36.0, 47.0, 38.0, 43.0, 29.0, 26.0, 42.0, 45.0, 26.0, 21.0, 24.0, 23.0, 22.0, 15.0, 11.0, 9.0, 12.0, 9.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7436070442199707, -1.6839699745178223, -1.6243329048156738, -1.5646958351135254, -1.505058765411377, -1.4454216957092285, -1.38578462600708, -1.3261475563049316, -1.2665104866027832, -1.2068734169006348, -1.1472363471984863, -1.087599277496338, -1.0279622077941895, -0.968325138092041, -0.9086880683898926, -0.8490509986877441, -0.7894139289855957, -0.7297768592834473, -0.6701397895812988, -0.6105027198791504, -0.550865650177002, -0.4912285804748535, -0.4315915107727051, -0.37195444107055664, -0.3123173713684082, -0.25268030166625977, -0.19304323196411133, -0.1334061622619629, -0.07376909255981445, -0.014132022857666016, 0.04550504684448242, 0.10514211654663086, 0.1647791862487793, 0.22441625595092773, 0.28405332565307617, 0.3436903953552246, 0.40332746505737305, 0.4629645347595215, 0.5226016044616699, 0.5822386741638184, 0.6418757438659668, 0.7015128135681152, 0.7611498832702637, 0.8207869529724121, 0.8804240226745605, 0.940061092376709, 0.9996981620788574, 1.0593352317810059, 1.1189723014831543, 1.1786093711853027, 1.2382464408874512, 1.2978835105895996, 1.357520580291748, 1.4171576499938965, 1.476794719696045, 1.5364317893981934, 1.5960688591003418, 1.6557059288024902, 1.7153429985046387, 1.774980068206787, 1.8346171379089355, 1.894254207611084, 1.9538912773132324, 2.013528347015381, 2.0731654167175293]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 10.0, 16.0, 25.0, 49.0, 55.0, 81.0, 155.0, 253.0, 526.0, 1081.0, 1894.0, 4577.0, 12181.0, 38790.0, 145263.0, 516107.0, 1249145.0, 1348953.0, 622566.0, 180862.0, 47329.0, 14361.0, 5205.0, 2215.0, 1091.0, 591.0, 320.0, 192.0, 120.0, 68.0, 53.0, 33.0, 24.0, 28.0, 12.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.38037109375, -0.36920928955078125, -0.3580474853515625, -0.34688568115234375, -0.335723876953125, -0.32456207275390625, -0.3134002685546875, -0.30223846435546875, -0.29107666015625, -0.27991485595703125, -0.2687530517578125, -0.25759124755859375, -0.246429443359375, -0.23526763916015625, -0.2241058349609375, -0.21294403076171875, -0.2017822265625, -0.19062042236328125, -0.1794586181640625, -0.16829681396484375, -0.157135009765625, -0.14597320556640625, -0.1348114013671875, -0.12364959716796875, -0.11248779296875, -0.10132598876953125, -0.0901641845703125, -0.07900238037109375, -0.067840576171875, -0.05667877197265625, -0.0455169677734375, -0.03435516357421875, -0.023193359375, -0.01203155517578125, -0.0008697509765625, 0.01029205322265625, 0.021453857421875, 0.03261566162109375, 0.0437774658203125, 0.05493927001953125, 0.06610107421875, 0.07726287841796875, 0.0884246826171875, 0.09958648681640625, 0.110748291015625, 0.12191009521484375, 0.1330718994140625, 0.14423370361328125, 0.1553955078125, 0.16655731201171875, 0.1777191162109375, 0.18888092041015625, 0.200042724609375, 0.21120452880859375, 0.2223663330078125, 0.23352813720703125, 0.24468994140625, 0.25585174560546875, 0.2670135498046875, 0.27817535400390625, 0.289337158203125, 0.30049896240234375, 0.3116607666015625, 0.32282257080078125, 0.333984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 17.0, 17.0, 22.0, 23.0, 38.0, 38.0, 45.0, 54.0, 51.0, 66.0, 75.0, 62.0, 69.0, 58.0, 66.0, 59.0, 54.0, 39.0, 40.0, 27.0, 16.0, 21.0, 10.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.40325164794921875, -0.3875579833984375, -0.37186431884765625, -0.356170654296875, -0.34047698974609375, -0.3247833251953125, -0.30908966064453125, -0.29339599609375, -0.27770233154296875, -0.2620086669921875, -0.24631500244140625, -0.230621337890625, -0.21492767333984375, -0.1992340087890625, -0.18354034423828125, -0.1678466796875, -0.15215301513671875, -0.1364593505859375, -0.12076568603515625, -0.105072021484375, -0.08937835693359375, -0.0736846923828125, -0.05799102783203125, -0.04229736328125, -0.02660369873046875, -0.0109100341796875, 0.00478363037109375, 0.020477294921875, 0.03617095947265625, 0.0518646240234375, 0.06755828857421875, 0.083251953125, 0.09894561767578125, 0.1146392822265625, 0.13033294677734375, 0.146026611328125, 0.16172027587890625, 0.1774139404296875, 0.19310760498046875, 0.20880126953125, 0.22449493408203125, 0.2401885986328125, 0.25588226318359375, 0.271575927734375, 0.28726959228515625, 0.3029632568359375, 0.31865692138671875, 0.3343505859375, 0.35004425048828125, 0.3657379150390625, 0.38143157958984375, 0.397125244140625, 0.41281890869140625, 0.4285125732421875, 0.44420623779296875, 0.45989990234375, 0.47559356689453125, 0.4912872314453125, 0.5069808959960938, 0.522674560546875, 0.5383682250976562, 0.5540618896484375, 0.5697555541992188, 0.58544921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 15.0, 21.0, 31.0, 48.0, 75.0, 120.0, 208.0, 314.0, 656.0, 1429.0, 3989.0, 13795.0, 66542.0, 514598.0, 2702598.0, 772274.0, 92018.0, 17462.0, 4808.0, 1667.0, 692.0, 369.0, 212.0, 122.0, 71.0, 37.0, 26.0, 16.0, 18.0, 11.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5268020629882812, -0.5077056884765625, -0.48860931396484375, -0.469512939453125, -0.45041656494140625, -0.4313201904296875, -0.41222381591796875, -0.39312744140625, -0.37403106689453125, -0.3549346923828125, -0.33583831787109375, -0.316741943359375, -0.29764556884765625, -0.2785491943359375, -0.25945281982421875, -0.2403564453125, -0.22126007080078125, -0.2021636962890625, -0.18306732177734375, -0.163970947265625, -0.14487457275390625, -0.1257781982421875, -0.10668182373046875, -0.08758544921875, -0.06848907470703125, -0.0493927001953125, -0.03029632568359375, -0.011199951171875, 0.00789642333984375, 0.0269927978515625, 0.04608917236328125, 0.065185546875, 0.08428192138671875, 0.1033782958984375, 0.12247467041015625, 0.141571044921875, 0.16066741943359375, 0.1797637939453125, 0.19886016845703125, 0.21795654296875, 0.23705291748046875, 0.2561492919921875, 0.27524566650390625, 0.294342041015625, 0.31343841552734375, 0.3325347900390625, 0.35163116455078125, 0.3707275390625, 0.38982391357421875, 0.4089202880859375, 0.42801666259765625, 0.447113037109375, 0.46620941162109375, 0.4853057861328125, 0.5044021606445312, 0.52349853515625, 0.5425949096679688, 0.5616912841796875, 0.5807876586914062, 0.599884033203125, 0.6189804077148438, 0.6380767822265625, 0.6571731567382812, 0.67626953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 18.0, 17.0, 29.0, 51.0, 78.0, 140.0, 228.0, 381.0, 529.0, 666.0, 677.0, 458.0, 297.0, 185.0, 101.0, 69.0, 43.0, 37.0, 12.0, 10.0, 11.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5023651123046875, -0.480316162109375, -0.4582672119140625, -0.43621826171875, -0.4141693115234375, -0.392120361328125, -0.3700714111328125, -0.3480224609375, -0.3259735107421875, -0.303924560546875, -0.2818756103515625, -0.25982666015625, -0.2377777099609375, -0.215728759765625, -0.1936798095703125, -0.171630859375, -0.1495819091796875, -0.127532958984375, -0.1054840087890625, -0.08343505859375, -0.0613861083984375, -0.039337158203125, -0.0172882080078125, 0.0047607421875, 0.0268096923828125, 0.048858642578125, 0.0709075927734375, 0.09295654296875, 0.1150054931640625, 0.137054443359375, 0.1591033935546875, 0.18115234375, 0.2032012939453125, 0.225250244140625, 0.2472991943359375, 0.26934814453125, 0.2913970947265625, 0.313446044921875, 0.3354949951171875, 0.3575439453125, 0.3795928955078125, 0.401641845703125, 0.4236907958984375, 0.44573974609375, 0.4677886962890625, 0.489837646484375, 0.5118865966796875, 0.533935546875, 0.5559844970703125, 0.578033447265625, 0.6000823974609375, 0.62213134765625, 0.6441802978515625, 0.666229248046875, 0.6882781982421875, 0.7103271484375, 0.7323760986328125, 0.754425048828125, 0.7764739990234375, 0.79852294921875, 0.8205718994140625, 0.842620849609375, 0.8646697998046875, 0.88671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 11.0, 15.0, 30.0, 48.0, 97.0, 121.0, 160.0, 149.0, 133.0, 98.0, 48.0, 41.0, 17.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220745086669922, -3.1059622764587402, -2.9911797046661377, -2.876397132873535, -2.7616143226623535, -2.646831512451172, -2.5320489406585693, -2.417266368865967, -2.302483558654785, -2.1877007484436035, -2.072918176651001, -1.9581354856491089, -1.8433527946472168, -1.7285701036453247, -1.6137874126434326, -1.4990047216415405, -1.3842220306396484, -1.2694393396377563, -1.1546566486358643, -1.0398739576339722, -0.9250912666320801, -0.810308575630188, -0.6955258846282959, -0.5807431936264038, -0.4659605026245117, -0.35117781162261963, -0.23639512062072754, -0.12161242961883545, -0.006829738616943359, 0.10795295238494873, 0.22273564338684082, 0.3375183343887329, 0.452301025390625, 0.5670837163925171, 0.6818664073944092, 0.7966490983963013, 0.9114317893981934, 1.0262144804000854, 1.1409971714019775, 1.2557798624038696, 1.3705625534057617, 1.4853452444076538, 1.600127935409546, 1.714910626411438, 1.82969331741333, 1.9444760084152222, 2.0592586994171143, 2.174041271209717, 2.2888240814208984, 2.40360689163208, 2.5183894634246826, 2.633172035217285, 2.747954845428467, 2.8627376556396484, 2.977520227432251, 3.0923027992248535, 3.207085609436035, 3.321868419647217, 3.4366509914398193, 3.551433563232422, 3.6662163734436035, 3.780999183654785, 3.8957817554473877, 4.01056432723999, 4.125347137451172]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 2.0, 8.0, 8.0, 6.0, 10.0, 12.0, 23.0, 22.0, 17.0, 25.0, 25.0, 21.0, 32.0, 23.0, 26.0, 36.0, 39.0, 38.0, 46.0, 44.0, 47.0, 42.0, 38.0, 45.0, 26.0, 31.0, 34.0, 28.0, 19.0, 23.0, 27.0, 16.0, 21.0, 22.0, 21.0, 12.0, 16.0, 7.0, 8.0, 8.0, 3.0, 8.0, 6.0, 5.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.375675082206726, -1.3328278064727783, -1.2899805307388306, -1.2471332550048828, -1.2042860984802246, -1.1614388227462769, -1.118591547012329, -1.0757442712783813, -1.0328969955444336, -0.9900497198104858, -0.9472024440765381, -0.9043552279472351, -0.8615079522132874, -0.8186606764793396, -0.7758134603500366, -0.7329661846160889, -0.6901189088821411, -0.6472716331481934, -0.6044243574142456, -0.5615771412849426, -0.5187298655509949, -0.4758825898170471, -0.43303534388542175, -0.3901880979537964, -0.34734082221984863, -0.3044935464859009, -0.2616463005542755, -0.21879903972148895, -0.1759517788887024, -0.13310451805591583, -0.09025725722312927, -0.047410011291503906, -0.004562854766845703, 0.03828440606594086, 0.08113166689872742, 0.12397892773151398, 0.16682618856430054, 0.2096734493970871, 0.25252071022987366, 0.295367956161499, 0.3382152318954468, 0.38106250762939453, 0.4239097535610199, 0.46675699949264526, 0.509604275226593, 0.5524515509605408, 0.5952987670898438, 0.6381460428237915, 0.6809933185577393, 0.723840594291687, 0.7666878700256348, 0.8095350861549377, 0.8523823618888855, 0.8952296376228333, 0.9380768537521362, 0.980924129486084, 1.0237714052200317, 1.0666186809539795, 1.1094659566879272, 1.152313232421875, 1.1951603889465332, 1.238007664680481, 1.2808549404144287, 1.3237022161483765, 1.3665494918823242]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 11.0, 7.0, 12.0, 32.0, 35.0, 59.0, 132.0, 273.0, 515.0, 1057.0, 2520.0, 6358.0, 21625.0, 132842.0, 564253.0, 265039.0, 38223.0, 9302.0, 3436.0, 1434.0, 659.0, 302.0, 193.0, 91.0, 52.0, 22.0, 22.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.9658203125, -0.9408493041992188, -0.9158782958984375, -0.8909072875976562, -0.865936279296875, -0.8409652709960938, -0.8159942626953125, -0.7910232543945312, -0.76605224609375, -0.7410812377929688, -0.7161102294921875, -0.6911392211914062, -0.666168212890625, -0.6411972045898438, -0.6162261962890625, -0.5912551879882812, -0.5662841796875, -0.5413131713867188, -0.5163421630859375, -0.49137115478515625, -0.466400146484375, -0.44142913818359375, -0.4164581298828125, -0.39148712158203125, -0.36651611328125, -0.34154510498046875, -0.3165740966796875, -0.29160308837890625, -0.266632080078125, -0.24166107177734375, -0.2166900634765625, -0.19171905517578125, -0.166748046875, -0.14177703857421875, -0.1168060302734375, -0.09183502197265625, -0.066864013671875, -0.04189300537109375, -0.0169219970703125, 0.00804901123046875, 0.03302001953125, 0.05799102783203125, 0.0829620361328125, 0.10793304443359375, 0.132904052734375, 0.15787506103515625, 0.1828460693359375, 0.20781707763671875, 0.2327880859375, 0.25775909423828125, 0.2827301025390625, 0.30770111083984375, 0.332672119140625, 0.35764312744140625, 0.3826141357421875, 0.40758514404296875, 0.43255615234375, 0.45752716064453125, 0.4824981689453125, 0.5074691772460938, 0.532440185546875, 0.5574111938476562, 0.5823822021484375, 0.6073532104492188, 0.63232421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 11.0, 7.0, 11.0, 18.0, 11.0, 18.0, 22.0, 20.0, 22.0, 34.0, 35.0, 50.0, 62.0, 45.0, 44.0, 45.0, 58.0, 57.0, 44.0, 60.0, 48.0, 31.0, 40.0, 22.0, 21.0, 26.0, 29.0, 20.0, 15.0, 19.0, 17.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40459442138671875, -0.3921966552734375, -0.37979888916015625, -0.367401123046875, -0.35500335693359375, -0.3426055908203125, -0.33020782470703125, -0.31781005859375, -0.30541229248046875, -0.2930145263671875, -0.28061676025390625, -0.268218994140625, -0.25582122802734375, -0.2434234619140625, -0.23102569580078125, -0.2186279296875, -0.20623016357421875, -0.1938323974609375, -0.18143463134765625, -0.169036865234375, -0.15663909912109375, -0.1442413330078125, -0.13184356689453125, -0.11944580078125, -0.10704803466796875, -0.0946502685546875, -0.08225250244140625, -0.069854736328125, -0.05745697021484375, -0.0450592041015625, -0.03266143798828125, -0.020263671875, -0.00786590576171875, 0.0045318603515625, 0.01692962646484375, 0.029327392578125, 0.04172515869140625, 0.0541229248046875, 0.06652069091796875, 0.07891845703125, 0.09131622314453125, 0.1037139892578125, 0.11611175537109375, 0.128509521484375, 0.14090728759765625, 0.1533050537109375, 0.16570281982421875, 0.1781005859375, 0.19049835205078125, 0.2028961181640625, 0.21529388427734375, 0.227691650390625, 0.24008941650390625, 0.2524871826171875, 0.26488494873046875, 0.27728271484375, 0.28968048095703125, 0.3020782470703125, 0.31447601318359375, 0.326873779296875, 0.33927154541015625, 0.3516693115234375, 0.36406707763671875, 0.37646484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 15.0, 30.0, 30.0, 39.0, 65.0, 111.0, 203.0, 344.0, 640.0, 1248.0, 2473.0, 4750.0, 10224.0, 23227.0, 65226.0, 202243.0, 372765.0, 236605.0, 78691.0, 26925.0, 11401.0, 5500.0, 2742.0, 1376.0, 721.0, 393.0, 220.0, 120.0, 66.0, 54.0, 22.0, 19.0, 13.0, 7.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487548828125, -0.47303009033203125, -0.4585113525390625, -0.44399261474609375, -0.429473876953125, -0.41495513916015625, -0.4004364013671875, -0.38591766357421875, -0.37139892578125, -0.35688018798828125, -0.3423614501953125, -0.32784271240234375, -0.313323974609375, -0.29880523681640625, -0.2842864990234375, -0.26976776123046875, -0.2552490234375, -0.24073028564453125, -0.2262115478515625, -0.21169281005859375, -0.197174072265625, -0.18265533447265625, -0.1681365966796875, -0.15361785888671875, -0.13909912109375, -0.12458038330078125, -0.1100616455078125, -0.09554290771484375, -0.081024169921875, -0.06650543212890625, -0.0519866943359375, -0.03746795654296875, -0.02294921875, -0.00843048095703125, 0.0060882568359375, 0.02060699462890625, 0.035125732421875, 0.04964447021484375, 0.0641632080078125, 0.07868194580078125, 0.09320068359375, 0.10771942138671875, 0.1222381591796875, 0.13675689697265625, 0.151275634765625, 0.16579437255859375, 0.1803131103515625, 0.19483184814453125, 0.2093505859375, 0.22386932373046875, 0.2383880615234375, 0.25290679931640625, 0.267425537109375, 0.28194427490234375, 0.2964630126953125, 0.31098175048828125, 0.32550048828125, 0.34001922607421875, 0.3545379638671875, 0.36905670166015625, 0.383575439453125, 0.39809417724609375, 0.4126129150390625, 0.42713165283203125, 0.441650390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 4.0, 11.0, 8.0, 7.0, 8.0, 9.0, 28.0, 22.0, 12.0, 19.0, 33.0, 41.0, 40.0, 37.0, 38.0, 50.0, 54.0, 56.0, 39.0, 48.0, 48.0, 37.0, 42.0, 51.0, 42.0, 40.0, 35.0, 23.0, 22.0, 16.0, 11.0, 11.0, 8.0, 8.0, 6.0, 8.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1070938110351562, -1.0764923095703125, -1.0458908081054688, -1.015289306640625, -0.9846878051757812, -0.9540863037109375, -0.9234848022460938, -0.89288330078125, -0.8622817993164062, -0.8316802978515625, -0.8010787963867188, -0.770477294921875, -0.7398757934570312, -0.7092742919921875, -0.6786727905273438, -0.6480712890625, -0.6174697875976562, -0.5868682861328125, -0.5562667846679688, -0.525665283203125, -0.49506378173828125, -0.4644622802734375, -0.43386077880859375, -0.40325927734375, -0.37265777587890625, -0.3420562744140625, -0.31145477294921875, -0.280853271484375, -0.25025177001953125, -0.2196502685546875, -0.18904876708984375, -0.158447265625, -0.12784576416015625, -0.0972442626953125, -0.06664276123046875, -0.036041259765625, -0.00543975830078125, 0.0251617431640625, 0.05576324462890625, 0.08636474609375, 0.11696624755859375, 0.1475677490234375, 0.17816925048828125, 0.208770751953125, 0.23937225341796875, 0.2699737548828125, 0.30057525634765625, 0.3311767578125, 0.36177825927734375, 0.3923797607421875, 0.42298126220703125, 0.453582763671875, 0.48418426513671875, 0.5147857666015625, 0.5453872680664062, 0.57598876953125, 0.6065902709960938, 0.6371917724609375, 0.6677932739257812, 0.698394775390625, 0.7289962768554688, 0.7595977783203125, 0.7901992797851562, 0.82080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 13.0, 25.0, 39.0, 52.0, 71.0, 102.0, 167.0, 223.0, 378.0, 659.0, 1249.0, 2496.0, 5470.0, 14311.0, 51543.0, 329269.0, 516159.0, 91097.0, 20865.0, 7466.0, 3225.0, 1571.0, 813.0, 458.0, 291.0, 176.0, 112.0, 72.0, 52.0, 38.0, 27.0, 12.0, 14.0, 13.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22731399536132812, -0.21952056884765625, -0.21172714233398438, -0.2039337158203125, -0.19614028930664062, -0.18834686279296875, -0.18055343627929688, -0.172760009765625, -0.16496658325195312, -0.15717315673828125, -0.14937973022460938, -0.1415863037109375, -0.13379287719726562, -0.12599945068359375, -0.11820602416992188, -0.11041259765625, -0.10261917114257812, -0.09482574462890625, -0.08703231811523438, -0.0792388916015625, -0.07144546508789062, -0.06365203857421875, -0.055858612060546875, -0.048065185546875, -0.040271759033203125, -0.03247833251953125, -0.024684906005859375, -0.0168914794921875, -0.009098052978515625, -0.00130462646484375, 0.006488800048828125, 0.0142822265625, 0.022075653076171875, 0.02986907958984375, 0.037662506103515625, 0.0454559326171875, 0.053249359130859375, 0.06104278564453125, 0.06883621215820312, 0.076629638671875, 0.08442306518554688, 0.09221649169921875, 0.10000991821289062, 0.1078033447265625, 0.11559677124023438, 0.12339019775390625, 0.13118362426757812, 0.13897705078125, 0.14677047729492188, 0.15456390380859375, 0.16235733032226562, 0.1701507568359375, 0.17794418334960938, 0.18573760986328125, 0.19353103637695312, 0.201324462890625, 0.20911788940429688, 0.21691131591796875, 0.22470474243164062, 0.2324981689453125, 0.24029159545898438, 0.24808502197265625, 0.2558784484863281, 0.263671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 7.0, 11.0, 10.0, 7.0, 21.0, 39.0, 76.0, 162.0, 212.0, 199.0, 122.0, 62.0, 17.0, 20.0, 9.0, 11.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.666515350341797e-05, -8.302740752696991e-05, -7.938966155052185e-05, -7.575191557407379e-05, -7.211416959762573e-05, -6.847642362117767e-05, -6.483867764472961e-05, -6.120093166828156e-05, -5.7563185691833496e-05, -5.392543971538544e-05, -5.028769373893738e-05, -4.664994776248932e-05, -4.301220178604126e-05, -3.93744558095932e-05, -3.573670983314514e-05, -3.209896385669708e-05, -2.8461217880249023e-05, -2.4823471903800964e-05, -2.1185725927352905e-05, -1.7547979950904846e-05, -1.3910233974456787e-05, -1.0272487998008728e-05, -6.634742021560669e-06, -2.99699604511261e-06, 6.407499313354492e-07, 4.278495907783508e-06, 7.916241884231567e-06, 1.1553987860679626e-05, 1.5191733837127686e-05, 1.8829479813575745e-05, 2.2467225790023804e-05, 2.6104971766471863e-05, 2.9742717742919922e-05, 3.338046371936798e-05, 3.701820969581604e-05, 4.06559556722641e-05, 4.429370164871216e-05, 4.793144762516022e-05, 5.1569193601608276e-05, 5.5206939578056335e-05, 5.8844685554504395e-05, 6.248243153095245e-05, 6.612017750740051e-05, 6.975792348384857e-05, 7.339566946029663e-05, 7.703341543674469e-05, 8.067116141319275e-05, 8.430890738964081e-05, 8.794665336608887e-05, 9.158439934253693e-05, 9.522214531898499e-05, 9.885989129543304e-05, 0.0001024976372718811, 0.00010613538324832916, 0.00010977312922477722, 0.00011341087520122528, 0.00011704862117767334, 0.0001206863671541214, 0.00012432411313056946, 0.00012796185910701752, 0.00013159960508346558, 0.00013523735105991364, 0.0001388750970363617, 0.00014251284301280975, 0.0001461505889892578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 18.0, 21.0, 37.0, 68.0, 119.0, 199.0, 409.0, 692.0, 1479.0, 4079.0, 12482.0, 50392.0, 255613.0, 516361.0, 159643.0, 32646.0, 8864.0, 3059.0, 1106.0, 558.0, 251.0, 151.0, 102.0, 64.0, 55.0, 23.0, 17.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.26318359375, -0.2561378479003906, -0.24909210205078125, -0.24204635620117188, -0.2350006103515625, -0.22795486450195312, -0.22090911865234375, -0.21386337280273438, -0.206817626953125, -0.19977188110351562, -0.19272613525390625, -0.18568038940429688, -0.1786346435546875, -0.17158889770507812, -0.16454315185546875, -0.15749740600585938, -0.15045166015625, -0.14340591430664062, -0.13636016845703125, -0.12931442260742188, -0.1222686767578125, -0.11522293090820312, -0.10817718505859375, -0.10113143920898438, -0.094085693359375, -0.08703994750976562, -0.07999420166015625, -0.07294845581054688, -0.0659027099609375, -0.058856964111328125, -0.05181121826171875, -0.044765472412109375, -0.0377197265625, -0.030673980712890625, -0.02362823486328125, -0.016582489013671875, -0.0095367431640625, -0.002490997314453125, 0.00455474853515625, 0.011600494384765625, 0.018646240234375, 0.025691986083984375, 0.03273773193359375, 0.039783477783203125, 0.0468292236328125, 0.053874969482421875, 0.06092071533203125, 0.06796646118164062, 0.07501220703125, 0.08205795288085938, 0.08910369873046875, 0.09614944458007812, 0.1031951904296875, 0.11024093627929688, 0.11728668212890625, 0.12433242797851562, 0.131378173828125, 0.13842391967773438, 0.14546966552734375, 0.15251541137695312, 0.1595611572265625, 0.16660690307617188, 0.17365264892578125, 0.18069839477539062, 0.187744140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 11.0, 7.0, 13.0, 11.0, 16.0, 19.0, 42.0, 48.0, 78.0, 96.0, 97.0, 96.0, 93.0, 84.0, 64.0, 49.0, 48.0, 26.0, 25.0, 11.0, 21.0, 9.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.1699981689453125, -0.162994384765625, -0.1559906005859375, -0.14898681640625, -0.1419830322265625, -0.134979248046875, -0.1279754638671875, -0.1209716796875, -0.1139678955078125, -0.106964111328125, -0.0999603271484375, -0.09295654296875, -0.0859527587890625, -0.078948974609375, -0.0719451904296875, -0.06494140625, -0.0579376220703125, -0.050933837890625, -0.0439300537109375, -0.03692626953125, -0.0299224853515625, -0.022918701171875, -0.0159149169921875, -0.0089111328125, -0.0019073486328125, 0.005096435546875, 0.0121002197265625, 0.01910400390625, 0.0261077880859375, 0.033111572265625, 0.0401153564453125, 0.047119140625, 0.0541229248046875, 0.061126708984375, 0.0681304931640625, 0.07513427734375, 0.0821380615234375, 0.089141845703125, 0.0961456298828125, 0.1031494140625, 0.1101531982421875, 0.117156982421875, 0.1241607666015625, 0.13116455078125, 0.1381683349609375, 0.145172119140625, 0.1521759033203125, 0.1591796875, 0.1661834716796875, 0.173187255859375, 0.1801910400390625, 0.18719482421875, 0.1941986083984375, 0.201202392578125, 0.2082061767578125, 0.2152099609375, 0.2222137451171875, 0.229217529296875, 0.2362213134765625, 0.24322509765625, 0.2502288818359375, 0.257232666015625, 0.2642364501953125, 0.271240234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 10.0, 12.0, 15.0, 37.0, 63.0, 91.0, 120.0, 182.0, 143.0, 114.0, 74.0, 49.0, 34.0, 14.0, 13.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.7111592292785645, -2.613602876663208, -2.5160465240478516, -2.418490171432495, -2.3209338188171387, -2.2233774662017822, -2.125821113586426, -2.0282645225524902, -1.9307082891464233, -1.833151936531067, -1.7355955839157104, -1.6380391120910645, -1.540482759475708, -1.4429264068603516, -1.3453700542449951, -1.2478137016296387, -1.1502573490142822, -1.0527009963989258, -0.9551446437835693, -0.8575882315635681, -0.7600318789482117, -0.6624755263328552, -0.564919114112854, -0.46736276149749756, -0.3698064088821411, -0.27225005626678467, -0.17469367384910583, -0.077137291431427, 0.020419061183929443, 0.11797541379928589, 0.2155318260192871, 0.31308817863464355, 0.4106447696685791, 0.5082011222839355, 0.605757474899292, 0.7033138871192932, 0.8008702397346497, 0.8984265923500061, 0.9959830045700073, 1.0935393571853638, 1.1910957098007202, 1.2886520624160767, 1.386208415031433, 1.483764886856079, 1.5813212394714355, 1.678877592086792, 1.7764339447021484, 1.8739902973175049, 1.9715466499328613, 2.0691030025482178, 2.166659355163574, 2.2642157077789307, 2.361772060394287, 2.4593284130096436, 2.556884765625, 2.6544413566589355, 2.751997470855713, 2.8495538234710693, 2.947110176086426, 3.0446665287017822, 3.1422228813171387, 3.239779233932495, 3.3373355865478516, 3.434892177581787, 3.5324485301971436]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 5.0, 4.0, 6.0, 10.0, 15.0, 23.0, 15.0, 26.0, 30.0, 28.0, 40.0, 38.0, 39.0, 39.0, 40.0, 37.0, 44.0, 47.0, 51.0, 42.0, 33.0, 35.0, 36.0, 35.0, 40.0, 28.0, 28.0, 22.0, 30.0, 22.0, 11.0, 18.0, 17.0, 10.0, 10.0, 5.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.0485012531280518, -1.9815906286239624, -1.9146798849105835, -1.8477692604064941, -1.7808585166931152, -1.7139478921890259, -1.6470372676849365, -1.5801265239715576, -1.5132158994674683, -1.446305274963379, -1.37939453125, -1.3124839067459106, -1.2455732822418213, -1.1786625385284424, -1.111751914024353, -1.0448412895202637, -0.9779305458068848, -0.9110198616981506, -0.8441091775894165, -0.7771985530853271, -0.710287868976593, -0.6433771848678589, -0.5764665603637695, -0.5095558762550354, -0.44264519214630127, -0.37573450803756714, -0.3088238537311554, -0.24191318452358246, -0.17500251531600952, -0.10809183120727539, -0.04118117690086365, 0.025729477405548096, 0.09263992309570312, 0.15955059230327606, 0.226461261510849, 0.29337191581726074, 0.3602825999259949, 0.427193284034729, 0.49410393834114075, 0.5610145926475525, 0.6279252767562866, 0.6948359608650208, 0.7617466449737549, 0.8286572694778442, 0.8955679535865784, 0.9624786376953125, 1.0293892621994019, 1.0962998867034912, 1.1632106304168701, 1.2301212549209595, 1.2970319986343384, 1.3639426231384277, 1.4308533668518066, 1.497763991355896, 1.5646746158599854, 1.6315853595733643, 1.6984959840774536, 1.765406608581543, 1.8323173522949219, 1.8992279767990112, 1.9661386013031006, 2.0330493450164795, 2.0999600887298584, 2.166870594024658, 2.233781337738037]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 16.0, 16.0, 28.0, 39.0, 49.0, 101.0, 170.0, 373.0, 668.0, 1568.0, 4284.0, 14246.0, 57224.0, 238484.0, 810297.0, 1550324.0, 1056930.0, 346999.0, 82698.0, 19501.0, 5913.0, 2239.0, 976.0, 456.0, 235.0, 150.0, 88.0, 65.0, 43.0, 31.0, 22.0, 12.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.48779296875, -0.4757881164550781, -0.46378326416015625, -0.4517784118652344, -0.4397735595703125, -0.4277687072753906, -0.41576385498046875, -0.4037590026855469, -0.391754150390625, -0.3797492980957031, -0.36774444580078125, -0.3557395935058594, -0.3437347412109375, -0.3317298889160156, -0.31972503662109375, -0.3077201843261719, -0.29571533203125, -0.2837104797363281, -0.27170562744140625, -0.2597007751464844, -0.2476959228515625, -0.23569107055664062, -0.22368621826171875, -0.21168136596679688, -0.199676513671875, -0.18767166137695312, -0.17566680908203125, -0.16366195678710938, -0.1516571044921875, -0.13965225219726562, -0.12764739990234375, -0.11564254760742188, -0.1036376953125, -0.09163284301757812, -0.07962799072265625, -0.06762313842773438, -0.0556182861328125, -0.043613433837890625, -0.03160858154296875, -0.019603729248046875, -0.007598876953125, 0.004405975341796875, 0.01641082763671875, 0.028415679931640625, 0.0404205322265625, 0.052425384521484375, 0.06443023681640625, 0.07643508911132812, 0.08843994140625, 0.10044479370117188, 0.11244964599609375, 0.12445449829101562, 0.1364593505859375, 0.14846420288085938, 0.16046905517578125, 0.17247390747070312, 0.184478759765625, 0.19648361206054688, 0.20848846435546875, 0.22049331665039062, 0.2324981689453125, 0.24450302124023438, 0.25650787353515625, 0.2685127258300781, 0.280517578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 9.0, 3.0, 7.0, 7.0, 11.0, 11.0, 22.0, 13.0, 19.0, 19.0, 27.0, 28.0, 39.0, 36.0, 38.0, 36.0, 52.0, 46.0, 47.0, 45.0, 51.0, 47.0, 40.0, 41.0, 41.0, 38.0, 28.0, 23.0, 41.0, 19.0, 22.0, 19.0, 13.0, 12.0, 13.0, 6.0, 9.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.394775390625, -0.384033203125, -0.373291015625, -0.362548828125, -0.351806640625, -0.341064453125, -0.330322265625, -0.319580078125, -0.308837890625, -0.298095703125, -0.287353515625, -0.276611328125, -0.265869140625, -0.255126953125, -0.244384765625, -0.233642578125, -0.222900390625, -0.212158203125, -0.201416015625, -0.190673828125, -0.179931640625, -0.169189453125, -0.158447265625, -0.147705078125, -0.136962890625, -0.126220703125, -0.115478515625, -0.104736328125, -0.093994140625, -0.083251953125, -0.072509765625, -0.061767578125, -0.051025390625, -0.040283203125, -0.029541015625, -0.018798828125, -0.008056640625, 0.002685546875, 0.013427734375, 0.024169921875, 0.034912109375, 0.045654296875, 0.056396484375, 0.067138671875, 0.077880859375, 0.088623046875, 0.099365234375, 0.110107421875, 0.120849609375, 0.131591796875, 0.142333984375, 0.153076171875, 0.163818359375, 0.174560546875, 0.185302734375, 0.196044921875, 0.206787109375, 0.217529296875, 0.228271484375, 0.239013671875, 0.249755859375, 0.260498046875, 0.271240234375, 0.281982421875, 0.292724609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 3.0, 14.0, 22.0, 30.0, 41.0, 63.0, 96.0, 173.0, 285.0, 461.0, 912.0, 1666.0, 3554.0, 8600.0, 26704.0, 124287.0, 948767.0, 2511069.0, 464978.0, 72250.0, 18226.0, 6205.0, 2754.0, 1373.0, 728.0, 408.0, 224.0, 156.0, 74.0, 48.0, 42.0, 28.0, 7.0, 10.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55615234375, -0.5404129028320312, -0.5246734619140625, -0.5089340209960938, -0.493194580078125, -0.47745513916015625, -0.4617156982421875, -0.44597625732421875, -0.43023681640625, -0.41449737548828125, -0.3987579345703125, -0.38301849365234375, -0.367279052734375, -0.35153961181640625, -0.3358001708984375, -0.32006072998046875, -0.3043212890625, -0.28858184814453125, -0.2728424072265625, -0.25710296630859375, -0.241363525390625, -0.22562408447265625, -0.2098846435546875, -0.19414520263671875, -0.17840576171875, -0.16266632080078125, -0.1469268798828125, -0.13118743896484375, -0.115447998046875, -0.09970855712890625, -0.0839691162109375, -0.06822967529296875, -0.052490234375, -0.03675079345703125, -0.0210113525390625, -0.00527191162109375, 0.010467529296875, 0.02620697021484375, 0.0419464111328125, 0.05768585205078125, 0.07342529296875, 0.08916473388671875, 0.1049041748046875, 0.12064361572265625, 0.136383056640625, 0.15212249755859375, 0.1678619384765625, 0.18360137939453125, 0.1993408203125, 0.21508026123046875, 0.2308197021484375, 0.24655914306640625, 0.262298583984375, 0.27803802490234375, 0.2937774658203125, 0.30951690673828125, 0.32525634765625, 0.34099578857421875, 0.3567352294921875, 0.37247467041015625, 0.388214111328125, 0.40395355224609375, 0.4196929931640625, 0.43543243408203125, 0.451171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 14.0, 7.0, 16.0, 14.0, 18.0, 38.0, 53.0, 69.0, 122.0, 184.0, 300.0, 428.0, 603.0, 669.0, 511.0, 345.0, 215.0, 146.0, 96.0, 79.0, 43.0, 34.0, 28.0, 9.0, 7.0, 0.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.75390625, -0.7346878051757812, -0.7154693603515625, -0.6962509155273438, -0.677032470703125, -0.6578140258789062, -0.6385955810546875, -0.6193771362304688, -0.60015869140625, -0.5809402465820312, -0.5617218017578125, -0.5425033569335938, -0.523284912109375, -0.5040664672851562, -0.4848480224609375, -0.46562957763671875, -0.4464111328125, -0.42719268798828125, -0.4079742431640625, -0.38875579833984375, -0.369537353515625, -0.35031890869140625, -0.3311004638671875, -0.31188201904296875, -0.29266357421875, -0.27344512939453125, -0.2542266845703125, -0.23500823974609375, -0.215789794921875, -0.19657135009765625, -0.1773529052734375, -0.15813446044921875, -0.138916015625, -0.11969757080078125, -0.1004791259765625, -0.08126068115234375, -0.062042236328125, -0.04282379150390625, -0.0236053466796875, -0.00438690185546875, 0.01483154296875, 0.03404998779296875, 0.0532684326171875, 0.07248687744140625, 0.091705322265625, 0.11092376708984375, 0.1301422119140625, 0.14936065673828125, 0.1685791015625, 0.18779754638671875, 0.2070159912109375, 0.22623443603515625, 0.245452880859375, 0.26467132568359375, 0.2838897705078125, 0.30310821533203125, 0.32232666015625, 0.34154510498046875, 0.3607635498046875, 0.37998199462890625, 0.399200439453125, 0.41841888427734375, 0.4376373291015625, 0.45685577392578125, 0.47607421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 10.0, 22.0, 59.0, 144.0, 197.0, 273.0, 151.0, 78.0, 36.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9995903968811035, -6.806433200836182, -6.61327600479126, -6.420118808746338, -6.226961612701416, -6.033804416656494, -5.840646743774414, -5.647489547729492, -5.45433235168457, -5.261175155639648, -5.068017959594727, -4.874860763549805, -4.681703567504883, -4.488546371459961, -4.295389175415039, -4.102231979370117, -3.9090747833251953, -3.7159175872802734, -3.5227603912353516, -3.3296031951904297, -3.136445999145508, -2.943288803100586, -2.750131368637085, -2.556974172592163, -2.363816976547241, -2.1706597805023193, -1.9775025844573975, -1.784345269203186, -1.5911880731582642, -1.3980308771133423, -1.2048735618591309, -1.011716365814209, -0.8185586929321289, -0.625401496887207, -0.4322442412376404, -0.23908698558807373, -0.045929789543151855, 0.14722740650177002, 0.34038472175598145, 0.5335419178009033, 0.7266991138458252, 0.9198563098907471, 1.113013505935669, 1.3061708211898804, 1.4993280172348022, 1.6924852132797241, 1.8856425285339355, 2.0787997245788574, 2.2719569206237793, 2.465114116668701, 2.658271312713623, 2.851428508758545, 3.044585704803467, 3.2377429008483887, 3.4309003353118896, 3.6240575313568115, 3.8172147274017334, 4.010372161865234, 4.203529357910156, 4.396686553955078, 4.58984375, 4.783000946044922, 4.976158142089844, 5.169315338134766, 5.3624725341796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 14.0, 12.0, 11.0, 19.0, 20.0, 26.0, 40.0, 44.0, 38.0, 42.0, 56.0, 71.0, 58.0, 61.0, 75.0, 43.0, 55.0, 48.0, 43.0, 35.0, 24.0, 30.0, 25.0, 28.0, 17.0, 16.0, 11.0, 11.0, 8.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.229010581970215, -2.1601381301879883, -2.091265916824341, -2.0223934650421143, -1.9535212516784668, -1.8846487998962402, -1.8157764673233032, -1.7469041347503662, -1.6780318021774292, -1.6091594696044922, -1.5402871370315552, -1.4714148044586182, -1.4025423526763916, -1.3336701393127441, -1.2647976875305176, -1.1959253549575806, -1.1270530223846436, -1.0581806898117065, -0.9893083572387695, -0.9204359650611877, -0.8515636324882507, -0.7826912999153137, -0.7138189077377319, -0.6449465751647949, -0.5760742425918579, -0.5072019100189209, -0.4383295476436615, -0.3694571852684021, -0.3005848526954651, -0.23171252012252808, -0.16284015774726868, -0.09396779537200928, -0.025095701217651367, 0.04377664625644684, 0.11264899373054504, 0.18152134120464325, 0.25039368867874146, 0.31926602125167847, 0.38813838362693787, 0.45701074600219727, 0.5258830785751343, 0.5947554111480713, 0.6636277437210083, 0.7325001358985901, 0.8013724684715271, 0.8702448010444641, 0.9391171932220459, 1.007989525794983, 1.07686185836792, 1.145734190940857, 1.214606523513794, 1.283478856086731, 1.352351188659668, 1.4212236404418945, 1.4900959730148315, 1.5589683055877686, 1.6278406381607056, 1.6967129707336426, 1.7655853033065796, 1.8344576358795166, 1.9033300876617432, 1.9722023010253906, 2.041074752807617, 2.1099472045898438, 2.178819417953491]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 8.0, 11.0, 8.0, 6.0, 13.0, 12.0, 26.0, 35.0, 48.0, 82.0, 111.0, 190.0, 296.0, 585.0, 891.0, 1792.0, 3416.0, 6248.0, 12592.0, 24492.0, 48689.0, 91940.0, 160636.0, 217723.0, 200236.0, 130746.0, 71861.0, 36949.0, 18574.0, 9590.0, 4961.0, 2557.0, 1350.0, 776.0, 421.0, 262.0, 137.0, 93.0, 70.0, 50.0, 26.0, 14.0, 14.0, 8.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2617645263671875, -0.253265380859375, -0.2447662353515625, -0.23626708984375, -0.2277679443359375, -0.219268798828125, -0.2107696533203125, -0.2022705078125, -0.1937713623046875, -0.185272216796875, -0.1767730712890625, -0.16827392578125, -0.1597747802734375, -0.151275634765625, -0.1427764892578125, -0.13427734375, -0.1257781982421875, -0.117279052734375, -0.1087799072265625, -0.10028076171875, -0.0917816162109375, -0.083282470703125, -0.0747833251953125, -0.0662841796875, -0.0577850341796875, -0.049285888671875, -0.0407867431640625, -0.03228759765625, -0.0237884521484375, -0.015289306640625, -0.0067901611328125, 0.001708984375, 0.0102081298828125, 0.018707275390625, 0.0272064208984375, 0.03570556640625, 0.0442047119140625, 0.052703857421875, 0.0612030029296875, 0.0697021484375, 0.0782012939453125, 0.086700439453125, 0.0951995849609375, 0.10369873046875, 0.1121978759765625, 0.120697021484375, 0.1291961669921875, 0.1376953125, 0.1461944580078125, 0.154693603515625, 0.1631927490234375, 0.17169189453125, 0.1801910400390625, 0.188690185546875, 0.1971893310546875, 0.2056884765625, 0.2141876220703125, 0.222686767578125, 0.2311859130859375, 0.23968505859375, 0.2481842041015625, 0.256683349609375, 0.2651824951171875, 0.273681640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 12.0, 4.0, 5.0, 15.0, 19.0, 25.0, 25.0, 27.0, 40.0, 29.0, 47.0, 42.0, 47.0, 62.0, 50.0, 46.0, 50.0, 52.0, 41.0, 50.0, 47.0, 43.0, 38.0, 28.0, 30.0, 24.0, 17.0, 17.0, 17.0, 10.0, 8.0, 12.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.34830474853515625, -0.3355255126953125, -0.32274627685546875, -0.309967041015625, -0.29718780517578125, -0.2844085693359375, -0.27162933349609375, -0.25885009765625, -0.24607086181640625, -0.2332916259765625, -0.22051239013671875, -0.207733154296875, -0.19495391845703125, -0.1821746826171875, -0.16939544677734375, -0.1566162109375, -0.14383697509765625, -0.1310577392578125, -0.11827850341796875, -0.105499267578125, -0.09272003173828125, -0.0799407958984375, -0.06716156005859375, -0.05438232421875, -0.04160308837890625, -0.0288238525390625, -0.01604461669921875, -0.003265380859375, 0.00951385498046875, 0.0222930908203125, 0.03507232666015625, 0.0478515625, 0.06063079833984375, 0.0734100341796875, 0.08618927001953125, 0.098968505859375, 0.11174774169921875, 0.1245269775390625, 0.13730621337890625, 0.15008544921875, 0.16286468505859375, 0.1756439208984375, 0.18842315673828125, 0.201202392578125, 0.21398162841796875, 0.2267608642578125, 0.23954010009765625, 0.2523193359375, 0.26509857177734375, 0.2778778076171875, 0.29065704345703125, 0.303436279296875, 0.31621551513671875, 0.3289947509765625, 0.34177398681640625, 0.35455322265625, 0.36733245849609375, 0.3801116943359375, 0.39289093017578125, 0.405670166015625, 0.41844940185546875, 0.4312286376953125, 0.44400787353515625, 0.456787109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 12.0, 13.0, 26.0, 32.0, 47.0, 75.0, 124.0, 217.0, 397.0, 821.0, 1532.0, 3532.0, 8267.0, 20644.0, 54851.0, 143575.0, 319427.0, 285607.0, 128629.0, 48502.0, 18468.0, 7548.0, 3148.0, 1395.0, 760.0, 397.0, 206.0, 99.0, 72.0, 37.0, 18.0, 19.0, 11.0, 7.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.451904296875, -0.4396705627441406, -0.42743682861328125, -0.4152030944824219, -0.4029693603515625, -0.3907356262207031, -0.37850189208984375, -0.3662681579589844, -0.354034423828125, -0.3418006896972656, -0.32956695556640625, -0.3173332214355469, -0.3050994873046875, -0.2928657531738281, -0.28063201904296875, -0.2683982849121094, -0.25616455078125, -0.24393081665039062, -0.23169708251953125, -0.21946334838867188, -0.2072296142578125, -0.19499588012695312, -0.18276214599609375, -0.17052841186523438, -0.158294677734375, -0.14606094360351562, -0.13382720947265625, -0.12159347534179688, -0.1093597412109375, -0.09712600708007812, -0.08489227294921875, -0.07265853881835938, -0.0604248046875, -0.048191070556640625, -0.03595733642578125, -0.023723602294921875, -0.0114898681640625, 0.000743865966796875, 0.01297760009765625, 0.025211334228515625, 0.037445068359375, 0.049678802490234375, 0.06191253662109375, 0.07414627075195312, 0.0863800048828125, 0.09861373901367188, 0.11084747314453125, 0.12308120727539062, 0.13531494140625, 0.14754867553710938, 0.15978240966796875, 0.17201614379882812, 0.1842498779296875, 0.19648361206054688, 0.20871734619140625, 0.22095108032226562, 0.233184814453125, 0.24541854858398438, 0.25765228271484375, 0.2698860168457031, 0.2821197509765625, 0.2943534851074219, 0.30658721923828125, 0.3188209533691406, 0.3310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 7.0, 18.0, 15.0, 17.0, 24.0, 23.0, 25.0, 24.0, 28.0, 44.0, 34.0, 37.0, 34.0, 52.0, 51.0, 42.0, 40.0, 41.0, 44.0, 39.0, 45.0, 30.0, 24.0, 30.0, 30.0, 34.0, 18.0, 27.0, 18.0, 13.0, 15.0, 12.0, 10.0, 10.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9443359375, -0.91766357421875, -0.8909912109375, -0.86431884765625, -0.837646484375, -0.81097412109375, -0.7843017578125, -0.75762939453125, -0.73095703125, -0.70428466796875, -0.6776123046875, -0.65093994140625, -0.624267578125, -0.59759521484375, -0.5709228515625, -0.54425048828125, -0.517578125, -0.49090576171875, -0.4642333984375, -0.43756103515625, -0.410888671875, -0.38421630859375, -0.3575439453125, -0.33087158203125, -0.30419921875, -0.27752685546875, -0.2508544921875, -0.22418212890625, -0.197509765625, -0.17083740234375, -0.1441650390625, -0.11749267578125, -0.0908203125, -0.06414794921875, -0.0374755859375, -0.01080322265625, 0.015869140625, 0.04254150390625, 0.0692138671875, 0.09588623046875, 0.12255859375, 0.14923095703125, 0.1759033203125, 0.20257568359375, 0.229248046875, 0.25592041015625, 0.2825927734375, 0.30926513671875, 0.3359375, 0.36260986328125, 0.3892822265625, 0.41595458984375, 0.442626953125, 0.46929931640625, 0.4959716796875, 0.52264404296875, 0.54931640625, 0.57598876953125, 0.6026611328125, 0.62933349609375, 0.656005859375, 0.68267822265625, 0.7093505859375, 0.73602294921875, 0.7626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 11.0, 10.0, 11.0, 27.0, 23.0, 58.0, 68.0, 101.0, 150.0, 175.0, 316.0, 560.0, 776.0, 1294.0, 2371.0, 5211.0, 15488.0, 66316.0, 301233.0, 480478.0, 130498.0, 27864.0, 7881.0, 3316.0, 1634.0, 923.0, 585.0, 354.0, 257.0, 160.0, 139.0, 88.0, 47.0, 36.0, 21.0, 16.0, 16.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.17822265625, -0.1734333038330078, -0.16864395141601562, -0.16385459899902344, -0.15906524658203125, -0.15427589416503906, -0.14948654174804688, -0.1446971893310547, -0.1399078369140625, -0.1351184844970703, -0.13032913208007812, -0.12553977966308594, -0.12075042724609375, -0.11596107482910156, -0.11117172241210938, -0.10638236999511719, -0.101593017578125, -0.09680366516113281, -0.09201431274414062, -0.08722496032714844, -0.08243560791015625, -0.07764625549316406, -0.07285690307617188, -0.06806755065917969, -0.0632781982421875, -0.05848884582519531, -0.053699493408203125, -0.04891014099121094, -0.04412078857421875, -0.03933143615722656, -0.034542083740234375, -0.029752731323242188, -0.02496337890625, -0.020174026489257812, -0.015384674072265625, -0.010595321655273438, -0.00580596923828125, -0.0010166168212890625, 0.003772735595703125, 0.008562088012695312, 0.0133514404296875, 0.018140792846679688, 0.022930145263671875, 0.027719497680664062, 0.03250885009765625, 0.03729820251464844, 0.042087554931640625, 0.04687690734863281, 0.051666259765625, 0.05645561218261719, 0.061244964599609375, 0.06603431701660156, 0.07082366943359375, 0.07561302185058594, 0.08040237426757812, 0.08519172668457031, 0.0899810791015625, 0.09477043151855469, 0.09955978393554688, 0.10434913635253906, 0.10913848876953125, 0.11392784118652344, 0.11871719360351562, 0.12350654602050781, 0.1282958984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 24.0, 31.0, 89.0, 122.0, 196.0, 206.0, 137.0, 70.0, 32.0, 19.0, 12.0, 6.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.709596633911133e-05, -9.406637400388718e-05, -9.103678166866302e-05, -8.800718933343887e-05, -8.497759699821472e-05, -8.194800466299057e-05, -7.891841232776642e-05, -7.588881999254227e-05, -7.285922765731812e-05, -6.982963532209396e-05, -6.680004298686981e-05, -6.377045065164566e-05, -6.074085831642151e-05, -5.771126598119736e-05, -5.4681673645973206e-05, -5.1652081310749054e-05, -4.86224889755249e-05, -4.559289664030075e-05, -4.25633043050766e-05, -3.953371196985245e-05, -3.6504119634628296e-05, -3.3474527299404144e-05, -3.0444934964179993e-05, -2.741534262895584e-05, -2.438575029373169e-05, -2.1356157958507538e-05, -1.8326565623283386e-05, -1.5296973288059235e-05, -1.2267380952835083e-05, -9.237788617610931e-06, -6.20819628238678e-06, -3.178603947162628e-06, -1.4901161193847656e-07, 2.880580723285675e-06, 5.910173058509827e-06, 8.939765393733978e-06, 1.196935772895813e-05, 1.4998950064182281e-05, 1.8028542399406433e-05, 2.1058134734630585e-05, 2.4087727069854736e-05, 2.7117319405078888e-05, 3.014691174030304e-05, 3.317650407552719e-05, 3.620609641075134e-05, 3.9235688745975494e-05, 4.2265281081199646e-05, 4.52948734164238e-05, 4.832446575164795e-05, 5.13540580868721e-05, 5.438365042209625e-05, 5.7413242757320404e-05, 6.0442835092544556e-05, 6.347242742776871e-05, 6.650201976299286e-05, 6.953161209821701e-05, 7.256120443344116e-05, 7.559079676866531e-05, 7.862038910388947e-05, 8.164998143911362e-05, 8.467957377433777e-05, 8.770916610956192e-05, 9.073875844478607e-05, 9.376835078001022e-05, 9.679794311523438e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 10.0, 9.0, 13.0, 16.0, 18.0, 36.0, 33.0, 69.0, 107.0, 150.0, 234.0, 460.0, 857.0, 1719.0, 3588.0, 10118.0, 45605.0, 253515.0, 537217.0, 153965.0, 27527.0, 7237.0, 2902.0, 1394.0, 713.0, 377.0, 219.0, 156.0, 96.0, 74.0, 37.0, 32.0, 15.0, 11.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2232666015625, -0.2175922393798828, -0.21191787719726562, -0.20624351501464844, -0.20056915283203125, -0.19489479064941406, -0.18922042846679688, -0.1835460662841797, -0.1778717041015625, -0.1721973419189453, -0.16652297973632812, -0.16084861755371094, -0.15517425537109375, -0.14949989318847656, -0.14382553100585938, -0.1381511688232422, -0.132476806640625, -0.1268024444580078, -0.12112808227539062, -0.11545372009277344, -0.10977935791015625, -0.10410499572753906, -0.09843063354492188, -0.09275627136230469, -0.0870819091796875, -0.08140754699707031, -0.07573318481445312, -0.07005882263183594, -0.06438446044921875, -0.05871009826660156, -0.053035736083984375, -0.04736137390136719, -0.04168701171875, -0.03601264953613281, -0.030338287353515625, -0.024663925170898438, -0.01898956298828125, -0.013315200805664062, -0.007640838623046875, -0.0019664764404296875, 0.0037078857421875, 0.009382247924804688, 0.015056610107421875, 0.020730972290039062, 0.02640533447265625, 0.03207969665527344, 0.037754058837890625, 0.04342842102050781, 0.049102783203125, 0.05477714538574219, 0.060451507568359375, 0.06612586975097656, 0.07180023193359375, 0.07747459411621094, 0.08314895629882812, 0.08882331848144531, 0.0944976806640625, 0.10017204284667969, 0.10584640502929688, 0.11152076721191406, 0.11719512939453125, 0.12286949157714844, 0.12854385375976562, 0.1342182159423828, 0.139892578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 3.0, 7.0, 10.0, 9.0, 21.0, 30.0, 48.0, 59.0, 92.0, 96.0, 137.0, 112.0, 119.0, 87.0, 68.0, 38.0, 23.0, 10.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.333251953125, -0.32563018798828125, -0.3180084228515625, -0.31038665771484375, -0.302764892578125, -0.29514312744140625, -0.2875213623046875, -0.27989959716796875, -0.27227783203125, -0.26465606689453125, -0.2570343017578125, -0.24941253662109375, -0.241790771484375, -0.23416900634765625, -0.2265472412109375, -0.21892547607421875, -0.2113037109375, -0.20368194580078125, -0.1960601806640625, -0.18843841552734375, -0.180816650390625, -0.17319488525390625, -0.1655731201171875, -0.15795135498046875, -0.15032958984375, -0.14270782470703125, -0.1350860595703125, -0.12746429443359375, -0.119842529296875, -0.11222076416015625, -0.1045989990234375, -0.09697723388671875, -0.08935546875, -0.08173370361328125, -0.0741119384765625, -0.06649017333984375, -0.058868408203125, -0.05124664306640625, -0.0436248779296875, -0.03600311279296875, -0.02838134765625, -0.02075958251953125, -0.0131378173828125, -0.00551605224609375, 0.002105712890625, 0.00972747802734375, 0.0173492431640625, 0.02497100830078125, 0.0325927734375, 0.04021453857421875, 0.0478363037109375, 0.05545806884765625, 0.063079833984375, 0.07070159912109375, 0.0783233642578125, 0.08594512939453125, 0.09356689453125, 0.10118865966796875, 0.1088104248046875, 0.11643218994140625, 0.124053955078125, 0.13167572021484375, 0.1392974853515625, 0.14691925048828125, 0.154541015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 20.0, 47.0, 128.0, 232.0, 268.0, 170.0, 70.0, 27.0, 15.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990912914276123, -3.83859920501709, -3.6862857341766357, -3.5339720249176025, -3.3816585540771484, -3.2293448448181152, -3.077031135559082, -2.924717426300049, -2.7724039554595947, -2.6200902462005615, -2.4677767753601074, -2.315463066101074, -2.163149356842041, -2.010835886001587, -1.8585221767425537, -1.70620858669281, -1.5538949966430664, -1.4015814065933228, -1.249267816543579, -1.096954107284546, -0.9446405172348022, -0.7923269271850586, -0.6400132775306702, -0.48769962787628174, -0.3353860378265381, -0.18307241797447205, -0.030758798122406006, 0.12155482172966003, 0.2738684415817261, 0.4261820316314697, 0.5784956812858582, 0.7308093309402466, 0.883122444152832, 1.0354360342025757, 1.1877496242523193, 1.3400633335113525, 1.4923769235610962, 1.6446905136108398, 1.797004222869873, 1.9493178129196167, 2.1016314029693604, 2.2539451122283936, 2.4062585830688477, 2.558572292327881, 2.710886001586914, 2.863199472427368, 3.0155131816864014, 3.1678266525268555, 3.3201403617858887, 3.472454071044922, 3.624767541885376, 3.777081251144409, 3.9293947219848633, 4.0817084312438965, 4.23402214050293, 4.386335849761963, 4.538649559020996, 4.690963268280029, 4.8432769775390625, 4.9955902099609375, 5.147903919219971, 5.300217628479004, 5.452531337738037, 5.60484504699707, 5.757158279418945]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 7.0, 13.0, 10.0, 12.0, 13.0, 15.0, 23.0, 37.0, 25.0, 37.0, 60.0, 44.0, 40.0, 56.0, 51.0, 47.0, 53.0, 44.0, 49.0, 52.0, 58.0, 31.0, 36.0, 29.0, 28.0, 29.0, 12.0, 20.0, 13.0, 8.0, 10.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6188805103302, -2.541846513748169, -2.4648125171661377, -2.3877785205841064, -2.310744524002075, -2.233710289001465, -2.1566762924194336, -2.0796422958374023, -2.002608299255371, -1.9255743026733398, -1.8485403060913086, -1.7715063095092773, -1.6944721937179565, -1.6174381971359253, -1.540404200553894, -1.4633700847625732, -1.3863362073898315, -1.3093022108078003, -1.232268214225769, -1.1552340984344482, -1.078200101852417, -1.0011661052703857, -0.9241321086883545, -0.8470980525016785, -0.7700640559196472, -0.693030059337616, -0.6159960031509399, -0.5389620065689087, -0.46192798018455505, -0.3848939538002014, -0.30785995721817017, -0.23082590103149414, -0.1537919044494629, -0.07675788551568985, 0.0002761334180831909, 0.07731014490127563, 0.15434417128562927, 0.2313781976699829, 0.30841219425201416, 0.3854462504386902, 0.46248024702072144, 0.5395142436027527, 0.6165482997894287, 0.69358229637146, 0.7706162929534912, 0.8476503491401672, 0.9246843457221985, 1.0017184019088745, 1.0787523984909058, 1.155786395072937, 1.2328203916549683, 1.309854507446289, 1.3868885040283203, 1.4639225006103516, 1.5409564971923828, 1.617990493774414, 1.6950244903564453, 1.7720584869384766, 1.8490924835205078, 1.926126480102539, 2.0031604766845703, 2.0801944732666016, 2.157228469848633, 2.234262704849243, 2.3112967014312744]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 3.0, 8.0, 4.0, 19.0, 22.0, 30.0, 42.0, 53.0, 88.0, 131.0, 202.0, 353.0, 609.0, 1184.0, 2099.0, 4436.0, 10247.0, 26539.0, 70497.0, 175380.0, 370424.0, 635041.0, 852552.0, 835167.0, 605699.0, 345880.0, 154858.0, 59745.0, 23058.0, 9884.0, 4731.0, 2249.0, 1176.0, 701.0, 472.0, 272.0, 150.0, 108.0, 57.0, 32.0, 18.0, 22.0, 8.0, 13.0, 8.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23318862915039062, -0.22565460205078125, -0.21812057495117188, -0.2105865478515625, -0.20305252075195312, -0.19551849365234375, -0.18798446655273438, -0.180450439453125, -0.17291641235351562, -0.16538238525390625, -0.15784835815429688, -0.1503143310546875, -0.14278030395507812, -0.13524627685546875, -0.12771224975585938, -0.12017822265625, -0.11264419555664062, -0.10511016845703125, -0.09757614135742188, -0.0900421142578125, -0.08250808715820312, -0.07497406005859375, -0.06744003295898438, -0.059906005859375, -0.052371978759765625, -0.04483795166015625, -0.037303924560546875, -0.0297698974609375, -0.022235870361328125, -0.01470184326171875, -0.007167816162109375, 0.0003662109375, 0.007900238037109375, 0.01543426513671875, 0.022968292236328125, 0.0305023193359375, 0.038036346435546875, 0.04557037353515625, 0.053104400634765625, 0.060638427734375, 0.06817245483398438, 0.07570648193359375, 0.08324050903320312, 0.0907745361328125, 0.09830856323242188, 0.10584259033203125, 0.11337661743164062, 0.12091064453125, 0.12844467163085938, 0.13597869873046875, 0.14351272583007812, 0.1510467529296875, 0.15858078002929688, 0.16611480712890625, 0.17364883422851562, 0.181182861328125, 0.18871688842773438, 0.19625091552734375, 0.20378494262695312, 0.2113189697265625, 0.21885299682617188, 0.22638702392578125, 0.23392105102539062, 0.241455078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 14.0, 18.0, 15.0, 18.0, 17.0, 20.0, 25.0, 31.0, 28.0, 33.0, 33.0, 27.0, 31.0, 44.0, 53.0, 43.0, 57.0, 44.0, 40.0, 47.0, 35.0, 41.0, 29.0, 35.0, 34.0, 22.0, 26.0, 21.0, 21.0, 16.0, 14.0, 16.0, 11.0, 6.0, 4.0, 12.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.364013671875, -0.3537712097167969, -0.34352874755859375, -0.3332862854003906, -0.3230438232421875, -0.3128013610839844, -0.30255889892578125, -0.2923164367675781, -0.282073974609375, -0.2718315124511719, -0.26158905029296875, -0.2513465881347656, -0.2411041259765625, -0.23086166381835938, -0.22061920166015625, -0.21037673950195312, -0.20013427734375, -0.18989181518554688, -0.17964935302734375, -0.16940689086914062, -0.1591644287109375, -0.14892196655273438, -0.13867950439453125, -0.12843704223632812, -0.118194580078125, -0.10795211791992188, -0.09770965576171875, -0.08746719360351562, -0.0772247314453125, -0.06698226928710938, -0.05673980712890625, -0.046497344970703125, -0.0362548828125, -0.026012420654296875, -0.01576995849609375, -0.005527496337890625, 0.0047149658203125, 0.014957427978515625, 0.02519989013671875, 0.035442352294921875, 0.045684814453125, 0.055927276611328125, 0.06616973876953125, 0.07641220092773438, 0.0866546630859375, 0.09689712524414062, 0.10713958740234375, 0.11738204956054688, 0.12762451171875, 0.13786697387695312, 0.14810943603515625, 0.15835189819335938, 0.1685943603515625, 0.17883682250976562, 0.18907928466796875, 0.19932174682617188, 0.209564208984375, 0.21980667114257812, 0.23004913330078125, 0.24029159545898438, 0.2505340576171875, 0.2607765197753906, 0.27101898193359375, 0.2812614440917969, 0.29150390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 4.0, 12.0, 24.0, 28.0, 40.0, 112.0, 186.0, 333.0, 720.0, 1787.0, 5994.0, 35727.0, 776931.0, 3214548.0, 138491.0, 13690.0, 3311.0, 1158.0, 517.0, 257.0, 147.0, 84.0, 49.0, 33.0, 21.0, 14.0, 6.0, 5.0, 13.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7818603515625, -0.753173828125, -0.7244873046875, -0.69580078125, -0.6671142578125, -0.638427734375, -0.6097412109375, -0.5810546875, -0.5523681640625, -0.523681640625, -0.4949951171875, -0.46630859375, -0.4376220703125, -0.408935546875, -0.3802490234375, -0.3515625, -0.3228759765625, -0.294189453125, -0.2655029296875, -0.23681640625, -0.2081298828125, -0.179443359375, -0.1507568359375, -0.1220703125, -0.0933837890625, -0.064697265625, -0.0360107421875, -0.00732421875, 0.0213623046875, 0.050048828125, 0.0787353515625, 0.107421875, 0.1361083984375, 0.164794921875, 0.1934814453125, 0.22216796875, 0.2508544921875, 0.279541015625, 0.3082275390625, 0.3369140625, 0.3656005859375, 0.394287109375, 0.4229736328125, 0.45166015625, 0.4803466796875, 0.509033203125, 0.5377197265625, 0.56640625, 0.5950927734375, 0.623779296875, 0.6524658203125, 0.68115234375, 0.7098388671875, 0.738525390625, 0.7672119140625, 0.7958984375, 0.8245849609375, 0.853271484375, 0.8819580078125, 0.91064453125, 0.9393310546875, 0.968017578125, 0.9967041015625, 1.025390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 14.0, 15.0, 22.0, 28.0, 56.0, 85.0, 120.0, 196.0, 265.0, 383.0, 470.0, 506.0, 537.0, 405.0, 285.0, 211.0, 163.0, 93.0, 73.0, 45.0, 26.0, 22.0, 9.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.794921875, -0.77069091796875, -0.7464599609375, -0.72222900390625, -0.697998046875, -0.67376708984375, -0.6495361328125, -0.62530517578125, -0.60107421875, -0.57684326171875, -0.5526123046875, -0.52838134765625, -0.504150390625, -0.47991943359375, -0.4556884765625, -0.43145751953125, -0.4072265625, -0.38299560546875, -0.3587646484375, -0.33453369140625, -0.310302734375, -0.28607177734375, -0.2618408203125, -0.23760986328125, -0.21337890625, -0.18914794921875, -0.1649169921875, -0.14068603515625, -0.116455078125, -0.09222412109375, -0.0679931640625, -0.04376220703125, -0.01953125, 0.00469970703125, 0.0289306640625, 0.05316162109375, 0.077392578125, 0.10162353515625, 0.1258544921875, 0.15008544921875, 0.17431640625, 0.19854736328125, 0.2227783203125, 0.24700927734375, 0.271240234375, 0.29547119140625, 0.3197021484375, 0.34393310546875, 0.3681640625, 0.39239501953125, 0.4166259765625, 0.44085693359375, 0.465087890625, 0.48931884765625, 0.5135498046875, 0.53778076171875, 0.56201171875, 0.58624267578125, 0.6104736328125, 0.63470458984375, 0.658935546875, 0.68316650390625, 0.7073974609375, 0.73162841796875, 0.755859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 18.0, 15.0, 31.0, 39.0, 83.0, 129.0, 164.0, 148.0, 127.0, 92.0, 50.0, 38.0, 20.0, 15.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.603601455688477, -5.3700971603393555, -5.136593341827393, -4.90308952331543, -4.669585227966309, -4.4360809326171875, -4.202577114105225, -3.9690730571746826, -3.7355690002441406, -3.5020649433135986, -3.2685608863830566, -3.0350568294525146, -2.8015527725219727, -2.5680487155914307, -2.3345446586608887, -2.1010406017303467, -1.8675365447998047, -1.6340324878692627, -1.4005284309387207, -1.1670243740081787, -0.9335203170776367, -0.7000162601470947, -0.46651220321655273, -0.23300814628601074, 0.00049591064453125, 0.23399996757507324, 0.46750402450561523, 0.7010080814361572, 0.9345121383666992, 1.1680161952972412, 1.4015202522277832, 1.6350243091583252, 1.8685283660888672, 2.102032423019409, 2.335536479949951, 2.569040536880493, 2.802544593811035, 3.036048650741577, 3.269552707672119, 3.503056764602661, 3.736560821533203, 3.970064878463745, 4.203568935394287, 4.43707275390625, 4.670577049255371, 4.904081344604492, 5.137585163116455, 5.371088981628418, 5.604593276977539, 5.83809757232666, 6.071601390838623, 6.305105209350586, 6.538609504699707, 6.772113800048828, 7.005617618560791, 7.239121437072754, 7.472625732421875, 7.706130027770996, 7.939633846282959, 8.173137664794922, 8.406641960144043, 8.640146255493164, 8.873649597167969, 9.10715389251709, 9.340658187866211]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 7.0, 9.0, 22.0, 13.0, 26.0, 33.0, 24.0, 31.0, 33.0, 40.0, 42.0, 40.0, 52.0, 64.0, 43.0, 52.0, 47.0, 47.0, 41.0, 44.0, 37.0, 34.0, 21.0, 32.0, 16.0, 20.0, 19.0, 13.0, 11.0, 11.0, 11.0, 9.0, 9.0, 6.0, 5.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7309513092041016, -2.641127347946167, -2.5513033866882324, -2.461479425430298, -2.3716554641723633, -2.2818312644958496, -2.192007541656494, -2.1021833419799805, -2.012359380722046, -1.9225354194641113, -1.8327114582061768, -1.7428874969482422, -1.653063416481018, -1.5632394552230835, -1.473415493965149, -1.3835914134979248, -1.2937675714492798, -1.2039436101913452, -1.1141196489334106, -1.0242955684661865, -0.934471607208252, -0.8446476459503174, -0.7548236846923828, -0.6649996638298035, -0.5751757025718689, -0.48535171151161194, -0.395527720451355, -0.3057037591934204, -0.21587976813316345, -0.1260557770729065, -0.036231815814971924, 0.05359220504760742, 0.143416166305542, 0.23324015736579895, 0.3230641484260559, 0.4128881096839905, 0.5027121305465698, 0.5925360918045044, 0.682360053062439, 0.7721840739250183, 0.8620080351829529, 0.9518319964408875, 1.0416560173034668, 1.1314799785614014, 1.221303939819336, 1.3111279010772705, 1.400951862335205, 1.4907759428024292, 1.5805999040603638, 1.6704238653182983, 1.760247826576233, 1.850071907043457, 1.9398958683013916, 2.029719829559326, 2.1195437908172607, 2.2093677520751953, 2.29919171333313, 2.3890156745910645, 2.478839635848999, 2.5686635971069336, 2.658487558364868, 2.7483115196228027, 2.8381357192993164, 2.927959680557251, 3.0177836418151855]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 18.0, 11.0, 15.0, 37.0, 64.0, 89.0, 125.0, 214.0, 443.0, 809.0, 1662.0, 4231.0, 12736.0, 50390.0, 275546.0, 545249.0, 118969.0, 25404.0, 7272.0, 2659.0, 1204.0, 593.0, 307.0, 186.0, 111.0, 73.0, 42.0, 35.0, 14.0, 9.0, 10.0, 2.0, 5.0, 4.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499755859375, -0.4826774597167969, -0.46559906005859375, -0.4485206604003906, -0.4314422607421875, -0.4143638610839844, -0.39728546142578125, -0.3802070617675781, -0.363128662109375, -0.3460502624511719, -0.32897186279296875, -0.3118934631347656, -0.2948150634765625, -0.2777366638183594, -0.26065826416015625, -0.24357986450195312, -0.22650146484375, -0.20942306518554688, -0.19234466552734375, -0.17526626586914062, -0.1581878662109375, -0.14110946655273438, -0.12403106689453125, -0.10695266723632812, -0.089874267578125, -0.07279586791992188, -0.05571746826171875, -0.038639068603515625, -0.0215606689453125, -0.004482269287109375, 0.01259613037109375, 0.029674530029296875, 0.0467529296875, 0.06383132934570312, 0.08090972900390625, 0.09798812866210938, 0.1150665283203125, 0.13214492797851562, 0.14922332763671875, 0.16630172729492188, 0.183380126953125, 0.20045852661132812, 0.21753692626953125, 0.23461532592773438, 0.2516937255859375, 0.2687721252441406, 0.28585052490234375, 0.3029289245605469, 0.32000732421875, 0.3370857238769531, 0.35416412353515625, 0.3712425231933594, 0.3883209228515625, 0.4053993225097656, 0.42247772216796875, 0.4395561218261719, 0.456634521484375, 0.4737129211425781, 0.49079132080078125, 0.5078697204589844, 0.5249481201171875, 0.5420265197753906, 0.5591049194335938, 0.5761833190917969, 0.59326171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 10.0, 18.0, 14.0, 21.0, 42.0, 43.0, 39.0, 51.0, 54.0, 64.0, 82.0, 83.0, 71.0, 69.0, 70.0, 45.0, 46.0, 43.0, 36.0, 23.0, 15.0, 16.0, 8.0, 7.0, 12.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8104934692382812, -0.7894439697265625, -0.7683944702148438, -0.747344970703125, -0.7262954711914062, -0.7052459716796875, -0.6841964721679688, -0.66314697265625, -0.6420974731445312, -0.6210479736328125, -0.5999984741210938, -0.578948974609375, -0.5578994750976562, -0.5368499755859375, -0.5158004760742188, -0.4947509765625, -0.47370147705078125, -0.4526519775390625, -0.43160247802734375, -0.410552978515625, -0.38950347900390625, -0.3684539794921875, -0.34740447998046875, -0.32635498046875, -0.30530548095703125, -0.2842559814453125, -0.26320648193359375, -0.242156982421875, -0.22110748291015625, -0.2000579833984375, -0.17900848388671875, -0.157958984375, -0.13690948486328125, -0.1158599853515625, -0.09481048583984375, -0.073760986328125, -0.05271148681640625, -0.0316619873046875, -0.01061248779296875, 0.01043701171875, 0.03148651123046875, 0.0525360107421875, 0.07358551025390625, 0.094635009765625, 0.11568450927734375, 0.1367340087890625, 0.15778350830078125, 0.1788330078125, 0.19988250732421875, 0.2209320068359375, 0.24198150634765625, 0.263031005859375, 0.28408050537109375, 0.3051300048828125, 0.32617950439453125, 0.34722900390625, 0.36827850341796875, 0.3893280029296875, 0.41037750244140625, 0.431427001953125, 0.45247650146484375, 0.4735260009765625, 0.49457550048828125, 0.515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 10.0, 14.0, 15.0, 13.0, 20.0, 36.0, 56.0, 74.0, 107.0, 151.0, 201.0, 387.0, 666.0, 1127.0, 2011.0, 3889.0, 8036.0, 17483.0, 43236.0, 125842.0, 419149.0, 282836.0, 85935.0, 30981.0, 12938.0, 6147.0, 3067.0, 1653.0, 951.0, 520.0, 320.0, 221.0, 149.0, 89.0, 63.0, 55.0, 23.0, 24.0, 18.0, 7.0, 10.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.2374897003173828, -0.22925186157226562, -0.22101402282714844, -0.21277618408203125, -0.20453834533691406, -0.19630050659179688, -0.1880626678466797, -0.1798248291015625, -0.1715869903564453, -0.16334915161132812, -0.15511131286621094, -0.14687347412109375, -0.13863563537597656, -0.13039779663085938, -0.12215995788574219, -0.113922119140625, -0.10568428039550781, -0.09744644165039062, -0.08920860290527344, -0.08097076416015625, -0.07273292541503906, -0.06449508666992188, -0.05625724792480469, -0.0480194091796875, -0.03978157043457031, -0.031543731689453125, -0.023305892944335938, -0.01506805419921875, -0.0068302154541015625, 0.001407623291015625, 0.009645462036132812, 0.01788330078125, 0.026121139526367188, 0.034358978271484375, 0.04259681701660156, 0.05083465576171875, 0.05907249450683594, 0.06731033325195312, 0.07554817199707031, 0.0837860107421875, 0.09202384948730469, 0.10026168823242188, 0.10849952697753906, 0.11673736572265625, 0.12497520446777344, 0.13321304321289062, 0.1414508819580078, 0.149688720703125, 0.1579265594482422, 0.16616439819335938, 0.17440223693847656, 0.18264007568359375, 0.19087791442871094, 0.19911575317382812, 0.2073535919189453, 0.2155914306640625, 0.2238292694091797, 0.23206710815429688, 0.24030494689941406, 0.24854278564453125, 0.25678062438964844, 0.2650184631347656, 0.2732563018798828, 0.281494140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 9.0, 10.0, 14.0, 22.0, 14.0, 21.0, 30.0, 37.0, 39.0, 59.0, 58.0, 65.0, 69.0, 78.0, 89.0, 63.0, 62.0, 47.0, 47.0, 36.0, 30.0, 22.0, 17.0, 15.0, 16.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23046875, -1.186737060546875, -1.14300537109375, -1.099273681640625, -1.0555419921875, -1.011810302734375, -0.96807861328125, -0.924346923828125, -0.880615234375, -0.836883544921875, -0.79315185546875, -0.749420166015625, -0.7056884765625, -0.661956787109375, -0.61822509765625, -0.574493408203125, -0.53076171875, -0.487030029296875, -0.44329833984375, -0.399566650390625, -0.3558349609375, -0.312103271484375, -0.26837158203125, -0.224639892578125, -0.180908203125, -0.137176513671875, -0.09344482421875, -0.049713134765625, -0.0059814453125, 0.037750244140625, 0.08148193359375, 0.125213623046875, 0.1689453125, 0.212677001953125, 0.25640869140625, 0.300140380859375, 0.3438720703125, 0.387603759765625, 0.43133544921875, 0.475067138671875, 0.518798828125, 0.562530517578125, 0.60626220703125, 0.649993896484375, 0.6937255859375, 0.737457275390625, 0.78118896484375, 0.824920654296875, 0.86865234375, 0.912384033203125, 0.95611572265625, 0.999847412109375, 1.0435791015625, 1.087310791015625, 1.13104248046875, 1.174774169921875, 1.218505859375, 1.262237548828125, 1.30596923828125, 1.349700927734375, 1.3934326171875, 1.437164306640625, 1.48089599609375, 1.524627685546875, 1.568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 9.0, 10.0, 26.0, 51.0, 141.0, 336.0, 1314.0, 8616.0, 1004994.0, 29612.0, 2521.0, 577.0, 170.0, 82.0, 48.0, 21.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4899024963378906, -0.47443389892578125, -0.4589653015136719, -0.4434967041015625, -0.4280281066894531, -0.41255950927734375, -0.3970909118652344, -0.381622314453125, -0.3661537170410156, -0.35068511962890625, -0.3352165222167969, -0.3197479248046875, -0.3042793273925781, -0.28881072998046875, -0.2733421325683594, -0.25787353515625, -0.24240493774414062, -0.22693634033203125, -0.21146774291992188, -0.1959991455078125, -0.18053054809570312, -0.16506195068359375, -0.14959335327148438, -0.134124755859375, -0.11865615844726562, -0.10318756103515625, -0.08771896362304688, -0.0722503662109375, -0.056781768798828125, -0.04131317138671875, -0.025844573974609375, -0.0103759765625, 0.005092620849609375, 0.02056121826171875, 0.036029815673828125, 0.0514984130859375, 0.06696701049804688, 0.08243560791015625, 0.09790420532226562, 0.113372802734375, 0.12884140014648438, 0.14430999755859375, 0.15977859497070312, 0.1752471923828125, 0.19071578979492188, 0.20618438720703125, 0.22165298461914062, 0.23712158203125, 0.2525901794433594, 0.26805877685546875, 0.2835273742675781, 0.2989959716796875, 0.3144645690917969, 0.32993316650390625, 0.3454017639160156, 0.360870361328125, 0.3763389587402344, 0.39180755615234375, 0.4072761535644531, 0.4227447509765625, 0.4382133483886719, 0.45368194580078125, 0.4691505432128906, 0.484619140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 24.0, 40.0, 92.0, 148.0, 200.0, 196.0, 137.0, 78.0, 35.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.074256867170334e-05, -3.9165839552879333e-05, -3.758911043405533e-05, -3.601238131523132e-05, -3.443565219640732e-05, -3.285892307758331e-05, -3.128219395875931e-05, -2.9705464839935303e-05, -2.8128735721111298e-05, -2.6552006602287292e-05, -2.4975277483463287e-05, -2.3398548364639282e-05, -2.1821819245815277e-05, -2.0245090126991272e-05, -1.8668361008167267e-05, -1.7091631889343262e-05, -1.5514902770519257e-05, -1.3938173651695251e-05, -1.2361444532871246e-05, -1.0784715414047241e-05, -9.207986295223236e-06, -7.631257176399231e-06, -6.054528057575226e-06, -4.477798938751221e-06, -2.9010698199272156e-06, -1.3243407011032104e-06, 2.523884177207947e-07, 1.8291175365447998e-06, 3.405846655368805e-06, 4.98257577419281e-06, 6.559304893016815e-06, 8.13603401184082e-06, 9.712763130664825e-06, 1.128949224948883e-05, 1.2866221368312836e-05, 1.444295048713684e-05, 1.6019679605960846e-05, 1.759640872478485e-05, 1.9173137843608856e-05, 2.074986696243286e-05, 2.2326596081256866e-05, 2.390332520008087e-05, 2.5480054318904877e-05, 2.7056783437728882e-05, 2.8633512556552887e-05, 3.0210241675376892e-05, 3.17869707942009e-05, 3.33636999130249e-05, 3.494042903184891e-05, 3.651715815067291e-05, 3.809388726949692e-05, 3.967061638832092e-05, 4.124734550714493e-05, 4.282407462596893e-05, 4.440080374479294e-05, 4.597753286361694e-05, 4.755426198244095e-05, 4.9130991101264954e-05, 5.070772022008896e-05, 5.2284449338912964e-05, 5.386117845773697e-05, 5.5437907576560974e-05, 5.701463669538498e-05, 5.8591365814208984e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 8.0, 7.0, 10.0, 21.0, 25.0, 57.0, 111.0, 129.0, 233.0, 396.0, 814.0, 1665.0, 4045.0, 14688.0, 132038.0, 788536.0, 88034.0, 11451.0, 3230.0, 1267.0, 664.0, 423.0, 234.0, 163.0, 108.0, 48.0, 35.0, 30.0, 13.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16140365600585938, -0.15642547607421875, -0.15144729614257812, -0.1464691162109375, -0.14149093627929688, -0.13651275634765625, -0.13153457641601562, -0.126556396484375, -0.12157821655273438, -0.11660003662109375, -0.11162185668945312, -0.1066436767578125, -0.10166549682617188, -0.09668731689453125, -0.09170913696289062, -0.08673095703125, -0.08175277709960938, -0.07677459716796875, -0.07179641723632812, -0.0668182373046875, -0.061840057373046875, -0.05686187744140625, -0.051883697509765625, -0.046905517578125, -0.041927337646484375, -0.03694915771484375, -0.031970977783203125, -0.0269927978515625, -0.022014617919921875, -0.01703643798828125, -0.012058258056640625, -0.007080078125, -0.002101898193359375, 0.00287628173828125, 0.007854461669921875, 0.0128326416015625, 0.017810821533203125, 0.02278900146484375, 0.027767181396484375, 0.032745361328125, 0.037723541259765625, 0.04270172119140625, 0.047679901123046875, 0.0526580810546875, 0.057636260986328125, 0.06261444091796875, 0.06759262084960938, 0.07257080078125, 0.07754898071289062, 0.08252716064453125, 0.08750534057617188, 0.0924835205078125, 0.09746170043945312, 0.10243988037109375, 0.10741806030273438, 0.112396240234375, 0.11737442016601562, 0.12235260009765625, 0.12733078002929688, 0.1323089599609375, 0.13728713989257812, 0.14226531982421875, 0.14724349975585938, 0.1522216796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 16.0, 18.0, 33.0, 43.0, 116.0, 193.0, 209.0, 167.0, 79.0, 40.0, 25.0, 18.0, 2.0, 7.0, 4.0, 11.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.407806396484375, -0.39715576171875, -0.386505126953125, -0.3758544921875, -0.365203857421875, -0.35455322265625, -0.343902587890625, -0.333251953125, -0.322601318359375, -0.31195068359375, -0.301300048828125, -0.2906494140625, -0.279998779296875, -0.26934814453125, -0.258697509765625, -0.248046875, -0.237396240234375, -0.22674560546875, -0.216094970703125, -0.2054443359375, -0.194793701171875, -0.18414306640625, -0.173492431640625, -0.162841796875, -0.152191162109375, -0.14154052734375, -0.130889892578125, -0.1202392578125, -0.109588623046875, -0.09893798828125, -0.088287353515625, -0.07763671875, -0.066986083984375, -0.05633544921875, -0.045684814453125, -0.0350341796875, -0.024383544921875, -0.01373291015625, -0.003082275390625, 0.007568359375, 0.018218994140625, 0.02886962890625, 0.039520263671875, 0.0501708984375, 0.060821533203125, 0.07147216796875, 0.082122802734375, 0.0927734375, 0.103424072265625, 0.11407470703125, 0.124725341796875, 0.1353759765625, 0.146026611328125, 0.15667724609375, 0.167327880859375, 0.177978515625, 0.188629150390625, 0.19927978515625, 0.209930419921875, 0.2205810546875, 0.231231689453125, 0.24188232421875, 0.252532958984375, 0.26318359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 12.0, 29.0, 60.0, 131.0, 323.0, 251.0, 102.0, 38.0, 18.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.016511917114258, -6.821351528167725, -6.626190662384033, -6.4310302734375, -6.235869407653809, -6.040709018707275, -5.845548629760742, -5.650387763977051, -5.455226898193359, -5.260066509246826, -5.064905643463135, -4.869745254516602, -4.67458438873291, -4.479423999786377, -4.284263610839844, -4.089102745056152, -3.893942356109619, -3.698781728744507, -3.5036211013793945, -3.3084607124328613, -3.11329984664917, -2.9181394577026367, -2.7229788303375244, -2.527818202972412, -2.3326575756073, -2.1374969482421875, -1.9423363208770752, -1.7471758127212524, -1.5520151853561401, -1.3568545579910278, -1.161694049835205, -0.9665334224700928, -0.7713727951049805, -0.5762121677398682, -0.38105159997940063, -0.1858910322189331, 0.0092695951461792, 0.2044302225112915, 0.39959073066711426, 0.5947513580322266, 0.7899119853973389, 0.9850726127624512, 1.1802332401275635, 1.3753937482833862, 1.5705543756484985, 1.7657150030136108, 1.9608755111694336, 2.156036138534546, 2.351196765899658, 2.5463573932647705, 2.741518020629883, 2.936678409576416, 3.1318392753601074, 3.3269996643066406, 3.522160291671753, 3.7173209190368652, 3.9124815464019775, 4.10764217376709, 4.302802562713623, 4.4979634284973145, 4.693123817443848, 4.888284683227539, 5.083445072174072, 5.2786054611206055, 5.473766326904297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 12.0, 14.0, 17.0, 31.0, 28.0, 49.0, 65.0, 67.0, 83.0, 134.0, 103.0, 83.0, 54.0, 59.0, 45.0, 34.0, 38.0, 18.0, 14.0, 17.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.387158393859863, -4.253346920013428, -4.11953592300415, -3.985724687576294, -3.8519134521484375, -3.718101978302002, -3.5842907428741455, -3.450479507446289, -3.3166682720184326, -3.182857036590576, -3.0490458011627197, -2.9152345657348633, -2.7814230918884277, -2.6476120948791504, -2.513800621032715, -2.3799893856048584, -2.246178150177002, -2.1123669147491455, -1.978555679321289, -1.844744324684143, -1.7109330892562866, -1.5771218538284302, -1.4433104991912842, -1.3094992637634277, -1.1756880283355713, -1.0418767929077148, -0.9080654978752136, -0.7742542028427124, -0.640442967414856, -0.5066317319869995, -0.3728204369544983, -0.23900914192199707, -0.10519838333129883, 0.028612881898880005, 0.16242414712905884, 0.29623541235923767, 0.4300466775894165, 0.563857913017273, 0.6976692080497742, 0.8314805030822754, 0.9652917385101318, 1.0991029739379883, 1.2329142093658447, 1.3667255640029907, 1.5005367994308472, 1.6343480348587036, 1.7681593894958496, 1.901970624923706, 2.0357818603515625, 2.169593095779419, 2.3034043312072754, 2.437215566635132, 2.5710268020629883, 2.704838275909424, 2.8386495113372803, 2.9724607467651367, 3.106271982192993, 3.2400832176208496, 3.373894453048706, 3.5077056884765625, 3.641517162322998, 3.7753281593322754, 3.909139633178711, 4.042950630187988, 4.176762104034424]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 9.0, 12.0, 16.0, 29.0, 29.0, 32.0, 37.0, 54.0, 284.0, 194.0, 65.0, 50.0, 30.0, 29.0, 24.0, 19.0, 12.0, 8.0, 10.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.720703125, -0.6966018676757812, -0.6725006103515625, -0.6483993530273438, -0.624298095703125, -0.6001968383789062, -0.5760955810546875, -0.5519943237304688, -0.52789306640625, -0.5037918090820312, -0.4796905517578125, -0.45558929443359375, -0.431488037109375, -0.40738677978515625, -0.3832855224609375, -0.35918426513671875, -0.3350830078125, -0.31098175048828125, -0.2868804931640625, -0.26277923583984375, -0.238677978515625, -0.21457672119140625, -0.1904754638671875, -0.16637420654296875, -0.14227294921875, -0.11817169189453125, -0.0940704345703125, -0.06996917724609375, -0.045867919921875, -0.02176666259765625, 0.0023345947265625, 0.02643585205078125, 0.050537109375, 0.07463836669921875, 0.0987396240234375, 0.12284088134765625, 0.146942138671875, 0.17104339599609375, 0.1951446533203125, 0.21924591064453125, 0.24334716796875, 0.26744842529296875, 0.2915496826171875, 0.31565093994140625, 0.339752197265625, 0.36385345458984375, 0.3879547119140625, 0.41205596923828125, 0.4361572265625, 0.46025848388671875, 0.4843597412109375, 0.5084609985351562, 0.532562255859375, 0.5566635131835938, 0.5807647705078125, 0.6048660278320312, 0.62896728515625, 0.6530685424804688, 0.6771697998046875, 0.7012710571289062, 0.725372314453125, 0.7494735717773438, 0.7735748291015625, 0.7976760864257812, 0.82177734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 17.0, 16.0, 24.0, 28.0, 30.0, 50.0, 78.0, 132.0, 156.0, 308.0, 555.0, 1098.0, 2526.0, 7333.0, 40323.0, 8280694.0, 43003.0, 7512.0, 2445.0, 1000.0, 503.0, 279.0, 160.0, 103.0, 47.0, 37.0, 37.0, 19.0, 20.0, 6.0, 10.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.582430362701416, -1.5390931367874146, -1.4957560300827026, -1.4524188041687012, -1.4090816974639893, -1.3657444715499878, -1.3224072456359863, -1.2790701389312744, -1.2357330322265625, -1.192395806312561, -1.1490586996078491, -1.1057214736938477, -1.0623843669891357, -1.0190471410751343, -0.9757099747657776, -0.9323728084564209, -0.8890355825424194, -0.8456984162330627, -0.802361249923706, -0.7590240240097046, -0.7156869173049927, -0.6723496913909912, -0.6290125250816345, -0.5856753587722778, -0.5423381924629211, -0.49900102615356445, -0.45566385984420776, -0.4123266637325287, -0.368989497423172, -0.3256523311138153, -0.28231513500213623, -0.23897796869277954, -0.1956409215927124, -0.1523037552833557, -0.10896657407283783, -0.06562939286231995, -0.022292226552963257, 0.021044939756393433, 0.06438213586807251, 0.1077193021774292, 0.1510564684867859, 0.19439363479614258, 0.23773081600666046, 0.28106799721717834, 0.32440516352653503, 0.3677423298358917, 0.4110795259475708, 0.4544166922569275, 0.4977538585662842, 0.5410910248756409, 0.5844281911849976, 0.627765417098999, 0.6711025238037109, 0.7144397497177124, 0.7577769160270691, 0.8011140823364258, 0.8444512486457825, 0.8877884149551392, 0.9311255812644958, 0.9744627475738525, 1.017799973487854, 1.061137080192566, 1.1044743061065674, 1.1478114128112793, 1.1911486387252808]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 2.0, 8.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.5420992374420166, -3.4338197708129883, -3.32554030418396, -3.2172608375549316, -3.1089813709259033, -3.000701904296875, -2.8924221992492676, -2.7841427326202393, -2.675863265991211, -2.5675837993621826, -2.4593043327331543, -2.351024866104126, -2.2427453994750977, -2.1344656944274902, -2.026186466217041, -1.9179067611694336, -1.8096274137496948, -1.7013479471206665, -1.5930684804916382, -1.4847888946533203, -1.376509428024292, -1.2682299613952637, -1.1599504947662354, -1.051671028137207, -0.9433915019035339, -0.8351120352745056, -0.7268325090408325, -0.6185530424118042, -0.5102735757827759, -0.4019940495491028, -0.29371458292007446, -0.18543505668640137, -0.07715559005737305, 0.031123898923397064, 0.13940338790416718, 0.2476828694343567, 0.3559623658657074, 0.4642418622970581, 0.5725213289260864, 0.6808008551597595, 0.7890803217887878, 0.8973597884178162, 1.0056393146514893, 1.1139187812805176, 1.222198247909546, 1.3304777145385742, 1.4387571811676025, 1.5470367670059204, 1.6553162336349487, 1.763595700263977, 1.8718751668930054, 1.9801547527313232, 2.0884342193603516, 2.19671368598938, 2.304993152618408, 2.4132726192474365, 2.521552085876465, 2.629831552505493, 2.7381110191345215, 2.84639048576355, 2.954669952392578, 3.0629496574401855, 3.1712288856506348, 3.279508590698242, 3.3877880573272705]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 6.0, 13.0, 16.0, 19.0, 36.0, 52.0, 56.0, 67.0, 77.0, 70.0, 92.0, 87.0, 78.0, 56.0, 74.0, 56.0, 30.0, 38.0, 19.0, 15.0, 10.0, 15.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6705474853515625, -0.651153564453125, -0.6317596435546875, -0.61236572265625, -0.5929718017578125, -0.573577880859375, -0.5541839599609375, -0.5347900390625, -0.5153961181640625, -0.496002197265625, -0.4766082763671875, -0.45721435546875, -0.4378204345703125, -0.418426513671875, -0.3990325927734375, -0.379638671875, -0.3602447509765625, -0.340850830078125, -0.3214569091796875, -0.30206298828125, -0.2826690673828125, -0.263275146484375, -0.2438812255859375, -0.2244873046875, -0.2050933837890625, -0.185699462890625, -0.1663055419921875, -0.14691162109375, -0.1275177001953125, -0.108123779296875, -0.0887298583984375, -0.0693359375, -0.0499420166015625, -0.030548095703125, -0.0111541748046875, 0.00823974609375, 0.0276336669921875, 0.047027587890625, 0.0664215087890625, 0.0858154296875, 0.1052093505859375, 0.124603271484375, 0.1439971923828125, 0.16339111328125, 0.1827850341796875, 0.202178955078125, 0.2215728759765625, 0.240966796875, 0.2603607177734375, 0.279754638671875, 0.2991485595703125, 0.31854248046875, 0.3379364013671875, 0.357330322265625, 0.3767242431640625, 0.3961181640625, 0.4155120849609375, 0.434906005859375, 0.4542999267578125, 0.47369384765625, 0.4930877685546875, 0.512481689453125, 0.5318756103515625, 0.55126953125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 17.0, 21.0, 45.0, 60.0, 119.0, 246.0, 410.0, 806.0, 1630.0, 3421.0, 7580.0, 18343.0, 53593.0, 202068.0, 165953.0, 42039.0, 15357.0, 6363.0, 3032.0, 1497.0, 734.0, 394.0, 225.0, 123.0, 59.0, 46.0, 25.0, 21.0, 7.0, 4.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3515625, -4.21514892578125, -4.0787353515625, -3.94232177734375, -3.805908203125, -3.66949462890625, -3.5330810546875, -3.39666748046875, -3.26025390625, -3.12384033203125, -2.9874267578125, -2.85101318359375, -2.714599609375, -2.57818603515625, -2.4417724609375, -2.30535888671875, -2.1689453125, -2.03253173828125, -1.8961181640625, -1.75970458984375, -1.623291015625, -1.48687744140625, -1.3504638671875, -1.21405029296875, -1.07763671875, -0.94122314453125, -0.8048095703125, -0.66839599609375, -0.531982421875, -0.39556884765625, -0.2591552734375, -0.12274169921875, 0.013671875, 0.15008544921875, 0.2864990234375, 0.42291259765625, 0.559326171875, 0.69573974609375, 0.8321533203125, 0.96856689453125, 1.10498046875, 1.24139404296875, 1.3778076171875, 1.51422119140625, 1.650634765625, 1.78704833984375, 1.9234619140625, 2.05987548828125, 2.1962890625, 2.33270263671875, 2.4691162109375, 2.60552978515625, 2.741943359375, 2.87835693359375, 3.0147705078125, 3.15118408203125, 3.28759765625, 3.42401123046875, 3.5604248046875, 3.69683837890625, 3.833251953125, 3.96966552734375, 4.1060791015625, 4.24249267578125, 4.37890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 13.0, 7.0, 6.0, 14.0, 18.0, 26.0, 43.0, 40.0, 43.0, 64.0, 64.0, 68.0, 77.0, 79.0, 87.0, 63.0, 61.0, 48.0, 40.0, 38.0, 30.0, 27.0, 9.0, 10.0, 8.0, 9.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44618988037109375, -0.4280242919921875, -0.40985870361328125, -0.391693115234375, -0.37352752685546875, -0.3553619384765625, -0.33719635009765625, -0.31903076171875, -0.30086517333984375, -0.2826995849609375, -0.26453399658203125, -0.246368408203125, -0.22820281982421875, -0.2100372314453125, -0.19187164306640625, -0.1737060546875, -0.15554046630859375, -0.1373748779296875, -0.11920928955078125, -0.101043701171875, -0.08287811279296875, -0.0647125244140625, -0.04654693603515625, -0.02838134765625, -0.01021575927734375, 0.0079498291015625, 0.02611541748046875, 0.044281005859375, 0.06244659423828125, 0.0806121826171875, 0.09877777099609375, 0.116943359375, 0.13510894775390625, 0.1532745361328125, 0.17144012451171875, 0.189605712890625, 0.20777130126953125, 0.2259368896484375, 0.24410247802734375, 0.26226806640625, 0.28043365478515625, 0.2985992431640625, 0.31676483154296875, 0.334930419921875, 0.35309600830078125, 0.3712615966796875, 0.38942718505859375, 0.4075927734375, 0.42575836181640625, 0.4439239501953125, 0.46208953857421875, 0.480255126953125, 0.49842071533203125, 0.5165863037109375, 0.5347518920898438, 0.55291748046875, 0.5710830688476562, 0.5892486572265625, 0.6074142456054688, 0.625579833984375, 0.6437454223632812, 0.6619110107421875, 0.6800765991210938, 0.6982421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 6.0, 10.0, 5.0, 16.0, 24.0, 30.0, 59.0, 90.0, 96.0, 58.0, 33.0, 18.0, 15.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.364755392074585, -2.3110127449035645, -2.257270097732544, -2.2035274505615234, -2.149784803390503, -2.0960421562194824, -2.042299747467041, -1.9885571002960205, -1.934814453125, -1.8810718059539795, -1.827329158782959, -1.773586630821228, -1.7198439836502075, -1.666101336479187, -1.6123586893081665, -1.5586161613464355, -1.504873514175415, -1.4511308670043945, -1.397388219833374, -1.343645691871643, -1.2899030447006226, -1.236160397529602, -1.1824177503585815, -1.1286752223968506, -1.0749324560165405, -1.02118980884552, -0.9674472212791443, -0.9137045741081238, -0.859961986541748, -0.8062193393707275, -0.752476692199707, -0.6987341046333313, -0.6449915170669556, -0.5912488698959351, -0.5375062823295593, -0.4837636351585388, -0.4300210475921631, -0.3762784004211426, -0.32253578305244446, -0.26879316568374634, -0.21505054831504822, -0.1613079309463501, -0.10756530612707138, -0.053822681307792664, -8.006393909454346e-05, 0.05366256833076477, 0.10740518569946289, 0.161147803068161, 0.21489042043685913, 0.26863303780555725, 0.32237565517425537, 0.3761183023452759, 0.4298608899116516, 0.4836035370826721, 0.5373461246490479, 0.5910887718200684, 0.6448314189910889, 0.6985740661621094, 0.7523166537284851, 0.8060593008995056, 0.8598018884658813, 0.9135445356369019, 0.9672871828079224, 1.0210297107696533, 1.0747723579406738]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 11.0, 14.0, 15.0, 25.0, 32.0, 86.0, 116.0, 69.0, 17.0, 17.0, 19.0, 4.0, 9.0, 7.0, 7.0, 10.0, 10.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7380106449127197, -3.6531708240509033, -3.568331003189087, -3.4834909439086914, -3.398651123046875, -3.3138113021850586, -3.228971481323242, -3.144131660461426, -3.0592918395996094, -2.974452018737793, -2.8896121978759766, -2.80477237701416, -2.7199323177337646, -2.6350924968719482, -2.550252676010132, -2.4654128551483154, -2.38057279586792, -2.2957329750061035, -2.210893154144287, -2.1260533332824707, -2.041213274002075, -1.9563734531402588, -1.8715336322784424, -1.786693811416626, -1.70185387134552, -1.6170140504837036, -1.5321741104125977, -1.4473342895507812, -1.3624944686889648, -1.2776545286178589, -1.1928147077560425, -1.1079747676849365, -1.0231349468231201, -0.9382950663566589, -0.8534551858901978, -0.7686153650283813, -0.6837754845619202, -0.598935604095459, -0.5140957832336426, -0.4292559027671814, -0.3444160223007202, -0.25957614183425903, -0.17473629117012024, -0.08989644050598145, -0.005056560039520264, 0.07978332042694092, 0.16462314128875732, 0.2494630217552185, 0.3343029022216797, 0.41914278268814087, 0.503982663154602, 0.5888224840164185, 0.6736623644828796, 0.7585022449493408, 0.8433420658111572, 0.9281819462776184, 1.0130218267440796, 1.097861647605896, 1.182701587677002, 1.2675414085388184, 1.3523812294006348, 1.4372211694717407, 1.5220609903335571, 1.606900930404663, 1.6917407512664795]}, "eval/loss": 2.135566473007202, "eval/bleu": 1.0140224330923163e-13, "eval/runtime": 2535.9584, "eval/samples_per_second": 5.82, "eval/steps_per_second": 0.728} \ No newline at end of file +{"train/loss": 1.1552, "train/learning_rate": 5.504587155963303e-08, "train/epoch": 3.0, "train/global_step": 4860, "_runtime": 68135, "_timestamp": 1651840403, "_step": 4869, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 5.0, 10.0, 17.0, 27.0, 56.0, 53.0, 50.0, 77.0, 82.0, 78.0, 106.0, 85.0, 75.0, 78.0, 51.0, 39.0, 42.0, 31.0, 14.0, 7.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1944289207458496, -1.1561001539230347, -1.1177713871002197, -1.0794426202774048, -1.0411138534545898, -1.002785086631775, -0.9644562602043152, -0.9261274933815002, -0.8877987265586853, -0.8494699597358704, -0.8111411929130554, -0.7728124260902405, -0.7344835996627808, -0.6961548328399658, -0.6578260660171509, -0.6194972991943359, -0.581168532371521, -0.542839765548706, -0.5045109987258911, -0.4661822021007538, -0.42785343527793884, -0.3895246684551239, -0.3511958718299866, -0.31286710500717163, -0.2745383381843567, -0.23620957136154175, -0.1978807896375656, -0.15955200791358948, -0.12122324109077454, -0.0828944742679596, -0.04456569254398346, -0.006236910820007324, 0.032091736793518066, 0.0704205110669136, 0.10874928534030914, 0.14707806706428528, 0.18540683388710022, 0.22373560070991516, 0.2620643973350525, 0.30039316415786743, 0.3387219309806824, 0.3770506978034973, 0.41537946462631226, 0.4537082612514496, 0.4920370280742645, 0.5303658246994019, 0.5686945915222168, 0.6070233583450317, 0.6453521251678467, 0.6836808919906616, 0.7220096588134766, 0.7603384256362915, 0.7986671924591064, 0.8369959592819214, 0.8753247857093811, 0.913653552532196, 0.951982319355011, 0.9903110861778259, 1.0286399126052856, 1.0669686794281006, 1.1052974462509155, 1.1436262130737305, 1.1819549798965454, 1.2202837467193604, 1.2586125135421753]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 8.0, 6.0, 7.0, 9.0, 14.0, 15.0, 18.0, 16.0, 34.0, 19.0, 36.0, 31.0, 26.0, 48.0, 46.0, 51.0, 35.0, 44.0, 50.0, 55.0, 49.0, 30.0, 44.0, 41.0, 45.0, 35.0, 28.0, 26.0, 27.0, 21.0, 20.0, 12.0, 12.0, 7.0, 14.0, 5.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103015661239624, -1.0644952058792114, -1.0259747505187988, -0.9874542951583862, -0.9489338397979736, -0.910413384437561, -0.8718928694725037, -0.8333724141120911, -0.7948519587516785, -0.7563315033912659, -0.7178110480308533, -0.6792905926704407, -0.6407700777053833, -0.6022496223449707, -0.5637291669845581, -0.5252087116241455, -0.4866882562637329, -0.4481678009033203, -0.4096473455429077, -0.37112686038017273, -0.33260640501976013, -0.29408594965934753, -0.25556546449661255, -0.21704500913619995, -0.17852455377578735, -0.14000409841537476, -0.10148362815380096, -0.06296316534280777, -0.024442702531814575, 0.014077752828598022, 0.052598223090171814, 0.0911186933517456, 0.12963902950286865, 0.16815948486328125, 0.20667995512485504, 0.24520042538642883, 0.28372088074684143, 0.32224133610725403, 0.360761821269989, 0.3992822766304016, 0.4378027319908142, 0.4763231873512268, 0.5148436427116394, 0.553364098072052, 0.5918846130371094, 0.630405068397522, 0.6689255237579346, 0.7074459791183472, 0.7459664344787598, 0.7844868898391724, 0.823007345199585, 0.8615278005599976, 0.9000482559204102, 0.9385687112808228, 0.9770892262458801, 1.0156097412109375, 1.0541300773620605, 1.0926505327224731, 1.1311709880828857, 1.1696914434432983, 1.208211898803711, 1.2467323541641235, 1.2852528095245361, 1.3237733840942383, 1.3622938394546509]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 7.0, 9.0, 9.0, 16.0, 24.0, 20.0, 54.0, 79.0, 104.0, 182.0, 238.0, 376.0, 653.0, 1058.0, 1821.0, 3245.0, 5959.0, 12128.0, 27782.0, 73139.0, 197084.0, 494329.0, 1041458.0, 1207892.0, 658688.0, 284331.0, 109642.0, 40525.0, 16219.0, 7568.0, 3915.0, 2210.0, 1295.0, 833.0, 506.0, 283.0, 183.0, 136.0, 80.0, 60.0, 43.0, 39.0, 21.0, 16.0, 10.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.433502197265625, -1.38262939453125, -1.331756591796875, -1.2808837890625, -1.230010986328125, -1.17913818359375, -1.128265380859375, -1.077392578125, -1.026519775390625, -0.97564697265625, -0.924774169921875, -0.8739013671875, -0.823028564453125, -0.77215576171875, -0.721282958984375, -0.67041015625, -0.619537353515625, -0.56866455078125, -0.517791748046875, -0.4669189453125, -0.416046142578125, -0.36517333984375, -0.314300537109375, -0.263427734375, -0.212554931640625, -0.16168212890625, -0.110809326171875, -0.0599365234375, -0.009063720703125, 0.04180908203125, 0.092681884765625, 0.1435546875, 0.194427490234375, 0.24530029296875, 0.296173095703125, 0.3470458984375, 0.397918701171875, 0.44879150390625, 0.499664306640625, 0.550537109375, 0.601409912109375, 0.65228271484375, 0.703155517578125, 0.7540283203125, 0.804901123046875, 0.85577392578125, 0.906646728515625, 0.95751953125, 1.008392333984375, 1.05926513671875, 1.110137939453125, 1.1610107421875, 1.211883544921875, 1.26275634765625, 1.313629150390625, 1.364501953125, 1.415374755859375, 1.46624755859375, 1.517120361328125, 1.5679931640625, 1.618865966796875, 1.66973876953125, 1.720611572265625, 1.771484375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 4.0, 11.0, 14.0, 8.0, 11.0, 8.0, 10.0, 19.0, 17.0, 21.0, 28.0, 22.0, 36.0, 42.0, 33.0, 37.0, 44.0, 34.0, 45.0, 39.0, 46.0, 34.0, 44.0, 52.0, 40.0, 36.0, 43.0, 27.0, 28.0, 24.0, 20.0, 21.0, 18.0, 12.0, 14.0, 6.0, 3.0, 7.0, 14.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.642578125, -1.5875701904296875, -1.532562255859375, -1.4775543212890625, -1.42254638671875, -1.3675384521484375, -1.312530517578125, -1.2575225830078125, -1.2025146484375, -1.1475067138671875, -1.092498779296875, -1.0374908447265625, -0.98248291015625, -0.9274749755859375, -0.872467041015625, -0.8174591064453125, -0.762451171875, -0.7074432373046875, -0.652435302734375, -0.5974273681640625, -0.54241943359375, -0.4874114990234375, -0.432403564453125, -0.3773956298828125, -0.3223876953125, -0.2673797607421875, -0.212371826171875, -0.1573638916015625, -0.10235595703125, -0.0473480224609375, 0.007659912109375, 0.0626678466796875, 0.11767578125, 0.1726837158203125, 0.227691650390625, 0.2826995849609375, 0.33770751953125, 0.3927154541015625, 0.447723388671875, 0.5027313232421875, 0.5577392578125, 0.6127471923828125, 0.667755126953125, 0.7227630615234375, 0.77777099609375, 0.8327789306640625, 0.887786865234375, 0.9427947998046875, 0.997802734375, 1.0528106689453125, 1.107818603515625, 1.1628265380859375, 1.21783447265625, 1.2728424072265625, 1.327850341796875, 1.3828582763671875, 1.4378662109375, 1.4928741455078125, 1.547882080078125, 1.6028900146484375, 1.65789794921875, 1.7129058837890625, 1.767913818359375, 1.8229217529296875, 1.8779296875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 1.0, 1.0, 7.0, 5.0, 8.0, 18.0, 18.0, 43.0, 62.0, 82.0, 155.0, 292.0, 618.0, 7555.0, 4181989.0, 2311.0, 473.0, 242.0, 147.0, 89.0, 62.0, 29.0, 25.0, 20.0, 11.0, 4.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0625, -24.209228515625, -23.35595703125, -22.502685546875, -21.6494140625, -20.796142578125, -19.94287109375, -19.089599609375, -18.236328125, -17.383056640625, -16.52978515625, -15.676513671875, -14.8232421875, -13.969970703125, -13.11669921875, -12.263427734375, -11.41015625, -10.556884765625, -9.70361328125, -8.850341796875, -7.9970703125, -7.143798828125, -6.29052734375, -5.437255859375, -4.583984375, -3.730712890625, -2.87744140625, -2.024169921875, -1.1708984375, -0.317626953125, 0.53564453125, 1.388916015625, 2.2421875, 3.095458984375, 3.94873046875, 4.802001953125, 5.6552734375, 6.508544921875, 7.36181640625, 8.215087890625, 9.068359375, 9.921630859375, 10.77490234375, 11.628173828125, 12.4814453125, 13.334716796875, 14.18798828125, 15.041259765625, 15.89453125, 16.747802734375, 17.60107421875, 18.454345703125, 19.3076171875, 20.160888671875, 21.01416015625, 21.867431640625, 22.720703125, 23.573974609375, 24.42724609375, 25.280517578125, 26.1337890625, 26.987060546875, 27.84033203125, 28.693603515625, 29.546875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 11.0, 21.0, 30.0, 45.0, 70.0, 107.0, 187.0, 293.0, 507.0, 796.0, 759.0, 443.0, 289.0, 149.0, 125.0, 74.0, 45.0, 34.0, 23.0, 14.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0732421875, -1.038543701171875, -1.00384521484375, -0.969146728515625, -0.9344482421875, -0.899749755859375, -0.86505126953125, -0.830352783203125, -0.795654296875, -0.760955810546875, -0.72625732421875, -0.691558837890625, -0.6568603515625, -0.622161865234375, -0.58746337890625, -0.552764892578125, -0.51806640625, -0.483367919921875, -0.44866943359375, -0.413970947265625, -0.3792724609375, -0.344573974609375, -0.30987548828125, -0.275177001953125, -0.240478515625, -0.205780029296875, -0.17108154296875, -0.136383056640625, -0.1016845703125, -0.066986083984375, -0.03228759765625, 0.002410888671875, 0.037109375, 0.071807861328125, 0.10650634765625, 0.141204833984375, 0.1759033203125, 0.210601806640625, 0.24530029296875, 0.279998779296875, 0.314697265625, 0.349395751953125, 0.38409423828125, 0.418792724609375, 0.4534912109375, 0.488189697265625, 0.52288818359375, 0.557586669921875, 0.59228515625, 0.626983642578125, 0.66168212890625, 0.696380615234375, 0.7310791015625, 0.765777587890625, 0.80047607421875, 0.835174560546875, 0.869873046875, 0.904571533203125, 0.93927001953125, 0.973968505859375, 1.0086669921875, 1.043365478515625, 1.07806396484375, 1.112762451171875, 1.1474609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 7.0, 12.0, 15.0, 21.0, 31.0, 34.0, 41.0, 39.0, 64.0, 63.0, 55.0, 76.0, 72.0, 76.0, 61.0, 59.0, 43.0, 35.0, 49.0, 30.0, 22.0, 24.0, 11.0, 10.0, 4.0, 6.0, 0.0, 8.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0], "bins": [-3.0117263793945312, -2.939441680908203, -2.867157220840454, -2.794872522354126, -2.722587823867798, -2.650303363800049, -2.5780186653137207, -2.5057339668273926, -2.4334492683410645, -2.3611645698547363, -2.2888801097869873, -2.216595411300659, -2.144310712814331, -2.072026252746582, -1.999741554260254, -1.9274568557739258, -1.8551723957061768, -1.7828878164291382, -1.71060311794281, -1.6383185386657715, -1.5660338401794434, -1.4937492609024048, -1.4214646816253662, -1.349179983139038, -1.2768954038619995, -1.204610824584961, -1.1323261260986328, -1.0600415468215942, -0.9877569079399109, -0.9154722690582275, -0.843187689781189, -0.7709030508995056, -0.6986182928085327, -0.6263336539268494, -0.554049015045166, -0.48176443576812744, -0.4094797968864441, -0.33719515800476074, -0.2649105489253998, -0.19262593984603882, -0.12034130096435547, -0.04805667698383331, 0.024227946996688843, 0.096512570977211, 0.16879719495773315, 0.2410818338394165, 0.31336644291877747, 0.3856510519981384, 0.4579356908798218, 0.5302203297615051, 0.6025049686431885, 0.674789547920227, 0.7470741868019104, 0.8193588256835938, 0.8916434049606323, 0.9639280438423157, 1.036212682723999, 1.1084972620010376, 1.1807819604873657, 1.2530665397644043, 1.3253512382507324, 1.397635817527771, 1.4699203968048096, 1.5422050952911377, 1.6144896745681763]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 17.0, 7.0, 12.0, 18.0, 19.0, 23.0, 28.0, 22.0, 27.0, 34.0, 37.0, 32.0, 40.0, 29.0, 38.0, 45.0, 43.0, 40.0, 37.0, 47.0, 47.0, 31.0, 41.0, 33.0, 31.0, 30.0, 29.0, 17.0, 14.0, 14.0, 11.0, 8.0, 19.0, 10.0, 10.0, 5.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9257923364639282, -1.874249815940857, -1.8227072954177856, -1.7711647748947144, -1.7196223735809326, -1.6680798530578613, -1.61653733253479, -1.5649948120117188, -1.5134522914886475, -1.4619097709655762, -1.4103672504425049, -1.3588247299194336, -1.3072822093963623, -1.255739688873291, -1.2041972875595093, -1.152654767036438, -1.1011122465133667, -1.0495697259902954, -0.9980272054672241, -0.9464847445487976, -0.8949422240257263, -0.843399703502655, -0.7918572425842285, -0.7403147220611572, -0.6887722015380859, -0.6372296810150146, -0.5856871604919434, -0.5341446995735168, -0.48260217905044556, -0.43105965852737427, -0.37951716780662537, -0.32797467708587646, -0.2764320373535156, -0.22488953173160553, -0.17334702610969543, -0.12180452048778534, -0.07026201486587524, -0.018719494342803955, 0.032822996377944946, 0.08436548709869385, 0.13590800762176514, 0.18745051324367523, 0.23899301886558533, 0.29053550958633423, 0.3420780301094055, 0.3936205506324768, 0.4451630413532257, 0.4967055320739746, 0.5482480525970459, 0.5997905731201172, 0.6513330936431885, 0.702875554561615, 0.7544180750846863, 0.8059605956077576, 0.8575030565261841, 0.9090455770492554, 0.9605880975723267, 1.012130618095398, 1.0636731386184692, 1.1152156591415405, 1.1667580604553223, 1.2183005809783936, 1.2698431015014648, 1.3213856220245361, 1.3729281425476074]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 17.0, 24.0, 33.0, 55.0, 68.0, 93.0, 145.0, 169.0, 279.0, 418.0, 573.0, 826.0, 1218.0, 1801.0, 2902.0, 4808.0, 8514.0, 17300.0, 36659.0, 84070.0, 186851.0, 296843.0, 214983.0, 100487.0, 44412.0, 20242.0, 10010.0, 5434.0, 3208.0, 1971.0, 1259.0, 836.0, 631.0, 413.0, 295.0, 213.0, 151.0, 99.0, 69.0, 41.0, 35.0, 28.0, 19.0, 7.0, 11.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.53125, -0.5138931274414062, -0.4965362548828125, -0.47917938232421875, -0.461822509765625, -0.44446563720703125, -0.4271087646484375, -0.40975189208984375, -0.39239501953125, -0.37503814697265625, -0.3576812744140625, -0.34032440185546875, -0.322967529296875, -0.30561065673828125, -0.2882537841796875, -0.27089691162109375, -0.2535400390625, -0.23618316650390625, -0.2188262939453125, -0.20146942138671875, -0.184112548828125, -0.16675567626953125, -0.1493988037109375, -0.13204193115234375, -0.11468505859375, -0.09732818603515625, -0.0799713134765625, -0.06261444091796875, -0.045257568359375, -0.02790069580078125, -0.0105438232421875, 0.00681304931640625, 0.024169921875, 0.04152679443359375, 0.0588836669921875, 0.07624053955078125, 0.093597412109375, 0.11095428466796875, 0.1283111572265625, 0.14566802978515625, 0.16302490234375, 0.18038177490234375, 0.1977386474609375, 0.21509552001953125, 0.232452392578125, 0.24980926513671875, 0.2671661376953125, 0.28452301025390625, 0.3018798828125, 0.31923675537109375, 0.3365936279296875, 0.35395050048828125, 0.371307373046875, 0.38866424560546875, 0.4060211181640625, 0.42337799072265625, 0.44073486328125, 0.45809173583984375, 0.4754486083984375, 0.49280548095703125, 0.510162353515625, 0.5275192260742188, 0.5448760986328125, 0.5622329711914062, 0.57958984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 8.0, 5.0, 12.0, 10.0, 9.0, 18.0, 15.0, 13.0, 21.0, 22.0, 26.0, 35.0, 27.0, 35.0, 39.0, 42.0, 37.0, 39.0, 45.0, 38.0, 51.0, 42.0, 48.0, 48.0, 37.0, 35.0, 38.0, 34.0, 20.0, 26.0, 23.0, 18.0, 12.0, 16.0, 15.0, 11.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0], "bins": [-1.4951171875, -1.4537506103515625, -1.412384033203125, -1.3710174560546875, -1.32965087890625, -1.2882843017578125, -1.246917724609375, -1.2055511474609375, -1.1641845703125, -1.1228179931640625, -1.081451416015625, -1.0400848388671875, -0.99871826171875, -0.9573516845703125, -0.915985107421875, -0.8746185302734375, -0.833251953125, -0.7918853759765625, -0.750518798828125, -0.7091522216796875, -0.66778564453125, -0.6264190673828125, -0.585052490234375, -0.5436859130859375, -0.5023193359375, -0.4609527587890625, -0.419586181640625, -0.3782196044921875, -0.33685302734375, -0.2954864501953125, -0.254119873046875, -0.2127532958984375, -0.17138671875, -0.1300201416015625, -0.088653564453125, -0.0472869873046875, -0.00592041015625, 0.0354461669921875, 0.076812744140625, 0.1181793212890625, 0.1595458984375, 0.2009124755859375, 0.242279052734375, 0.2836456298828125, 0.32501220703125, 0.3663787841796875, 0.407745361328125, 0.4491119384765625, 0.490478515625, 0.5318450927734375, 0.573211669921875, 0.6145782470703125, 0.65594482421875, 0.6973114013671875, 0.738677978515625, 0.7800445556640625, 0.8214111328125, 0.8627777099609375, 0.904144287109375, 0.9455108642578125, 0.98687744140625, 1.0282440185546875, 1.069610595703125, 1.1109771728515625, 1.15234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 14.0, 26.0, 24.0, 51.0, 76.0, 116.0, 227.0, 380.0, 744.0, 1714.0, 3977.0, 11053.0, 38629.0, 177739.0, 544548.0, 205245.0, 43600.0, 12349.0, 4333.0, 1829.0, 852.0, 413.0, 235.0, 113.0, 72.0, 42.0, 32.0, 29.0, 20.0, 9.0, 10.0, 7.0, 1.0, 8.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.228118896484375, -1.19256591796875, -1.157012939453125, -1.1214599609375, -1.085906982421875, -1.05035400390625, -1.014801025390625, -0.979248046875, -0.943695068359375, -0.90814208984375, -0.872589111328125, -0.8370361328125, -0.801483154296875, -0.76593017578125, -0.730377197265625, -0.69482421875, -0.659271240234375, -0.62371826171875, -0.588165283203125, -0.5526123046875, -0.517059326171875, -0.48150634765625, -0.445953369140625, -0.410400390625, -0.374847412109375, -0.33929443359375, -0.303741455078125, -0.2681884765625, -0.232635498046875, -0.19708251953125, -0.161529541015625, -0.1259765625, -0.090423583984375, -0.05487060546875, -0.019317626953125, 0.0162353515625, 0.051788330078125, 0.08734130859375, 0.122894287109375, 0.158447265625, 0.194000244140625, 0.22955322265625, 0.265106201171875, 0.3006591796875, 0.336212158203125, 0.37176513671875, 0.407318115234375, 0.44287109375, 0.478424072265625, 0.51397705078125, 0.549530029296875, 0.5850830078125, 0.620635986328125, 0.65618896484375, 0.691741943359375, 0.727294921875, 0.762847900390625, 0.79840087890625, 0.833953857421875, 0.8695068359375, 0.905059814453125, 0.94061279296875, 0.976165771484375, 1.01171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 9.0, 8.0, 6.0, 16.0, 11.0, 14.0, 20.0, 18.0, 43.0, 34.0, 44.0, 46.0, 42.0, 48.0, 54.0, 48.0, 59.0, 48.0, 47.0, 60.0, 50.0, 47.0, 37.0, 32.0, 30.0, 27.0, 18.0, 16.0, 18.0, 14.0, 19.0, 9.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -3.014556884765625, -2.91387939453125, -2.813201904296875, -2.7125244140625, -2.611846923828125, -2.51116943359375, -2.410491943359375, -2.309814453125, -2.209136962890625, -2.10845947265625, -2.007781982421875, -1.9071044921875, -1.806427001953125, -1.70574951171875, -1.605072021484375, -1.50439453125, -1.403717041015625, -1.30303955078125, -1.202362060546875, -1.1016845703125, -1.001007080078125, -0.90032958984375, -0.799652099609375, -0.698974609375, -0.598297119140625, -0.49761962890625, -0.396942138671875, -0.2962646484375, -0.195587158203125, -0.09490966796875, 0.005767822265625, 0.1064453125, 0.207122802734375, 0.30780029296875, 0.408477783203125, 0.5091552734375, 0.609832763671875, 0.71051025390625, 0.811187744140625, 0.911865234375, 1.012542724609375, 1.11322021484375, 1.213897705078125, 1.3145751953125, 1.415252685546875, 1.51593017578125, 1.616607666015625, 1.71728515625, 1.817962646484375, 1.91864013671875, 2.019317626953125, 2.1199951171875, 2.220672607421875, 2.32135009765625, 2.422027587890625, 2.522705078125, 2.623382568359375, 2.72406005859375, 2.824737548828125, 2.9254150390625, 3.026092529296875, 3.12677001953125, 3.227447509765625, 3.328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 10.0, 16.0, 12.0, 23.0, 43.0, 55.0, 65.0, 106.0, 133.0, 215.0, 304.0, 485.0, 786.0, 1274.0, 2233.0, 4113.0, 7722.0, 16138.0, 37484.0, 97987.0, 286310.0, 366775.0, 134574.0, 49254.0, 20797.0, 9778.0, 5074.0, 2706.0, 1537.0, 879.0, 536.0, 355.0, 243.0, 167.0, 97.0, 73.0, 52.0, 40.0, 21.0, 24.0, 13.0, 6.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2210693359375, -0.2139720916748047, -0.20687484741210938, -0.19977760314941406, -0.19268035888671875, -0.18558311462402344, -0.17848587036132812, -0.1713886260986328, -0.1642913818359375, -0.1571941375732422, -0.15009689331054688, -0.14299964904785156, -0.13590240478515625, -0.12880516052246094, -0.12170791625976562, -0.11461067199707031, -0.107513427734375, -0.10041618347167969, -0.09331893920898438, -0.08622169494628906, -0.07912445068359375, -0.07202720642089844, -0.06492996215820312, -0.05783271789550781, -0.0507354736328125, -0.04363822937011719, -0.036540985107421875, -0.029443740844726562, -0.02234649658203125, -0.015249252319335938, -0.008152008056640625, -0.0010547637939453125, 0.00604248046875, 0.013139724731445312, 0.020236968994140625, 0.027334213256835938, 0.03443145751953125, 0.04152870178222656, 0.048625946044921875, 0.05572319030761719, 0.0628204345703125, 0.06991767883300781, 0.07701492309570312, 0.08411216735839844, 0.09120941162109375, 0.09830665588378906, 0.10540390014648438, 0.11250114440917969, 0.119598388671875, 0.1266956329345703, 0.13379287719726562, 0.14089012145996094, 0.14798736572265625, 0.15508460998535156, 0.16218185424804688, 0.1692790985107422, 0.1763763427734375, 0.1834735870361328, 0.19057083129882812, 0.19766807556152344, 0.20476531982421875, 0.21186256408691406, 0.21895980834960938, 0.2260570526123047, 0.233154296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 7.0, 19.0, 25.0, 37.0, 56.0, 102.0, 138.0, 164.0, 169.0, 99.0, 46.0, 40.0, 20.0, 20.0, 13.0, 10.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028705596923828125, -0.00027873367071151733, -0.0002704113721847534, -0.0002620890736579895, -0.0002537667751312256, -0.00024544447660446167, -0.00023712217807769775, -0.00022879987955093384, -0.00022047758102416992, -0.000212155282497406, -0.0002038329839706421, -0.00019551068544387817, -0.00018718838691711426, -0.00017886608839035034, -0.00017054378986358643, -0.0001622214913368225, -0.0001538991928100586, -0.00014557689428329468, -0.00013725459575653076, -0.00012893229722976685, -0.00012060999870300293, -0.00011228770017623901, -0.0001039654016494751, -9.564310312271118e-05, -8.732080459594727e-05, -7.899850606918335e-05, -7.067620754241943e-05, -6.235390901565552e-05, -5.40316104888916e-05, -4.5709311962127686e-05, -3.738701343536377e-05, -2.9064714908599854e-05, -2.0742416381835938e-05, -1.2420117855072021e-05, -4.0978193283081055e-06, 4.2244791984558105e-06, 1.2546777725219727e-05, 2.0869076251983643e-05, 2.919137477874756e-05, 3.7513673305511475e-05, 4.583597183227539e-05, 5.415827035903931e-05, 6.248056888580322e-05, 7.080286741256714e-05, 7.912516593933105e-05, 8.744746446609497e-05, 9.576976299285889e-05, 0.0001040920615196228, 0.00011241436004638672, 0.00012073665857315063, 0.00012905895709991455, 0.00013738125562667847, 0.00014570355415344238, 0.0001540258526802063, 0.00016234815120697021, 0.00017067044973373413, 0.00017899274826049805, 0.00018731504678726196, 0.00019563734531402588, 0.0002039596438407898, 0.0002122819423675537, 0.00022060424089431763, 0.00022892653942108154, 0.00023724883794784546, 0.0002455711364746094]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 6.0, 3.0, 8.0, 14.0, 11.0, 12.0, 20.0, 35.0, 38.0, 58.0, 85.0, 171.0, 490.0, 3192.0, 61358.0, 897136.0, 81208.0, 3737.0, 491.0, 157.0, 95.0, 67.0, 43.0, 29.0, 23.0, 14.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7508697509765625, -0.721466064453125, -0.6920623779296875, -0.66265869140625, -0.6332550048828125, -0.603851318359375, -0.5744476318359375, -0.5450439453125, -0.5156402587890625, -0.486236572265625, -0.4568328857421875, -0.42742919921875, -0.3980255126953125, -0.368621826171875, -0.3392181396484375, -0.309814453125, -0.2804107666015625, -0.251007080078125, -0.2216033935546875, -0.19219970703125, -0.1627960205078125, -0.133392333984375, -0.1039886474609375, -0.0745849609375, -0.0451812744140625, -0.015777587890625, 0.0136260986328125, 0.04302978515625, 0.0724334716796875, 0.101837158203125, 0.1312408447265625, 0.16064453125, 0.1900482177734375, 0.219451904296875, 0.2488555908203125, 0.27825927734375, 0.3076629638671875, 0.337066650390625, 0.3664703369140625, 0.3958740234375, 0.4252777099609375, 0.454681396484375, 0.4840850830078125, 0.51348876953125, 0.5428924560546875, 0.572296142578125, 0.6016998291015625, 0.631103515625, 0.6605072021484375, 0.689910888671875, 0.7193145751953125, 0.74871826171875, 0.7781219482421875, 0.807525634765625, 0.8369293212890625, 0.8663330078125, 0.8957366943359375, 0.925140380859375, 0.9545440673828125, 0.98394775390625, 1.0133514404296875, 1.042755126953125, 1.0721588134765625, 1.1015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 12.0, 5.0, 9.0, 14.0, 13.0, 22.0, 34.0, 42.0, 39.0, 53.0, 65.0, 61.0, 74.0, 70.0, 92.0, 69.0, 51.0, 51.0, 47.0, 42.0, 30.0, 19.0, 16.0, 16.0, 17.0, 3.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0841064453125, -0.08094596862792969, -0.07778549194335938, -0.07462501525878906, -0.07146453857421875, -0.06830406188964844, -0.06514358520507812, -0.06198310852050781, -0.0588226318359375, -0.05566215515136719, -0.052501678466796875, -0.04934120178222656, -0.04618072509765625, -0.04302024841308594, -0.039859771728515625, -0.03669929504394531, -0.033538818359375, -0.030378341674804688, -0.027217864990234375, -0.024057388305664062, -0.02089691162109375, -0.017736434936523438, -0.014575958251953125, -0.011415481567382812, -0.0082550048828125, -0.0050945281982421875, -0.001934051513671875, 0.0012264251708984375, 0.00438690185546875, 0.0075473785400390625, 0.010707855224609375, 0.013868331909179688, 0.01702880859375, 0.020189285278320312, 0.023349761962890625, 0.026510238647460938, 0.02967071533203125, 0.03283119201660156, 0.035991668701171875, 0.03915214538574219, 0.0423126220703125, 0.04547309875488281, 0.048633575439453125, 0.05179405212402344, 0.05495452880859375, 0.05811500549316406, 0.061275482177734375, 0.06443595886230469, 0.067596435546875, 0.07075691223144531, 0.07391738891601562, 0.07707786560058594, 0.08023834228515625, 0.08339881896972656, 0.08655929565429688, 0.08971977233886719, 0.0928802490234375, 0.09604072570800781, 0.09920120239257812, 0.10236167907714844, 0.10552215576171875, 0.10868263244628906, 0.11184310913085938, 0.11500358581542969, 0.1181640625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 29.0, 64.0, 119.0, 161.0, 204.0, 175.0, 127.0, 53.0, 30.0, 15.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2012763023376465, -7.052414417266846, -6.903552055358887, -6.754690170288086, -6.605828285217285, -6.456965923309326, -6.308104038238525, -6.159241676330566, -6.010379791259766, -5.861517906188965, -5.712655544281006, -5.563793659210205, -5.414931774139404, -5.266069412231445, -5.1172075271606445, -4.968345642089844, -4.819483757019043, -4.670621871948242, -4.521759510040283, -4.372897624969482, -4.224035739898682, -4.075173377990723, -3.926311492919922, -3.777449369430542, -3.628587245941162, -3.4797251224517822, -3.3308632373809814, -3.1820011138916016, -3.0331389904022217, -2.884276866912842, -2.735414981842041, -2.586552858352661, -2.4376909732818604, -2.2888288497924805, -2.1399669647216797, -1.9911048412322998, -1.84224271774292, -1.6933807134628296, -1.5445187091827393, -1.3956565856933594, -1.246794581413269, -1.0979325771331787, -0.9490704536437988, -0.8002084493637085, -0.6513463854789734, -0.5024843215942383, -0.35362231731414795, -0.20476019382476807, -0.055898189544677734, 0.09296385943889618, 0.2418259084224701, 0.3906879425048828, 0.5395500063896179, 0.688412070274353, 0.8372740745544434, 0.9861361980438232, 1.1349982023239136, 1.283860206604004, 1.4327223300933838, 1.5815843343734741, 1.7304463386535645, 1.8793084621429443, 2.028170585632324, 2.177032470703125, 2.325894594192505]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 6.0, 7.0, 6.0, 10.0, 14.0, 9.0, 14.0, 14.0, 16.0, 14.0, 20.0, 22.0, 30.0, 34.0, 41.0, 34.0, 39.0, 42.0, 31.0, 34.0, 42.0, 54.0, 43.0, 34.0, 42.0, 36.0, 46.0, 33.0, 36.0, 35.0, 31.0, 17.0, 20.0, 16.0, 13.0, 9.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.435074806213379, -1.3958740234375, -1.356673240661621, -1.3174724578857422, -1.2782716751098633, -1.239071011543274, -1.199870228767395, -1.1606694459915161, -1.1214686632156372, -1.0822678804397583, -1.0430670976638794, -1.0038663148880005, -0.9646655917167664, -0.9254648089408875, -0.8862640857696533, -0.8470633029937744, -0.8078625202178955, -0.7686617374420166, -0.7294609546661377, -0.6902602314949036, -0.6510594487190247, -0.6118586659431458, -0.5726579427719116, -0.5334571599960327, -0.4942563772201538, -0.4550555944442749, -0.4158548414707184, -0.37665408849716187, -0.33745330572128296, -0.29825252294540405, -0.25905176997184753, -0.21985101699829102, -0.18065035343170166, -0.14144958555698395, -0.10224881768226624, -0.06304804980754852, -0.02384728193283081, 0.015353485941886902, 0.054554253816604614, 0.09375500679016113, 0.13295578956604004, 0.17215655744075775, 0.21135732531547546, 0.250558078289032, 0.2897588610649109, 0.3289596438407898, 0.3681603968143463, 0.40736114978790283, 0.44656193256378174, 0.48576271533966064, 0.5249634981155396, 0.5641642212867737, 0.6033650040626526, 0.6425657868385315, 0.6817665100097656, 0.7209672927856445, 0.7601680755615234, 0.7993688583374023, 0.8385696411132812, 0.8777703642845154, 0.9169711470603943, 0.9561719298362732, 0.9953726530075073, 1.0345734357833862, 1.0737742185592651]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 13.0, 4.0, 17.0, 24.0, 29.0, 67.0, 101.0, 134.0, 216.0, 340.0, 551.0, 929.0, 1512.0, 2570.0, 4773.0, 9027.0, 17419.0, 34984.0, 69689.0, 131591.0, 209664.0, 229744.0, 157368.0, 86941.0, 44184.0, 21848.0, 11039.0, 5786.0, 3189.0, 1907.0, 1112.0, 653.0, 372.0, 262.0, 164.0, 105.0, 83.0, 41.0, 35.0, 21.0, 10.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6318283081054688, -0.6127777099609375, -0.5937271118164062, -0.574676513671875, -0.5556259155273438, -0.5365753173828125, -0.5175247192382812, -0.49847412109375, -0.47942352294921875, -0.4603729248046875, -0.44132232666015625, -0.422271728515625, -0.40322113037109375, -0.3841705322265625, -0.36511993408203125, -0.3460693359375, -0.32701873779296875, -0.3079681396484375, -0.28891754150390625, -0.269866943359375, -0.25081634521484375, -0.2317657470703125, -0.21271514892578125, -0.19366455078125, -0.17461395263671875, -0.1555633544921875, -0.13651275634765625, -0.117462158203125, -0.09841156005859375, -0.0793609619140625, -0.06031036376953125, -0.041259765625, -0.02220916748046875, -0.0031585693359375, 0.01589202880859375, 0.034942626953125, 0.05399322509765625, 0.0730438232421875, 0.09209442138671875, 0.11114501953125, 0.13019561767578125, 0.1492462158203125, 0.16829681396484375, 0.187347412109375, 0.20639801025390625, 0.2254486083984375, 0.24449920654296875, 0.2635498046875, 0.28260040283203125, 0.3016510009765625, 0.32070159912109375, 0.339752197265625, 0.35880279541015625, 0.3778533935546875, 0.39690399169921875, 0.41595458984375, 0.43500518798828125, 0.4540557861328125, 0.47310638427734375, 0.492156982421875, 0.5112075805664062, 0.5302581787109375, 0.5493087768554688, 0.568359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 10.0, 10.0, 8.0, 18.0, 13.0, 32.0, 28.0, 25.0, 30.0, 30.0, 29.0, 22.0, 41.0, 39.0, 39.0, 47.0, 50.0, 46.0, 46.0, 41.0, 40.0, 33.0, 42.0, 30.0, 30.0, 34.0, 31.0, 14.0, 26.0, 18.0, 16.0, 21.0, 9.0, 9.0, 8.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.375, -10.0528564453125, -9.730712890625, -9.4085693359375, -9.08642578125, -8.7642822265625, -8.442138671875, -8.1199951171875, -7.7978515625, -7.4757080078125, -7.153564453125, -6.8314208984375, -6.50927734375, -6.1871337890625, -5.864990234375, -5.5428466796875, -5.220703125, -4.8985595703125, -4.576416015625, -4.2542724609375, -3.93212890625, -3.6099853515625, -3.287841796875, -2.9656982421875, -2.6435546875, -2.3214111328125, -1.999267578125, -1.6771240234375, -1.35498046875, -1.0328369140625, -0.710693359375, -0.3885498046875, -0.06640625, 0.2557373046875, 0.577880859375, 0.9000244140625, 1.22216796875, 1.5443115234375, 1.866455078125, 2.1885986328125, 2.5107421875, 2.8328857421875, 3.155029296875, 3.4771728515625, 3.79931640625, 4.1214599609375, 4.443603515625, 4.7657470703125, 5.087890625, 5.4100341796875, 5.732177734375, 6.0543212890625, 6.37646484375, 6.6986083984375, 7.020751953125, 7.3428955078125, 7.6650390625, 7.9871826171875, 8.309326171875, 8.6314697265625, 8.95361328125, 9.2757568359375, 9.597900390625, 9.9200439453125, 10.2421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 7.0, 12.0, 17.0, 34.0, 43.0, 65.0, 109.0, 176.0, 360.0, 927.0, 12366.0, 1011665.0, 20745.0, 1008.0, 435.0, 218.0, 122.0, 87.0, 51.0, 31.0, 33.0, 11.0, 8.0, 4.0, 3.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1328125, -5.91015625, -5.6875, -5.46484375, -5.2421875, -5.01953125, -4.796875, -4.57421875, -4.3515625, -4.12890625, -3.90625, -3.68359375, -3.4609375, -3.23828125, -3.015625, -2.79296875, -2.5703125, -2.34765625, -2.125, -1.90234375, -1.6796875, -1.45703125, -1.234375, -1.01171875, -0.7890625, -0.56640625, -0.34375, -0.12109375, 0.1015625, 0.32421875, 0.546875, 0.76953125, 0.9921875, 1.21484375, 1.4375, 1.66015625, 1.8828125, 2.10546875, 2.328125, 2.55078125, 2.7734375, 2.99609375, 3.21875, 3.44140625, 3.6640625, 3.88671875, 4.109375, 4.33203125, 4.5546875, 4.77734375, 5.0, 5.22265625, 5.4453125, 5.66796875, 5.890625, 6.11328125, 6.3359375, 6.55859375, 6.78125, 7.00390625, 7.2265625, 7.44921875, 7.671875, 7.89453125, 8.1171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 12.0, 12.0, 24.0, 28.0, 36.0, 50.0, 70.0, 85.0, 101.0, 87.0, 86.0, 85.0, 76.0, 60.0, 42.0, 36.0, 37.0, 25.0, 19.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.88916015625, -15.2939453125, -14.69873046875, -14.103515625, -13.50830078125, -12.9130859375, -12.31787109375, -11.72265625, -11.12744140625, -10.5322265625, -9.93701171875, -9.341796875, -8.74658203125, -8.1513671875, -7.55615234375, -6.9609375, -6.36572265625, -5.7705078125, -5.17529296875, -4.580078125, -3.98486328125, -3.3896484375, -2.79443359375, -2.19921875, -1.60400390625, -1.0087890625, -0.41357421875, 0.181640625, 0.77685546875, 1.3720703125, 1.96728515625, 2.5625, 3.15771484375, 3.7529296875, 4.34814453125, 4.943359375, 5.53857421875, 6.1337890625, 6.72900390625, 7.32421875, 7.91943359375, 8.5146484375, 9.10986328125, 9.705078125, 10.30029296875, 10.8955078125, 11.49072265625, 12.0859375, 12.68115234375, 13.2763671875, 13.87158203125, 14.466796875, 15.06201171875, 15.6572265625, 16.25244140625, 16.84765625, 17.44287109375, 18.0380859375, 18.63330078125, 19.228515625, 19.82373046875, 20.4189453125, 21.01416015625, 21.609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 9.0, 15.0, 22.0, 22.0, 29.0, 42.0, 76.0, 126.0, 241.0, 557.0, 1257.0, 3302.0, 15063.0, 762333.0, 251176.0, 9729.0, 2561.0, 983.0, 447.0, 222.0, 107.0, 60.0, 46.0, 34.0, 18.0, 20.0, 10.0, 6.0, 11.0, 6.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1670303344726562, -1.1377716064453125, -1.1085128784179688, -1.079254150390625, -1.0499954223632812, -1.0207366943359375, -0.9914779663085938, -0.96221923828125, -0.9329605102539062, -0.9037017822265625, -0.8744430541992188, -0.845184326171875, -0.8159255981445312, -0.7866668701171875, -0.7574081420898438, -0.7281494140625, -0.6988906860351562, -0.6696319580078125, -0.6403732299804688, -0.611114501953125, -0.5818557739257812, -0.5525970458984375, -0.5233383178710938, -0.49407958984375, -0.46482086181640625, -0.4355621337890625, -0.40630340576171875, -0.377044677734375, -0.34778594970703125, -0.3185272216796875, -0.28926849365234375, -0.260009765625, -0.23075103759765625, -0.2014923095703125, -0.17223358154296875, -0.142974853515625, -0.11371612548828125, -0.0844573974609375, -0.05519866943359375, -0.02593994140625, 0.00331878662109375, 0.0325775146484375, 0.06183624267578125, 0.091094970703125, 0.12035369873046875, 0.1496124267578125, 0.17887115478515625, 0.2081298828125, 0.23738861083984375, 0.2666473388671875, 0.29590606689453125, 0.325164794921875, 0.35442352294921875, 0.3836822509765625, 0.41294097900390625, 0.44219970703125, 0.47145843505859375, 0.5007171630859375, 0.5299758911132812, 0.559234619140625, 0.5884933471679688, 0.6177520751953125, 0.6470108032226562, 0.67626953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 8.0, 7.0, 19.0, 26.0, 48.0, 118.0, 241.0, 240.0, 117.0, 73.0, 30.0, 31.0, 9.0, 9.0, 10.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001404285430908203, -0.00013654213398694992, -0.00013265572488307953, -0.00012876931577920914, -0.00012488290667533875, -0.00012099649757146835, -0.00011711008846759796, -0.00011322367936372757, -0.00010933727025985718, -0.00010545086115598679, -0.0001015644520521164, -9.7678042948246e-05, -9.379163384437561e-05, -8.990522474050522e-05, -8.601881563663483e-05, -8.213240653276443e-05, -7.824599742889404e-05, -7.435958832502365e-05, -7.047317922115326e-05, -6.658677011728287e-05, -6.270036101341248e-05, -5.8813951909542084e-05, -5.492754280567169e-05, -5.10411337018013e-05, -4.715472459793091e-05, -4.3268315494060516e-05, -3.9381906390190125e-05, -3.549549728631973e-05, -3.160908818244934e-05, -2.772267907857895e-05, -2.3836269974708557e-05, -1.9949860870838165e-05, -1.6063451766967773e-05, -1.2177042663097382e-05, -8.29063355922699e-06, -4.404224455356598e-06, -5.178153514862061e-07, 3.368593752384186e-06, 7.255002856254578e-06, 1.114141196012497e-05, 1.5027821063995361e-05, 1.8914230167865753e-05, 2.2800639271736145e-05, 2.6687048375606537e-05, 3.057345747947693e-05, 3.445986658334732e-05, 3.834627568721771e-05, 4.2232684791088104e-05, 4.6119093894958496e-05, 5.000550299882889e-05, 5.389191210269928e-05, 5.777832120656967e-05, 6.166473031044006e-05, 6.555113941431046e-05, 6.943754851818085e-05, 7.332395762205124e-05, 7.721036672592163e-05, 8.109677582979202e-05, 8.498318493366241e-05, 8.88695940375328e-05, 9.27560031414032e-05, 9.664241224527359e-05, 0.00010052882134914398, 0.00010441523045301437, 0.00010830163955688477]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 21.0, 23.0, 46.0, 67.0, 143.0, 270.0, 691.0, 1985.0, 8845.0, 68936.0, 803171.0, 145594.0, 14129.0, 2928.0, 929.0, 360.0, 158.0, 90.0, 50.0, 32.0, 21.0, 16.0, 12.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64892578125, -0.6321296691894531, -0.6153335571289062, -0.5985374450683594, -0.5817413330078125, -0.5649452209472656, -0.5481491088867188, -0.5313529968261719, -0.514556884765625, -0.4977607727050781, -0.48096466064453125, -0.4641685485839844, -0.4473724365234375, -0.4305763244628906, -0.41378021240234375, -0.3969841003417969, -0.38018798828125, -0.3633918762207031, -0.34659576416015625, -0.3297996520996094, -0.3130035400390625, -0.2962074279785156, -0.27941131591796875, -0.2626152038574219, -0.245819091796875, -0.22902297973632812, -0.21222686767578125, -0.19543075561523438, -0.1786346435546875, -0.16183853149414062, -0.14504241943359375, -0.12824630737304688, -0.1114501953125, -0.09465408325195312, -0.07785797119140625, -0.061061859130859375, -0.0442657470703125, -0.027469635009765625, -0.01067352294921875, 0.006122589111328125, 0.022918701171875, 0.039714813232421875, 0.05651092529296875, 0.07330703735351562, 0.0901031494140625, 0.10689926147460938, 0.12369537353515625, 0.14049148559570312, 0.15728759765625, 0.17408370971679688, 0.19087982177734375, 0.20767593383789062, 0.2244720458984375, 0.24126815795898438, 0.25806427001953125, 0.2748603820800781, 0.291656494140625, 0.3084526062011719, 0.32524871826171875, 0.3420448303222656, 0.3588409423828125, 0.3756370544433594, 0.39243316650390625, 0.4092292785644531, 0.426025390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 5.0, 20.0, 31.0, 26.0, 28.0, 47.0, 56.0, 96.0, 133.0, 142.0, 118.0, 65.0, 50.0, 49.0, 36.0, 15.0, 18.0, 8.0, 11.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.160919189453125, -0.15606689453125, -0.151214599609375, -0.1463623046875, -0.141510009765625, -0.13665771484375, -0.131805419921875, -0.126953125, -0.122100830078125, -0.11724853515625, -0.112396240234375, -0.1075439453125, -0.102691650390625, -0.09783935546875, -0.092987060546875, -0.088134765625, -0.083282470703125, -0.07843017578125, -0.073577880859375, -0.0687255859375, -0.063873291015625, -0.05902099609375, -0.054168701171875, -0.04931640625, -0.044464111328125, -0.03961181640625, -0.034759521484375, -0.0299072265625, -0.025054931640625, -0.02020263671875, -0.015350341796875, -0.010498046875, -0.005645751953125, -0.00079345703125, 0.004058837890625, 0.0089111328125, 0.013763427734375, 0.01861572265625, 0.023468017578125, 0.0283203125, 0.033172607421875, 0.03802490234375, 0.042877197265625, 0.0477294921875, 0.052581787109375, 0.05743408203125, 0.062286376953125, 0.067138671875, 0.071990966796875, 0.07684326171875, 0.081695556640625, 0.0865478515625, 0.091400146484375, 0.09625244140625, 0.101104736328125, 0.10595703125, 0.110809326171875, 0.11566162109375, 0.120513916015625, 0.1253662109375, 0.130218505859375, 0.13507080078125, 0.139923095703125, 0.144775390625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 20.0, 44.0, 102.0, 139.0, 193.0, 183.0, 148.0, 90.0, 55.0, 17.0, 7.0, 3.0, 2.0, 1.0], "bins": [-13.261404991149902, -13.019675254821777, -12.777945518493652, -12.536214828491211, -12.294485092163086, -12.052755355834961, -11.811025619506836, -11.569295883178711, -11.327566146850586, -11.085836410522461, -10.844106674194336, -10.602376937866211, -10.36064624786377, -10.118916511535645, -9.87718677520752, -9.635457038879395, -9.393726348876953, -9.151996612548828, -8.910266876220703, -8.668537139892578, -8.426806449890137, -8.185076713562012, -7.943346977233887, -7.701617240905762, -7.459887504577637, -7.218157768249512, -6.9764275550842285, -6.7346978187561035, -6.4929680824279785, -6.251237869262695, -6.00950813293457, -5.767778396606445, -5.52604866027832, -5.284318923950195, -5.042588710784912, -4.800858974456787, -4.559129238128662, -4.317399024963379, -4.075669288635254, -3.833939552307129, -3.592209577560425, -3.3504796028137207, -3.1087498664855957, -2.8670198917388916, -2.6252899169921875, -2.3835601806640625, -2.1418302059173584, -1.9001003503799438, -1.6583704948425293, -1.4166406393051147, -1.1749107837677002, -0.9331808090209961, -0.6914509534835815, -0.449721097946167, -0.2079911231994629, 0.03373873233795166, 0.2754685878753662, 0.5171984434127808, 0.7589283585548401, 1.0006582736968994, 1.242388129234314, 1.4841179847717285, 1.7258479595184326, 1.9675778150558472, 2.2093076705932617]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 8.0, 14.0, 20.0, 10.0, 19.0, 16.0, 17.0, 16.0, 27.0, 26.0, 20.0, 28.0, 37.0, 37.0, 43.0, 44.0, 38.0, 42.0, 40.0, 35.0, 35.0, 27.0, 26.0, 27.0, 37.0, 33.0, 29.0, 32.0, 21.0, 28.0, 31.0, 19.0, 20.0, 10.0, 16.0, 13.0, 8.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.903173446655273, -12.475828170776367, -12.048481941223145, -11.621136665344238, -11.193791389465332, -10.76644515991211, -10.339099884033203, -9.911754608154297, -9.48440933227539, -9.057064056396484, -8.629717826843262, -8.202372550964355, -7.775027275085449, -7.347681522369385, -6.92033576965332, -6.492990493774414, -6.065644264221191, -5.638298511505127, -5.210953235626221, -4.783607482910156, -4.35626220703125, -3.9289164543151855, -3.501570701599121, -3.0742251873016357, -2.6468796730041504, -2.219534158706665, -1.7921885251998901, -1.3648428916931152, -0.9374973773956299, -0.5101518630981445, -0.08280611038208008, 0.3445394039154053, 0.771885871887207, 1.1992313861846924, 1.6265770196914673, 2.053922653198242, 2.4812681674957275, 2.908613681793213, 3.3359594345092773, 3.7633049488067627, 4.190650463104248, 4.6179962158203125, 5.045341491699219, 5.472687244415283, 5.900032997131348, 6.327378273010254, 6.754724025726318, 7.182069778442383, 7.609415054321289, 8.036760330200195, 8.464106559753418, 8.891451835632324, 9.31879711151123, 9.746143341064453, 10.17348861694336, 10.600833892822266, 11.028179168701172, 11.455524444580078, 11.8828706741333, 12.310215950012207, 12.737561225891113, 13.164907455444336, 13.592252731323242, 14.019598007202148, 14.446944236755371]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 6.0, 6.0, 8.0, 9.0, 14.0, 24.0, 25.0, 22.0, 28.0, 29.0, 40.0, 51.0, 64.0, 157.0, 355.0, 936.0, 3288.0, 15971.0, 172959.0, 2288189.0, 1588584.0, 106257.0, 12879.0, 2880.0, 807.0, 291.0, 125.0, 61.0, 45.0, 29.0, 27.0, 14.0, 22.0, 12.0, 15.0, 8.0, 5.0, 8.0, 8.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.14453125, -3.0318603515625, -2.919189453125, -2.8065185546875, -2.69384765625, -2.5811767578125, -2.468505859375, -2.3558349609375, -2.2431640625, -2.1304931640625, -2.017822265625, -1.9051513671875, -1.79248046875, -1.6798095703125, -1.567138671875, -1.4544677734375, -1.341796875, -1.2291259765625, -1.116455078125, -1.0037841796875, -0.89111328125, -0.7784423828125, -0.665771484375, -0.5531005859375, -0.4404296875, -0.3277587890625, -0.215087890625, -0.1024169921875, 0.01025390625, 0.1229248046875, 0.235595703125, 0.3482666015625, 0.4609375, 0.5736083984375, 0.686279296875, 0.7989501953125, 0.91162109375, 1.0242919921875, 1.136962890625, 1.2496337890625, 1.3623046875, 1.4749755859375, 1.587646484375, 1.7003173828125, 1.81298828125, 1.9256591796875, 2.038330078125, 2.1510009765625, 2.263671875, 2.3763427734375, 2.489013671875, 2.6016845703125, 2.71435546875, 2.8270263671875, 2.939697265625, 3.0523681640625, 3.1650390625, 3.2777099609375, 3.390380859375, 3.5030517578125, 3.61572265625, 3.7283935546875, 3.841064453125, 3.9537353515625, 4.06640625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 3.0, 9.0, 8.0, 7.0, 10.0, 13.0, 13.0, 21.0, 28.0, 26.0, 38.0, 35.0, 38.0, 41.0, 48.0, 49.0, 42.0, 44.0, 31.0, 33.0, 50.0, 49.0, 39.0, 51.0, 37.0, 36.0, 26.0, 30.0, 34.0, 21.0, 11.0, 13.0, 14.0, 15.0, 8.0, 3.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.984375, -1.9312286376953125, -1.878082275390625, -1.8249359130859375, -1.77178955078125, -1.7186431884765625, -1.665496826171875, -1.6123504638671875, -1.5592041015625, -1.5060577392578125, -1.452911376953125, -1.3997650146484375, -1.34661865234375, -1.2934722900390625, -1.240325927734375, -1.1871795654296875, -1.134033203125, -1.0808868408203125, -1.027740478515625, -0.9745941162109375, -0.92144775390625, -0.8683013916015625, -0.815155029296875, -0.7620086669921875, -0.7088623046875, -0.6557159423828125, -0.602569580078125, -0.5494232177734375, -0.49627685546875, -0.4431304931640625, -0.389984130859375, -0.3368377685546875, -0.28369140625, -0.2305450439453125, -0.177398681640625, -0.1242523193359375, -0.07110595703125, -0.0179595947265625, 0.035186767578125, 0.0883331298828125, 0.1414794921875, 0.1946258544921875, 0.247772216796875, 0.3009185791015625, 0.35406494140625, 0.4072113037109375, 0.460357666015625, 0.5135040283203125, 0.566650390625, 0.6197967529296875, 0.672943115234375, 0.7260894775390625, 0.77923583984375, 0.8323822021484375, 0.885528564453125, 0.9386749267578125, 0.9918212890625, 1.0449676513671875, 1.098114013671875, 1.1512603759765625, 1.20440673828125, 1.2575531005859375, 1.310699462890625, 1.3638458251953125, 1.4169921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 13.0, 20.0, 60.0, 660888.0, 3533187.0, 61.0, 30.0, 13.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-237.5, -232.552734375, -227.60546875, -222.658203125, -217.7109375, -212.763671875, -207.81640625, -202.869140625, -197.921875, -192.974609375, -188.02734375, -183.080078125, -178.1328125, -173.185546875, -168.23828125, -163.291015625, -158.34375, -153.396484375, -148.44921875, -143.501953125, -138.5546875, -133.607421875, -128.66015625, -123.712890625, -118.765625, -113.818359375, -108.87109375, -103.923828125, -98.9765625, -94.029296875, -89.08203125, -84.134765625, -79.1875, -74.240234375, -69.29296875, -64.345703125, -59.3984375, -54.451171875, -49.50390625, -44.556640625, -39.609375, -34.662109375, -29.71484375, -24.767578125, -19.8203125, -14.873046875, -9.92578125, -4.978515625, -0.03125, 4.916015625, 9.86328125, 14.810546875, 19.7578125, 24.705078125, 29.65234375, 34.599609375, 39.546875, 44.494140625, 49.44140625, 54.388671875, 59.3359375, 64.283203125, 69.23046875, 74.177734375, 79.125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 8.0, 9.0, 13.0, 20.0, 37.0, 56.0, 66.0, 141.0, 204.0, 329.0, 565.0, 797.0, 690.0, 432.0, 265.0, 152.0, 115.0, 57.0, 38.0, 19.0, 17.0, 16.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3095703125, -1.2782135009765625, -1.246856689453125, -1.2154998779296875, -1.18414306640625, -1.1527862548828125, -1.121429443359375, -1.0900726318359375, -1.0587158203125, -1.0273590087890625, -0.996002197265625, -0.9646453857421875, -0.93328857421875, -0.9019317626953125, -0.870574951171875, -0.8392181396484375, -0.807861328125, -0.7765045166015625, -0.745147705078125, -0.7137908935546875, -0.68243408203125, -0.6510772705078125, -0.619720458984375, -0.5883636474609375, -0.5570068359375, -0.5256500244140625, -0.494293212890625, -0.4629364013671875, -0.43157958984375, -0.4002227783203125, -0.368865966796875, -0.3375091552734375, -0.30615234375, -0.2747955322265625, -0.243438720703125, -0.2120819091796875, -0.18072509765625, -0.1493682861328125, -0.118011474609375, -0.0866546630859375, -0.0552978515625, -0.0239410400390625, 0.007415771484375, 0.0387725830078125, 0.07012939453125, 0.1014862060546875, 0.132843017578125, 0.1641998291015625, 0.195556640625, 0.2269134521484375, 0.258270263671875, 0.2896270751953125, 0.32098388671875, 0.3523406982421875, 0.383697509765625, 0.4150543212890625, 0.4464111328125, 0.4777679443359375, 0.509124755859375, 0.5404815673828125, 0.57183837890625, 0.6031951904296875, 0.634552001953125, 0.6659088134765625, 0.697265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 8.0, 19.0, 16.0, 21.0, 24.0, 49.0, 38.0, 50.0, 65.0, 78.0, 94.0, 74.0, 78.0, 63.0, 72.0, 44.0, 53.0, 38.0, 29.0, 19.0, 19.0, 16.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8551807403564453, -2.7785332202911377, -2.70188570022583, -2.6252381801605225, -2.548590660095215, -2.4719431400299072, -2.3952956199645996, -2.318648099899292, -2.2420005798339844, -2.1653530597686768, -2.088705539703369, -2.0120580196380615, -1.935410499572754, -1.8587629795074463, -1.7821154594421387, -1.705467939376831, -1.6288204193115234, -1.5521728992462158, -1.4755253791809082, -1.3988778591156006, -1.322230339050293, -1.2455828189849854, -1.1689352989196777, -1.0922877788543701, -1.0156402587890625, -0.9389927387237549, -0.8623452186584473, -0.7856976985931396, -0.709050178527832, -0.6324026584625244, -0.5557551383972168, -0.4791076183319092, -0.40246009826660156, -0.32581257820129395, -0.24916505813598633, -0.1725175380706787, -0.0958700180053711, -0.019222497940063477, 0.05742502212524414, 0.13407254219055176, 0.21072006225585938, 0.287367582321167, 0.3640151023864746, 0.4406626224517822, 0.5173101425170898, 0.5939576625823975, 0.6706051826477051, 0.7472527027130127, 0.8239002227783203, 0.9005477428436279, 0.9771952629089355, 1.0538427829742432, 1.1304903030395508, 1.2071378231048584, 1.283785343170166, 1.3604328632354736, 1.4370803833007812, 1.5137279033660889, 1.5903754234313965, 1.667022943496704, 1.7436704635620117, 1.8203179836273193, 1.896965503692627, 1.9736130237579346, 2.050260543823242]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 6.0, 9.0, 14.0, 11.0, 15.0, 11.0, 15.0, 24.0, 18.0, 16.0, 27.0, 34.0, 36.0, 34.0, 40.0, 38.0, 35.0, 36.0, 42.0, 45.0, 52.0, 44.0, 32.0, 34.0, 37.0, 43.0, 30.0, 32.0, 24.0, 25.0, 15.0, 10.0, 15.0, 14.0, 16.0, 13.0, 8.0, 11.0, 11.0, 6.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7197993993759155, -1.669728398323059, -1.619657278060913, -1.5695862770080566, -1.5195152759552002, -1.4694442749023438, -1.4193731546401978, -1.3693021535873413, -1.3192310333251953, -1.2691600322723389, -1.2190889120101929, -1.1690179109573364, -1.11894690990448, -1.068875789642334, -1.0188047885894775, -0.9687337875366211, -0.9186627864837646, -0.8685917258262634, -0.818520724773407, -0.7684496641159058, -0.7183786630630493, -0.6683076024055481, -0.6182365417480469, -0.5681655406951904, -0.5180944800376892, -0.4680234491825104, -0.41795241832733154, -0.3678813576698303, -0.3178103268146515, -0.26773929595947266, -0.21766823530197144, -0.1675972044467926, -0.11752617359161377, -0.06745513528585434, -0.01738409698009491, 0.03268694877624512, 0.08275797963142395, 0.13282901048660278, 0.182900071144104, 0.23297110199928284, 0.28304213285446167, 0.3331131637096405, 0.38318419456481934, 0.43325525522232056, 0.4833262860774994, 0.5333973169326782, 0.5834683775901794, 0.6335394382476807, 0.6836104393005371, 0.7336814999580383, 0.7837525010108948, 0.833823561668396, 0.8838945627212524, 0.9339656233787537, 0.9840366840362549, 1.0341076850891113, 1.0841786861419678, 1.1342496871948242, 1.1843208074569702, 1.2343918085098267, 1.284462809562683, 1.334533929824829, 1.3846049308776855, 1.434675931930542, 1.484747052192688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 8.0, 13.0, 15.0, 23.0, 32.0, 49.0, 82.0, 95.0, 154.0, 225.0, 330.0, 535.0, 760.0, 1142.0, 1711.0, 2615.0, 4113.0, 7025.0, 13258.0, 29500.0, 71177.0, 173581.0, 304235.0, 241674.0, 109576.0, 43866.0, 18791.0, 9191.0, 5298.0, 3191.0, 2098.0, 1335.0, 878.0, 647.0, 473.0, 269.0, 190.0, 148.0, 77.0, 50.0, 34.0, 31.0, 20.0, 12.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.623046875, -0.6056098937988281, -0.5881729125976562, -0.5707359313964844, -0.5532989501953125, -0.5358619689941406, -0.5184249877929688, -0.5009880065917969, -0.483551025390625, -0.4661140441894531, -0.44867706298828125, -0.4312400817871094, -0.4138031005859375, -0.3963661193847656, -0.37892913818359375, -0.3614921569824219, -0.34405517578125, -0.3266181945800781, -0.30918121337890625, -0.2917442321777344, -0.2743072509765625, -0.2568702697753906, -0.23943328857421875, -0.22199630737304688, -0.204559326171875, -0.18712234497070312, -0.16968536376953125, -0.15224838256835938, -0.1348114013671875, -0.11737442016601562, -0.09993743896484375, -0.08250045776367188, -0.0650634765625, -0.047626495361328125, -0.03018951416015625, -0.012752532958984375, 0.0046844482421875, 0.022121429443359375, 0.03955841064453125, 0.056995391845703125, 0.074432373046875, 0.09186935424804688, 0.10930633544921875, 0.12674331665039062, 0.1441802978515625, 0.16161727905273438, 0.17905426025390625, 0.19649124145507812, 0.21392822265625, 0.23136520385742188, 0.24880218505859375, 0.2662391662597656, 0.2836761474609375, 0.3011131286621094, 0.31855010986328125, 0.3359870910644531, 0.353424072265625, 0.3708610534667969, 0.38829803466796875, 0.4057350158691406, 0.4231719970703125, 0.4406089782714844, 0.45804595947265625, 0.4754829406738281, 0.492919921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 9.0, 5.0, 8.0, 13.0, 18.0, 21.0, 17.0, 22.0, 19.0, 34.0, 33.0, 36.0, 30.0, 46.0, 43.0, 51.0, 52.0, 45.0, 39.0, 35.0, 40.0, 45.0, 30.0, 35.0, 35.0, 39.0, 26.0, 29.0, 25.0, 13.0, 20.0, 22.0, 10.0, 12.0, 10.0, 6.0, 6.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.240234375, -1.2048492431640625, -1.169464111328125, -1.1340789794921875, -1.09869384765625, -1.0633087158203125, -1.027923583984375, -0.9925384521484375, -0.9571533203125, -0.9217681884765625, -0.886383056640625, -0.8509979248046875, -0.81561279296875, -0.7802276611328125, -0.744842529296875, -0.7094573974609375, -0.674072265625, -0.6386871337890625, -0.603302001953125, -0.5679168701171875, -0.53253173828125, -0.4971466064453125, -0.461761474609375, -0.4263763427734375, -0.3909912109375, -0.3556060791015625, -0.320220947265625, -0.2848358154296875, -0.24945068359375, -0.2140655517578125, -0.178680419921875, -0.1432952880859375, -0.10791015625, -0.0725250244140625, -0.037139892578125, -0.0017547607421875, 0.03363037109375, 0.0690155029296875, 0.104400634765625, 0.1397857666015625, 0.1751708984375, 0.2105560302734375, 0.245941162109375, 0.2813262939453125, 0.31671142578125, 0.3520965576171875, 0.387481689453125, 0.4228668212890625, 0.458251953125, 0.4936370849609375, 0.529022216796875, 0.5644073486328125, 0.59979248046875, 0.6351776123046875, 0.670562744140625, 0.7059478759765625, 0.7413330078125, 0.7767181396484375, 0.812103271484375, 0.8474884033203125, 0.88287353515625, 0.9182586669921875, 0.953643798828125, 0.9890289306640625, 1.0244140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 4.0, 16.0, 15.0, 23.0, 31.0, 38.0, 63.0, 114.0, 171.0, 324.0, 712.0, 1465.0, 3431.0, 9614.0, 33507.0, 144321.0, 473765.0, 287647.0, 66846.0, 16903.0, 5376.0, 2194.0, 899.0, 433.0, 243.0, 142.0, 75.0, 50.0, 32.0, 22.0, 26.0, 13.0, 8.0, 5.0, 2.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0869140625, -1.0565032958984375, -1.026092529296875, -0.9956817626953125, -0.96527099609375, -0.9348602294921875, -0.904449462890625, -0.8740386962890625, -0.8436279296875, -0.8132171630859375, -0.782806396484375, -0.7523956298828125, -0.72198486328125, -0.6915740966796875, -0.661163330078125, -0.6307525634765625, -0.600341796875, -0.5699310302734375, -0.539520263671875, -0.5091094970703125, -0.47869873046875, -0.4482879638671875, -0.417877197265625, -0.3874664306640625, -0.3570556640625, -0.3266448974609375, -0.296234130859375, -0.2658233642578125, -0.23541259765625, -0.2050018310546875, -0.174591064453125, -0.1441802978515625, -0.11376953125, -0.0833587646484375, -0.052947998046875, -0.0225372314453125, 0.00787353515625, 0.0382843017578125, 0.068695068359375, 0.0991058349609375, 0.1295166015625, 0.1599273681640625, 0.190338134765625, 0.2207489013671875, 0.25115966796875, 0.2815704345703125, 0.311981201171875, 0.3423919677734375, 0.372802734375, 0.4032135009765625, 0.433624267578125, 0.4640350341796875, 0.49444580078125, 0.5248565673828125, 0.555267333984375, 0.5856781005859375, 0.6160888671875, 0.6464996337890625, 0.676910400390625, 0.7073211669921875, 0.73773193359375, 0.7681427001953125, 0.798553466796875, 0.8289642333984375, 0.859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 7.0, 4.0, 10.0, 12.0, 11.0, 10.0, 13.0, 23.0, 30.0, 28.0, 31.0, 35.0, 22.0, 37.0, 41.0, 43.0, 37.0, 46.0, 47.0, 45.0, 40.0, 49.0, 43.0, 39.0, 39.0, 34.0, 35.0, 35.0, 19.0, 19.0, 17.0, 22.0, 6.0, 12.0, 9.0, 8.0, 9.0, 5.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.760528564453125, -1.69683837890625, -1.633148193359375, -1.5694580078125, -1.505767822265625, -1.44207763671875, -1.378387451171875, -1.314697265625, -1.251007080078125, -1.18731689453125, -1.123626708984375, -1.0599365234375, -0.996246337890625, -0.93255615234375, -0.868865966796875, -0.80517578125, -0.741485595703125, -0.67779541015625, -0.614105224609375, -0.5504150390625, -0.486724853515625, -0.42303466796875, -0.359344482421875, -0.295654296875, -0.231964111328125, -0.16827392578125, -0.104583740234375, -0.0408935546875, 0.022796630859375, 0.08648681640625, 0.150177001953125, 0.2138671875, 0.277557373046875, 0.34124755859375, 0.404937744140625, 0.4686279296875, 0.532318115234375, 0.59600830078125, 0.659698486328125, 0.723388671875, 0.787078857421875, 0.85076904296875, 0.914459228515625, 0.9781494140625, 1.041839599609375, 1.10552978515625, 1.169219970703125, 1.23291015625, 1.296600341796875, 1.36029052734375, 1.423980712890625, 1.4876708984375, 1.551361083984375, 1.61505126953125, 1.678741455078125, 1.742431640625, 1.806121826171875, 1.86981201171875, 1.933502197265625, 1.9971923828125, 2.060882568359375, 2.12457275390625, 2.188262939453125, 2.251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 15.0, 17.0, 30.0, 24.0, 43.0, 94.0, 122.0, 222.0, 355.0, 664.0, 1293.0, 2649.0, 6118.0, 15739.0, 47474.0, 167037.0, 419239.0, 269162.0, 78001.0, 24215.0, 8707.0, 3655.0, 1639.0, 857.0, 445.0, 283.0, 157.0, 89.0, 64.0, 45.0, 31.0, 20.0, 11.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.216796875, -0.2110462188720703, -0.20529556274414062, -0.19954490661621094, -0.19379425048828125, -0.18804359436035156, -0.18229293823242188, -0.1765422821044922, -0.1707916259765625, -0.1650409698486328, -0.15929031372070312, -0.15353965759277344, -0.14778900146484375, -0.14203834533691406, -0.13628768920898438, -0.1305370330810547, -0.124786376953125, -0.11903572082519531, -0.11328506469726562, -0.10753440856933594, -0.10178375244140625, -0.09603309631347656, -0.09028244018554688, -0.08453178405761719, -0.0787811279296875, -0.07303047180175781, -0.06727981567382812, -0.06152915954589844, -0.05577850341796875, -0.05002784729003906, -0.044277191162109375, -0.03852653503417969, -0.03277587890625, -0.027025222778320312, -0.021274566650390625, -0.015523910522460938, -0.00977325439453125, -0.0040225982666015625, 0.001728057861328125, 0.0074787139892578125, 0.0132293701171875, 0.018980026245117188, 0.024730682373046875, 0.030481338500976562, 0.03623199462890625, 0.04198265075683594, 0.047733306884765625, 0.05348396301269531, 0.059234619140625, 0.06498527526855469, 0.07073593139648438, 0.07648658752441406, 0.08223724365234375, 0.08798789978027344, 0.09373855590820312, 0.09948921203613281, 0.1052398681640625, 0.11099052429199219, 0.11674118041992188, 0.12249183654785156, 0.12824249267578125, 0.13399314880371094, 0.13974380493164062, 0.1454944610595703, 0.1512451171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 0.0, 5.0, 3.0, 10.0, 11.0, 14.0, 19.0, 24.0, 33.0, 40.0, 48.0, 67.0, 67.0, 89.0, 110.0, 91.0, 81.0, 71.0, 57.0, 39.0, 34.0, 26.0, 19.0, 7.0, 8.0, 9.0, 12.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.927417755126953e-05, -7.603317499160767e-05, -7.27921724319458e-05, -6.955116987228394e-05, -6.631016731262207e-05, -6.30691647529602e-05, -5.982816219329834e-05, -5.6587159633636475e-05, -5.334615707397461e-05, -5.0105154514312744e-05, -4.686415195465088e-05, -4.3623149394989014e-05, -4.038214683532715e-05, -3.714114427566528e-05, -3.390014171600342e-05, -3.065913915634155e-05, -2.7418136596679688e-05, -2.4177134037017822e-05, -2.0936131477355957e-05, -1.7695128917694092e-05, -1.4454126358032227e-05, -1.1213123798370361e-05, -7.972121238708496e-06, -4.731118679046631e-06, -1.4901161193847656e-06, 1.7508864402770996e-06, 4.991888999938965e-06, 8.23289155960083e-06, 1.1473894119262695e-05, 1.471489667892456e-05, 1.7955899238586426e-05, 2.119690179824829e-05, 2.4437904357910156e-05, 2.767890691757202e-05, 3.091990947723389e-05, 3.416091203689575e-05, 3.740191459655762e-05, 4.064291715621948e-05, 4.388391971588135e-05, 4.712492227554321e-05, 5.036592483520508e-05, 5.360692739486694e-05, 5.684792995452881e-05, 6.0088932514190674e-05, 6.332993507385254e-05, 6.65709376335144e-05, 6.981194019317627e-05, 7.305294275283813e-05, 7.62939453125e-05, 7.953494787216187e-05, 8.277595043182373e-05, 8.60169529914856e-05, 8.925795555114746e-05, 9.249895811080933e-05, 9.573996067047119e-05, 9.898096323013306e-05, 0.00010222196578979492, 0.00010546296834945679, 0.00010870397090911865, 0.00011194497346878052, 0.00011518597602844238, 0.00011842697858810425, 0.00012166798114776611, 0.00012490898370742798, 0.00012814998626708984]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 9.0, 15.0, 20.0, 35.0, 50.0, 62.0, 95.0, 143.0, 363.0, 4754.0, 544293.0, 493257.0, 4619.0, 384.0, 130.0, 78.0, 62.0, 38.0, 40.0, 14.0, 17.0, 7.0, 9.0, 9.0, 5.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6923828125, -0.665740966796875, -0.63909912109375, -0.612457275390625, -0.5858154296875, -0.559173583984375, -0.53253173828125, -0.505889892578125, -0.479248046875, -0.452606201171875, -0.42596435546875, -0.399322509765625, -0.3726806640625, -0.346038818359375, -0.31939697265625, -0.292755126953125, -0.26611328125, -0.239471435546875, -0.21282958984375, -0.186187744140625, -0.1595458984375, -0.132904052734375, -0.10626220703125, -0.079620361328125, -0.052978515625, -0.026336669921875, 0.00030517578125, 0.026947021484375, 0.0535888671875, 0.080230712890625, 0.10687255859375, 0.133514404296875, 0.16015625, 0.186798095703125, 0.21343994140625, 0.240081787109375, 0.2667236328125, 0.293365478515625, 0.32000732421875, 0.346649169921875, 0.373291015625, 0.399932861328125, 0.42657470703125, 0.453216552734375, 0.4798583984375, 0.506500244140625, 0.53314208984375, 0.559783935546875, 0.58642578125, 0.613067626953125, 0.63970947265625, 0.666351318359375, 0.6929931640625, 0.719635009765625, 0.74627685546875, 0.772918701171875, 0.799560546875, 0.826202392578125, 0.85284423828125, 0.879486083984375, 0.9061279296875, 0.932769775390625, 0.95941162109375, 0.986053466796875, 1.0126953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 5.0, 4.0, 10.0, 13.0, 20.0, 15.0, 18.0, 33.0, 31.0, 36.0, 39.0, 43.0, 50.0, 66.0, 52.0, 48.0, 57.0, 44.0, 54.0, 54.0, 41.0, 45.0, 41.0, 18.0, 29.0, 18.0, 16.0, 9.0, 14.0, 16.0, 12.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.051116943359375, -0.04952192306518555, -0.047926902770996094, -0.04633188247680664, -0.04473686218261719, -0.043141841888427734, -0.04154682159423828, -0.03995180130004883, -0.038356781005859375, -0.03676176071166992, -0.03516674041748047, -0.033571720123291016, -0.03197669982910156, -0.03038167953491211, -0.028786659240722656, -0.027191638946533203, -0.02559661865234375, -0.024001598358154297, -0.022406578063964844, -0.02081155776977539, -0.019216537475585938, -0.017621517181396484, -0.01602649688720703, -0.014431476593017578, -0.012836456298828125, -0.011241436004638672, -0.009646415710449219, -0.008051395416259766, -0.0064563751220703125, -0.004861354827880859, -0.0032663345336914062, -0.0016713142395019531, -7.62939453125e-05, 0.0015187263488769531, 0.0031137466430664062, 0.004708766937255859, 0.0063037872314453125, 0.007898807525634766, 0.009493827819824219, 0.011088848114013672, 0.012683868408203125, 0.014278888702392578, 0.01587390899658203, 0.017468929290771484, 0.019063949584960938, 0.02065896987915039, 0.022253990173339844, 0.023849010467529297, 0.02544403076171875, 0.027039051055908203, 0.028634071350097656, 0.03022909164428711, 0.03182411193847656, 0.033419132232666016, 0.03501415252685547, 0.03660917282104492, 0.038204193115234375, 0.03979921340942383, 0.04139423370361328, 0.042989253997802734, 0.04458427429199219, 0.04617929458618164, 0.047774314880371094, 0.04936933517456055, 0.05096435546875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 13.0, 11.0, 20.0, 27.0, 36.0, 63.0, 87.0, 115.0, 132.0, 122.0, 105.0, 81.0, 62.0, 53.0, 26.0, 18.0, 13.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345200538635254, -2.277953863143921, -2.210707426071167, -2.143460750579834, -2.07621431350708, -2.008967638015747, -1.9417210817337036, -1.8744745254516602, -1.8072279691696167, -1.7399814128875732, -1.6727348566055298, -1.6054883003234863, -1.5382416248321533, -1.4709951877593994, -1.4037485122680664, -1.336501955986023, -1.2692553997039795, -1.202008843421936, -1.1347622871398926, -1.0675157308578491, -1.0002691745758057, -0.9330225586891174, -0.8657759428024292, -0.7985293865203857, -0.7312828302383423, -0.6640362739562988, -0.5967897176742554, -0.5295431017875671, -0.4622965455055237, -0.3950499892234802, -0.3278034031391144, -0.26055681705474854, -0.19331002235412598, -0.12606345117092133, -0.058816879987716675, 0.008429691195487976, 0.07567626237869263, 0.14292281866073608, 0.21016940474510193, 0.2774159908294678, 0.34466254711151123, 0.4119091033935547, 0.47915568947792053, 0.5464022755622864, 0.6136488318443298, 0.6808953881263733, 0.7481420040130615, 0.815388560295105, 0.8826351165771484, 0.9498816728591919, 1.0171282291412354, 1.0843747854232788, 1.1516213417053223, 1.2188680171966553, 1.2861145734786987, 1.3533611297607422, 1.4206076860427856, 1.487854242324829, 1.5551007986068726, 1.622347354888916, 1.689594030380249, 1.756840467453003, 1.824087142944336, 1.8913336992263794, 1.9585802555084229]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 8.0, 15.0, 6.0, 9.0, 9.0, 24.0, 18.0, 18.0, 10.0, 22.0, 22.0, 32.0, 35.0, 44.0, 37.0, 39.0, 36.0, 44.0, 38.0, 44.0, 48.0, 42.0, 34.0, 42.0, 37.0, 32.0, 33.0, 30.0, 31.0, 17.0, 18.0, 21.0, 10.0, 8.0, 21.0, 13.0, 13.0, 9.0, 4.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.1172288656234741, -1.0859273672103882, -1.0546259880065918, -1.0233244895935059, -0.9920230507850647, -0.9607216119766235, -0.9294201135635376, -0.8981186747550964, -0.8668172359466553, -0.8355157971382141, -0.804214358329773, -0.772912859916687, -0.7416114211082458, -0.7103099822998047, -0.6790084838867188, -0.6477070450782776, -0.6164056062698364, -0.5851041674613953, -0.5538027286529541, -0.5225012302398682, -0.491199791431427, -0.45989835262298584, -0.4285968840122223, -0.39729541540145874, -0.3659939765930176, -0.3346925377845764, -0.30339106917381287, -0.2720896005630493, -0.24078816175460815, -0.2094867080450058, -0.17818525433540344, -0.1468838006258011, -0.11558234691619873, -0.08428089320659637, -0.05297943949699402, -0.021677985787391663, 0.009623467922210693, 0.04092492163181305, 0.0722263753414154, 0.10352782905101776, 0.13482928276062012, 0.16613073647022247, 0.19743219017982483, 0.22873364388942719, 0.26003509759902954, 0.2913365364074707, 0.32263800501823425, 0.3539394736289978, 0.38524091243743896, 0.4165423512458801, 0.4478438198566437, 0.4791452884674072, 0.5104467272758484, 0.5417481660842896, 0.5730496644973755, 0.6043511033058167, 0.6356525421142578, 0.666953980922699, 0.6982554197311401, 0.7295569181442261, 0.7608583569526672, 0.7921597957611084, 0.8234612941741943, 0.8547627329826355, 0.8860641717910767]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 13.0, 23.0, 24.0, 55.0, 97.0, 154.0, 329.0, 560.0, 988.0, 1980.0, 4051.0, 8783.0, 20786.0, 52925.0, 162532.0, 434747.0, 238397.0, 72940.0, 27596.0, 11325.0, 5041.0, 2483.0, 1202.0, 635.0, 389.0, 190.0, 96.0, 68.0, 43.0, 36.0, 15.0, 11.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8421554565429688, -0.8146820068359375, -0.7872085571289062, -0.759735107421875, -0.7322616577148438, -0.7047882080078125, -0.6773147583007812, -0.64984130859375, -0.6223678588867188, -0.5948944091796875, -0.5674209594726562, -0.539947509765625, -0.5124740600585938, -0.4850006103515625, -0.45752716064453125, -0.4300537109375, -0.40258026123046875, -0.3751068115234375, -0.34763336181640625, -0.320159912109375, -0.29268646240234375, -0.2652130126953125, -0.23773956298828125, -0.21026611328125, -0.18279266357421875, -0.1553192138671875, -0.12784576416015625, -0.100372314453125, -0.07289886474609375, -0.0454254150390625, -0.01795196533203125, 0.009521484375, 0.03699493408203125, 0.0644683837890625, 0.09194183349609375, 0.119415283203125, 0.14688873291015625, 0.1743621826171875, 0.20183563232421875, 0.22930908203125, 0.25678253173828125, 0.2842559814453125, 0.31172943115234375, 0.339202880859375, 0.36667633056640625, 0.3941497802734375, 0.42162322998046875, 0.4490966796875, 0.47657012939453125, 0.5040435791015625, 0.5315170288085938, 0.558990478515625, 0.5864639282226562, 0.6139373779296875, 0.6414108276367188, 0.66888427734375, 0.6963577270507812, 0.7238311767578125, 0.7513046264648438, 0.778778076171875, 0.8062515258789062, 0.8337249755859375, 0.8611984252929688, 0.888671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 6.0, 11.0, 21.0, 16.0, 22.0, 28.0, 21.0, 34.0, 33.0, 34.0, 51.0, 42.0, 39.0, 35.0, 38.0, 53.0, 47.0, 45.0, 43.0, 49.0, 55.0, 30.0, 34.0, 30.0, 36.0, 30.0, 21.0, 23.0, 14.0, 24.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.94769287109375, -4.7977294921875, -4.64776611328125, -4.497802734375, -4.34783935546875, -4.1978759765625, -4.04791259765625, -3.89794921875, -3.74798583984375, -3.5980224609375, -3.44805908203125, -3.298095703125, -3.14813232421875, -2.9981689453125, -2.84820556640625, -2.6982421875, -2.54827880859375, -2.3983154296875, -2.24835205078125, -2.098388671875, -1.94842529296875, -1.7984619140625, -1.64849853515625, -1.49853515625, -1.34857177734375, -1.1986083984375, -1.04864501953125, -0.898681640625, -0.74871826171875, -0.5987548828125, -0.44879150390625, -0.298828125, -0.14886474609375, 0.0010986328125, 0.15106201171875, 0.301025390625, 0.45098876953125, 0.6009521484375, 0.75091552734375, 0.90087890625, 1.05084228515625, 1.2008056640625, 1.35076904296875, 1.500732421875, 1.65069580078125, 1.8006591796875, 1.95062255859375, 2.1005859375, 2.25054931640625, 2.4005126953125, 2.55047607421875, 2.700439453125, 2.85040283203125, 3.0003662109375, 3.15032958984375, 3.30029296875, 3.45025634765625, 3.6002197265625, 3.75018310546875, 3.900146484375, 4.05010986328125, 4.2000732421875, 4.35003662109375, 4.5]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 9.0, 7.0, 9.0, 14.0, 13.0, 19.0, 22.0, 39.0, 42.0, 49.0, 52.0, 75.0, 126.0, 319.0, 33608.0, 1013024.0, 559.0, 139.0, 81.0, 49.0, 60.0, 36.0, 39.0, 26.0, 26.0, 23.0, 20.0, 12.0, 15.0, 14.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.576171875, -17.08984375, -16.603515625, -16.1171875, -15.630859375, -15.14453125, -14.658203125, -14.171875, -13.685546875, -13.19921875, -12.712890625, -12.2265625, -11.740234375, -11.25390625, -10.767578125, -10.28125, -9.794921875, -9.30859375, -8.822265625, -8.3359375, -7.849609375, -7.36328125, -6.876953125, -6.390625, -5.904296875, -5.41796875, -4.931640625, -4.4453125, -3.958984375, -3.47265625, -2.986328125, -2.5, -2.013671875, -1.52734375, -1.041015625, -0.5546875, -0.068359375, 0.41796875, 0.904296875, 1.390625, 1.876953125, 2.36328125, 2.849609375, 3.3359375, 3.822265625, 4.30859375, 4.794921875, 5.28125, 5.767578125, 6.25390625, 6.740234375, 7.2265625, 7.712890625, 8.19921875, 8.685546875, 9.171875, 9.658203125, 10.14453125, 10.630859375, 11.1171875, 11.603515625, 12.08984375, 12.576171875, 13.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 3.0, 7.0, 10.0, 5.0, 12.0, 9.0, 18.0, 24.0, 22.0, 31.0, 45.0, 42.0, 44.0, 46.0, 53.0, 55.0, 54.0, 62.0, 53.0, 55.0, 44.0, 41.0, 44.0, 41.0, 23.0, 35.0, 21.0, 21.0, 19.0, 12.0, 14.0, 16.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -7.00506591796875, -6.8109130859375, -6.61676025390625, -6.422607421875, -6.22845458984375, -6.0343017578125, -5.84014892578125, -5.64599609375, -5.45184326171875, -5.2576904296875, -5.06353759765625, -4.869384765625, -4.67523193359375, -4.4810791015625, -4.28692626953125, -4.0927734375, -3.89862060546875, -3.7044677734375, -3.51031494140625, -3.316162109375, -3.12200927734375, -2.9278564453125, -2.73370361328125, -2.53955078125, -2.34539794921875, -2.1512451171875, -1.95709228515625, -1.762939453125, -1.56878662109375, -1.3746337890625, -1.18048095703125, -0.986328125, -0.79217529296875, -0.5980224609375, -0.40386962890625, -0.209716796875, -0.01556396484375, 0.1785888671875, 0.37274169921875, 0.56689453125, 0.76104736328125, 0.9552001953125, 1.14935302734375, 1.343505859375, 1.53765869140625, 1.7318115234375, 1.92596435546875, 2.1201171875, 2.31427001953125, 2.5084228515625, 2.70257568359375, 2.896728515625, 3.09088134765625, 3.2850341796875, 3.47918701171875, 3.67333984375, 3.86749267578125, 4.0616455078125, 4.25579833984375, 4.449951171875, 4.64410400390625, 4.8382568359375, 5.03240966796875, 5.2265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 12.0, 10.0, 17.0, 18.0, 31.0, 58.0, 111.0, 203.0, 1056.0, 16046.0, 957871.0, 70180.0, 2264.0, 357.0, 126.0, 56.0, 32.0, 27.0, 21.0, 10.0, 9.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1912994384765625, -1.151153564453125, -1.1110076904296875, -1.07086181640625, -1.0307159423828125, -0.990570068359375, -0.9504241943359375, -0.9102783203125, -0.8701324462890625, -0.829986572265625, -0.7898406982421875, -0.74969482421875, -0.7095489501953125, -0.669403076171875, -0.6292572021484375, -0.589111328125, -0.5489654541015625, -0.508819580078125, -0.4686737060546875, -0.42852783203125, -0.3883819580078125, -0.348236083984375, -0.3080902099609375, -0.2679443359375, -0.2277984619140625, -0.187652587890625, -0.1475067138671875, -0.10736083984375, -0.0672149658203125, -0.027069091796875, 0.0130767822265625, 0.05322265625, 0.0933685302734375, 0.133514404296875, 0.1736602783203125, 0.21380615234375, 0.2539520263671875, 0.294097900390625, 0.3342437744140625, 0.3743896484375, 0.4145355224609375, 0.454681396484375, 0.4948272705078125, 0.53497314453125, 0.5751190185546875, 0.615264892578125, 0.6554107666015625, 0.695556640625, 0.7357025146484375, 0.775848388671875, 0.8159942626953125, 0.85614013671875, 0.8962860107421875, 0.936431884765625, 0.9765777587890625, 1.0167236328125, 1.0568695068359375, 1.097015380859375, 1.1371612548828125, 1.17730712890625, 1.2174530029296875, 1.257598876953125, 1.2977447509765625, 1.337890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 8.0, 7.0, 13.0, 18.0, 18.0, 28.0, 46.0, 84.0, 90.0, 141.0, 171.0, 127.0, 76.0, 67.0, 32.0, 14.0, 18.0, 4.0, 13.0, 6.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.990266799926758e-05, -5.7606957852840424e-05, -5.531124770641327e-05, -5.3015537559986115e-05, -5.071982741355896e-05, -4.8424117267131805e-05, -4.612840712070465e-05, -4.3832696974277496e-05, -4.153698682785034e-05, -3.924127668142319e-05, -3.694556653499603e-05, -3.464985638856888e-05, -3.2354146242141724e-05, -3.005843609571457e-05, -2.7762725949287415e-05, -2.546701580286026e-05, -2.3171305656433105e-05, -2.087559551000595e-05, -1.8579885363578796e-05, -1.6284175217151642e-05, -1.3988465070724487e-05, -1.1692754924297333e-05, -9.397044777870178e-06, -7.101334631443024e-06, -4.805624485015869e-06, -2.5099143385887146e-06, -2.1420419216156006e-07, 2.0815059542655945e-06, 4.377216100692749e-06, 6.6729262471199036e-06, 8.968636393547058e-06, 1.1264346539974213e-05, 1.3560056686401367e-05, 1.5855766832828522e-05, 1.8151476979255676e-05, 2.044718712568283e-05, 2.2742897272109985e-05, 2.503860741853714e-05, 2.7334317564964294e-05, 2.963002771139145e-05, 3.1925737857818604e-05, 3.422144800424576e-05, 3.651715815067291e-05, 3.881286829710007e-05, 4.110857844352722e-05, 4.3404288589954376e-05, 4.569999873638153e-05, 4.7995708882808685e-05, 5.029141902923584e-05, 5.2587129175662994e-05, 5.488283932209015e-05, 5.7178549468517303e-05, 5.947425961494446e-05, 6.176996976137161e-05, 6.406567990779877e-05, 6.636139005422592e-05, 6.865710020065308e-05, 7.095281034708023e-05, 7.324852049350739e-05, 7.554423063993454e-05, 7.78399407863617e-05, 8.013565093278885e-05, 8.2431361079216e-05, 8.472707122564316e-05, 8.702278137207031e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 4.0, 9.0, 15.0, 21.0, 25.0, 34.0, 78.0, 147.0, 364.0, 1354.0, 7852.0, 134165.0, 863544.0, 36037.0, 3646.0, 745.0, 229.0, 111.0, 39.0, 41.0, 25.0, 18.0, 12.0, 10.0, 2.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6608047485351562, -0.6336212158203125, -0.6064376831054688, -0.579254150390625, -0.5520706176757812, -0.5248870849609375, -0.49770355224609375, -0.47052001953125, -0.44333648681640625, -0.4161529541015625, -0.38896942138671875, -0.361785888671875, -0.33460235595703125, -0.3074188232421875, -0.28023529052734375, -0.2530517578125, -0.22586822509765625, -0.1986846923828125, -0.17150115966796875, -0.144317626953125, -0.11713409423828125, -0.0899505615234375, -0.06276702880859375, -0.03558349609375, -0.00839996337890625, 0.0187835693359375, 0.04596710205078125, 0.073150634765625, 0.10033416748046875, 0.1275177001953125, 0.15470123291015625, 0.181884765625, 0.20906829833984375, 0.2362518310546875, 0.26343536376953125, 0.290618896484375, 0.31780242919921875, 0.3449859619140625, 0.37216949462890625, 0.39935302734375, 0.42653656005859375, 0.4537200927734375, 0.48090362548828125, 0.508087158203125, 0.5352706909179688, 0.5624542236328125, 0.5896377563476562, 0.6168212890625, 0.6440048217773438, 0.6711883544921875, 0.6983718872070312, 0.725555419921875, 0.7527389526367188, 0.7799224853515625, 0.8071060180664062, 0.83428955078125, 0.8614730834960938, 0.8886566162109375, 0.9158401489257812, 0.943023681640625, 0.9702072143554688, 0.9973907470703125, 1.0245742797851562, 1.0517578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 10.0, 14.0, 16.0, 22.0, 34.0, 44.0, 42.0, 71.0, 73.0, 86.0, 134.0, 101.0, 79.0, 66.0, 57.0, 40.0, 18.0, 17.0, 16.0, 15.0, 12.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14432907104492188, -0.13961029052734375, -0.13489151000976562, -0.1301727294921875, -0.12545394897460938, -0.12073516845703125, -0.11601638793945312, -0.111297607421875, -0.10657882690429688, -0.10186004638671875, -0.09714126586914062, -0.0924224853515625, -0.08770370483398438, -0.08298492431640625, -0.07826614379882812, -0.07354736328125, -0.06882858276367188, -0.06410980224609375, -0.059391021728515625, -0.0546722412109375, -0.049953460693359375, -0.04523468017578125, -0.040515899658203125, -0.035797119140625, -0.031078338623046875, -0.02635955810546875, -0.021640777587890625, -0.0169219970703125, -0.012203216552734375, -0.00748443603515625, -0.002765655517578125, 0.001953125, 0.006671905517578125, 0.01139068603515625, 0.016109466552734375, 0.0208282470703125, 0.025547027587890625, 0.03026580810546875, 0.034984588623046875, 0.039703369140625, 0.044422149658203125, 0.04914093017578125, 0.053859710693359375, 0.0585784912109375, 0.06329727172851562, 0.06801605224609375, 0.07273483276367188, 0.07745361328125, 0.08217239379882812, 0.08689117431640625, 0.09160995483398438, 0.0963287353515625, 0.10104751586914062, 0.10576629638671875, 0.11048507690429688, 0.115203857421875, 0.11992263793945312, 0.12464141845703125, 0.12936019897460938, 0.1340789794921875, 0.13879776000976562, 0.14351654052734375, 0.14823532104492188, 0.1529541015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 15.0, 35.0, 119.0, 230.0, 271.0, 186.0, 103.0, 36.0, 11.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4186618328094482, -2.1285288333892822, -1.8383958339691162, -1.5482627153396606, -1.2581297159194946, -0.9679967164993286, -0.677863597869873, -0.38773059844970703, -0.09759759902954102, 0.1925354301929474, 0.4826684594154358, 0.7728015184402466, 1.0629345178604126, 1.3530675172805786, 1.6432006359100342, 1.9333336353302002, 2.223466634750366, 2.5135996341705322, 2.8037326335906982, 3.0938658714294434, 3.3839988708496094, 3.6741318702697754, 3.9642648696899414, 4.254397869110107, 4.544530868530273, 4.8346638679504395, 5.1247968673706055, 5.4149298667907715, 5.7050628662109375, 5.9951958656311035, 6.2853288650512695, 6.575462341308594, 6.865595817565918, 7.155728816986084, 7.44586181640625, 7.735994815826416, 8.026127815246582, 8.316261291503906, 8.606393814086914, 8.896527290344238, 9.186659812927246, 9.47679328918457, 9.766925811767578, 10.057059288024902, 10.34719181060791, 10.637325286865234, 10.927457809448242, 11.217591285705566, 11.50772476196289, 11.797858238220215, 12.087990760803223, 12.378124237060547, 12.668256759643555, 12.958390235900879, 13.248522758483887, 13.538656234741211, 13.828788757324219, 14.118922233581543, 14.40905475616455, 14.699188232421875, 14.989320755004883, 15.279454231262207, 15.569586753845215, 15.859720230102539, 16.149852752685547]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 5.0, 9.0, 14.0, 15.0, 19.0, 17.0, 26.0, 28.0, 30.0, 39.0, 41.0, 30.0, 42.0, 30.0, 49.0, 43.0, 43.0, 60.0, 48.0, 51.0, 53.0, 35.0, 31.0, 31.0, 30.0, 26.0, 23.0, 19.0, 22.0, 17.0, 12.0, 9.0, 14.0, 7.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.346895217895508, -8.117851257324219, -7.8888068199157715, -7.659762382507324, -7.430718421936035, -7.201673984527588, -6.972629547119141, -6.743585586547852, -6.514541149139404, -6.285496711730957, -6.056452751159668, -5.827408313751221, -5.598363876342773, -5.369319915771484, -5.140275478363037, -4.91123104095459, -4.682187080383301, -4.4531426429748535, -4.2240986824035645, -3.995054244995117, -3.766010046005249, -3.536965847015381, -3.3079214096069336, -3.0788772106170654, -2.8498330116271973, -2.620788812637329, -2.391744613647461, -2.1627001762390137, -1.9336559772491455, -1.7046117782592773, -1.4755674600601196, -1.246523141860962, -1.0174789428710938, -0.7884346842765808, -0.5593904256820679, -0.33034616708755493, -0.10130190849304199, 0.12774229049682617, 0.3567866086959839, 0.5858309268951416, 0.8148751258850098, 1.043919324874878, 1.2729636430740356, 1.5020079612731934, 1.7310521602630615, 1.9600963592529297, 2.189140796661377, 2.418184995651245, 2.6472291946411133, 2.8762733936309814, 3.1053175926208496, 3.334362030029297, 3.563406229019165, 3.792450428009033, 4.0214948654174805, 4.2505388259887695, 4.479583263397217, 4.708627700805664, 4.937671661376953, 5.1667160987854, 5.395760536193848, 5.624804496765137, 5.853848934173584, 6.082893371582031, 6.31193733215332]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 5.0, 16.0, 8.0, 13.0, 8.0, 14.0, 22.0, 25.0, 30.0, 37.0, 58.0, 77.0, 171.0, 746.0, 5551.0, 221468.0, 3774013.0, 185772.0, 5132.0, 664.0, 148.0, 61.0, 33.0, 28.0, 30.0, 24.0, 23.0, 18.0, 19.0, 13.0, 11.0, 15.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6953125, -6.51177978515625, -6.3282470703125, -6.14471435546875, -5.961181640625, -5.77764892578125, -5.5941162109375, -5.41058349609375, -5.22705078125, -5.04351806640625, -4.8599853515625, -4.67645263671875, -4.492919921875, -4.30938720703125, -4.1258544921875, -3.94232177734375, -3.7587890625, -3.57525634765625, -3.3917236328125, -3.20819091796875, -3.024658203125, -2.84112548828125, -2.6575927734375, -2.47406005859375, -2.29052734375, -2.10699462890625, -1.9234619140625, -1.73992919921875, -1.556396484375, -1.37286376953125, -1.1893310546875, -1.00579833984375, -0.822265625, -0.63873291015625, -0.4552001953125, -0.27166748046875, -0.088134765625, 0.09539794921875, 0.2789306640625, 0.46246337890625, 0.64599609375, 0.82952880859375, 1.0130615234375, 1.19659423828125, 1.380126953125, 1.56365966796875, 1.7471923828125, 1.93072509765625, 2.1142578125, 2.29779052734375, 2.4813232421875, 2.66485595703125, 2.848388671875, 3.03192138671875, 3.2154541015625, 3.39898681640625, 3.58251953125, 3.76605224609375, 3.9495849609375, 4.13311767578125, 4.316650390625, 4.50018310546875, 4.6837158203125, 4.86724853515625, 5.05078125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 11.0, 9.0, 8.0, 13.0, 17.0, 21.0, 19.0, 28.0, 25.0, 21.0, 28.0, 34.0, 45.0, 39.0, 43.0, 33.0, 47.0, 45.0, 41.0, 56.0, 42.0, 43.0, 41.0, 36.0, 36.0, 31.0, 30.0, 30.0, 20.0, 18.0, 12.0, 9.0, 11.0, 7.0, 11.0, 6.0, 8.0, 10.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.473358154296875, -1.43206787109375, -1.390777587890625, -1.3494873046875, -1.308197021484375, -1.26690673828125, -1.225616455078125, -1.184326171875, -1.143035888671875, -1.10174560546875, -1.060455322265625, -1.0191650390625, -0.977874755859375, -0.93658447265625, -0.895294189453125, -0.85400390625, -0.812713623046875, -0.77142333984375, -0.730133056640625, -0.6888427734375, -0.647552490234375, -0.60626220703125, -0.564971923828125, -0.523681640625, -0.482391357421875, -0.44110107421875, -0.399810791015625, -0.3585205078125, -0.317230224609375, -0.27593994140625, -0.234649658203125, -0.193359375, -0.152069091796875, -0.11077880859375, -0.069488525390625, -0.0281982421875, 0.013092041015625, 0.05438232421875, 0.095672607421875, 0.136962890625, 0.178253173828125, 0.21954345703125, 0.260833740234375, 0.3021240234375, 0.343414306640625, 0.38470458984375, 0.425994873046875, 0.46728515625, 0.508575439453125, 0.54986572265625, 0.591156005859375, 0.6324462890625, 0.673736572265625, 0.71502685546875, 0.756317138671875, 0.797607421875, 0.838897705078125, 0.88018798828125, 0.921478271484375, 0.9627685546875, 1.004058837890625, 1.04534912109375, 1.086639404296875, 1.1279296875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 10.0, 8.0, 16.0, 28.0, 32.0, 96.0, 140.0, 244.0, 534.0, 18171.0, 4173208.0, 987.0, 369.0, 185.0, 105.0, 58.0, 34.0, 12.0, 8.0, 11.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.09375, -25.308349609375, -24.52294921875, -23.737548828125, -22.9521484375, -22.166748046875, -21.38134765625, -20.595947265625, -19.810546875, -19.025146484375, -18.23974609375, -17.454345703125, -16.6689453125, -15.883544921875, -15.09814453125, -14.312744140625, -13.52734375, -12.741943359375, -11.95654296875, -11.171142578125, -10.3857421875, -9.600341796875, -8.81494140625, -8.029541015625, -7.244140625, -6.458740234375, -5.67333984375, -4.887939453125, -4.1025390625, -3.317138671875, -2.53173828125, -1.746337890625, -0.9609375, -0.175537109375, 0.60986328125, 1.395263671875, 2.1806640625, 2.966064453125, 3.75146484375, 4.536865234375, 5.322265625, 6.107666015625, 6.89306640625, 7.678466796875, 8.4638671875, 9.249267578125, 10.03466796875, 10.820068359375, 11.60546875, 12.390869140625, 13.17626953125, 13.961669921875, 14.7470703125, 15.532470703125, 16.31787109375, 17.103271484375, 17.888671875, 18.674072265625, 19.45947265625, 20.244873046875, 21.0302734375, 21.815673828125, 22.60107421875, 23.386474609375, 24.171875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 13.0, 10.0, 19.0, 29.0, 38.0, 57.0, 77.0, 96.0, 146.0, 203.0, 298.0, 464.0, 536.0, 518.0, 474.0, 307.0, 229.0, 151.0, 110.0, 87.0, 47.0, 38.0, 30.0, 18.0, 16.0, 15.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7861328125, -0.764892578125, -0.74365234375, -0.722412109375, -0.701171875, -0.679931640625, -0.65869140625, -0.637451171875, -0.6162109375, -0.594970703125, -0.57373046875, -0.552490234375, -0.53125, -0.510009765625, -0.48876953125, -0.467529296875, -0.4462890625, -0.425048828125, -0.40380859375, -0.382568359375, -0.361328125, -0.340087890625, -0.31884765625, -0.297607421875, -0.2763671875, -0.255126953125, -0.23388671875, -0.212646484375, -0.19140625, -0.170166015625, -0.14892578125, -0.127685546875, -0.1064453125, -0.085205078125, -0.06396484375, -0.042724609375, -0.021484375, -0.000244140625, 0.02099609375, 0.042236328125, 0.0634765625, 0.084716796875, 0.10595703125, 0.127197265625, 0.1484375, 0.169677734375, 0.19091796875, 0.212158203125, 0.2333984375, 0.254638671875, 0.27587890625, 0.297119140625, 0.318359375, 0.339599609375, 0.36083984375, 0.382080078125, 0.4033203125, 0.424560546875, 0.44580078125, 0.467041015625, 0.48828125, 0.509521484375, 0.53076171875, 0.552001953125, 0.5732421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 14.0, 12.0, 13.0, 27.0, 40.0, 45.0, 62.0, 83.0, 84.0, 104.0, 109.0, 97.0, 77.0, 57.0, 42.0, 39.0, 27.0, 22.0, 11.0, 15.0, 5.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1332597732543945, -2.051584005355835, -1.9699079990386963, -1.8882321119308472, -1.806556224822998, -1.7248804569244385, -1.6432045698165894, -1.5615286827087402, -1.4798527956008911, -1.398176908493042, -1.3165010213851929, -1.2348251342773438, -1.1531493663787842, -1.0714733600616455, -0.9897975921630859, -0.9081217050552368, -0.8264458179473877, -0.7447699308395386, -0.6630940437316895, -0.5814182162284851, -0.499742329120636, -0.41806644201278687, -0.33639058470726013, -0.2547147274017334, -0.17303884029388428, -0.09136296808719635, -0.009687095880508423, 0.0719887763261795, 0.15366464853286743, 0.23534053564071655, 0.3170163929462433, 0.39869225025177, 0.48036789894104004, 0.5620437860488892, 0.6437196731567383, 0.7253955006599426, 0.8070713877677917, 0.8887472748756409, 0.9704231023788452, 1.0520989894866943, 1.1337748765945435, 1.2154507637023926, 1.2971266508102417, 1.3788025379180908, 1.4604783058166504, 1.542154312133789, 1.6238300800323486, 1.7055059671401978, 1.7871818542480469, 1.868857741355896, 1.9505336284637451, 2.0322093963623047, 2.1138854026794434, 2.195561170578003, 2.2772371768951416, 2.358912944793701, 2.44058895111084, 2.5222647190093994, 2.603940725326538, 2.6856164932250977, 2.7672924995422363, 2.848968267440796, 2.9306442737579346, 3.012320041656494, 3.0939958095550537]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 3.0, 12.0, 10.0, 11.0, 7.0, 18.0, 24.0, 12.0, 17.0, 20.0, 34.0, 21.0, 32.0, 37.0, 41.0, 44.0, 32.0, 51.0, 37.0, 31.0, 28.0, 36.0, 28.0, 40.0, 49.0, 35.0, 36.0, 29.0, 27.0, 15.0, 30.0, 31.0, 18.0, 13.0, 19.0, 13.0, 12.0, 11.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3140054941177368, -1.273231029510498, -1.2324565649032593, -1.1916821002960205, -1.1509076356887817, -1.110133171081543, -1.0693587064743042, -1.0285842418670654, -0.9878097772598267, -0.9470353126525879, -0.9062608480453491, -0.8654863834381104, -0.8247119188308716, -0.7839374542236328, -0.743162989616394, -0.7023885250091553, -0.6616141200065613, -0.6208396553993225, -0.5800651907920837, -0.539290726184845, -0.4985162615776062, -0.45774179697036743, -0.41696736216545105, -0.3761928975582123, -0.3354184329509735, -0.29464396834373474, -0.25386950373649597, -0.2130950540304184, -0.17232058942317963, -0.13154612481594086, -0.09077167510986328, -0.04999721050262451, -0.009222745895385742, 0.03155171498656273, 0.0723261758685112, 0.11310063302516937, 0.15387509763240814, 0.1946495622396469, 0.2354240119457245, 0.27619847655296326, 0.316972941160202, 0.3577474057674408, 0.39852187037467957, 0.43929630517959595, 0.4800707697868347, 0.5208452343940735, 0.5616196990013123, 0.602394163608551, 0.6431686282157898, 0.6839430928230286, 0.7247175574302673, 0.7654920220375061, 0.8062664866447449, 0.8470409512519836, 0.8878153562545776, 0.9285898208618164, 0.9693642854690552, 1.010138750076294, 1.0509132146835327, 1.0916876792907715, 1.1324621438980103, 1.173236608505249, 1.2140110731124878, 1.2547855377197266, 1.2955600023269653]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 16.0, 16.0, 13.0, 32.0, 44.0, 98.0, 200.0, 450.0, 1241.0, 3291.0, 11160.0, 46225.0, 216083.0, 494656.0, 213146.0, 45504.0, 10989.0, 3342.0, 1144.0, 444.0, 209.0, 95.0, 60.0, 27.0, 14.0, 20.0, 7.0, 9.0, 9.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8525390625, -0.825469970703125, -0.79840087890625, -0.771331787109375, -0.7442626953125, -0.717193603515625, -0.69012451171875, -0.663055419921875, -0.635986328125, -0.608917236328125, -0.58184814453125, -0.554779052734375, -0.5277099609375, -0.500640869140625, -0.47357177734375, -0.446502685546875, -0.41943359375, -0.392364501953125, -0.36529541015625, -0.338226318359375, -0.3111572265625, -0.284088134765625, -0.25701904296875, -0.229949951171875, -0.202880859375, -0.175811767578125, -0.14874267578125, -0.121673583984375, -0.0946044921875, -0.067535400390625, -0.04046630859375, -0.013397216796875, 0.013671875, 0.040740966796875, 0.06781005859375, 0.094879150390625, 0.1219482421875, 0.149017333984375, 0.17608642578125, 0.203155517578125, 0.230224609375, 0.257293701171875, 0.28436279296875, 0.311431884765625, 0.3385009765625, 0.365570068359375, 0.39263916015625, 0.419708251953125, 0.44677734375, 0.473846435546875, 0.50091552734375, 0.527984619140625, 0.5550537109375, 0.582122802734375, 0.60919189453125, 0.636260986328125, 0.663330078125, 0.690399169921875, 0.71746826171875, 0.744537353515625, 0.7716064453125, 0.798675537109375, 0.82574462890625, 0.852813720703125, 0.8798828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 11.0, 14.0, 14.0, 11.0, 22.0, 26.0, 25.0, 28.0, 34.0, 50.0, 38.0, 45.0, 62.0, 47.0, 59.0, 55.0, 53.0, 59.0, 58.0, 47.0, 43.0, 38.0, 39.0, 24.0, 21.0, 20.0, 20.0, 12.0, 7.0, 4.0, 10.0, 3.0, 3.0, 4.0], "bins": [-1.537109375, -1.5028533935546875, -1.468597412109375, -1.4343414306640625, -1.40008544921875, -1.3658294677734375, -1.331573486328125, -1.2973175048828125, -1.2630615234375, -1.2288055419921875, -1.194549560546875, -1.1602935791015625, -1.12603759765625, -1.0917816162109375, -1.057525634765625, -1.0232696533203125, -0.989013671875, -0.9547576904296875, -0.920501708984375, -0.8862457275390625, -0.85198974609375, -0.8177337646484375, -0.783477783203125, -0.7492218017578125, -0.7149658203125, -0.6807098388671875, -0.646453857421875, -0.6121978759765625, -0.57794189453125, -0.5436859130859375, -0.509429931640625, -0.4751739501953125, -0.44091796875, -0.4066619873046875, -0.372406005859375, -0.3381500244140625, -0.30389404296875, -0.2696380615234375, -0.235382080078125, -0.2011260986328125, -0.1668701171875, -0.1326141357421875, -0.098358154296875, -0.0641021728515625, -0.02984619140625, 0.0044097900390625, 0.038665771484375, 0.0729217529296875, 0.107177734375, 0.1414337158203125, 0.175689697265625, 0.2099456787109375, 0.24420166015625, 0.2784576416015625, 0.312713623046875, 0.3469696044921875, 0.3812255859375, 0.4154815673828125, 0.449737548828125, 0.4839935302734375, 0.51824951171875, 0.5525054931640625, 0.586761474609375, 0.6210174560546875, 0.6552734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 9.0, 4.0, 10.0, 18.0, 14.0, 29.0, 42.0, 68.0, 98.0, 134.0, 252.0, 461.0, 836.0, 1866.0, 3993.0, 9843.0, 26179.0, 75619.0, 214008.0, 364947.0, 223803.0, 79855.0, 27819.0, 10349.0, 4191.0, 1931.0, 908.0, 463.0, 282.0, 178.0, 99.0, 77.0, 56.0, 33.0, 21.0, 14.0, 10.0, 13.0, 5.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.4853515625, -0.4683380126953125, -0.451324462890625, -0.4343109130859375, -0.41729736328125, -0.4002838134765625, -0.383270263671875, -0.3662567138671875, -0.3492431640625, -0.3322296142578125, -0.315216064453125, -0.2982025146484375, -0.28118896484375, -0.2641754150390625, -0.247161865234375, -0.2301483154296875, -0.213134765625, -0.1961212158203125, -0.179107666015625, -0.1620941162109375, -0.14508056640625, -0.1280670166015625, -0.111053466796875, -0.0940399169921875, -0.0770263671875, -0.0600128173828125, -0.042999267578125, -0.0259857177734375, -0.00897216796875, 0.0080413818359375, 0.025054931640625, 0.0420684814453125, 0.05908203125, 0.0760955810546875, 0.093109130859375, 0.1101226806640625, 0.12713623046875, 0.1441497802734375, 0.161163330078125, 0.1781768798828125, 0.1951904296875, 0.2122039794921875, 0.229217529296875, 0.2462310791015625, 0.26324462890625, 0.2802581787109375, 0.297271728515625, 0.3142852783203125, 0.331298828125, 0.3483123779296875, 0.365325927734375, 0.3823394775390625, 0.39935302734375, 0.4163665771484375, 0.433380126953125, 0.4503936767578125, 0.4674072265625, 0.4844207763671875, 0.501434326171875, 0.5184478759765625, 0.53546142578125, 0.5524749755859375, 0.569488525390625, 0.5865020751953125, 0.603515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 4.0, 4.0, 7.0, 12.0, 21.0, 16.0, 23.0, 24.0, 30.0, 25.0, 40.0, 38.0, 41.0, 56.0, 49.0, 51.0, 52.0, 63.0, 45.0, 39.0, 55.0, 43.0, 35.0, 38.0, 23.0, 23.0, 33.0, 23.0, 18.0, 11.0, 12.0, 14.0, 5.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7939453125, -1.7426300048828125, -1.691314697265625, -1.6399993896484375, -1.58868408203125, -1.5373687744140625, -1.486053466796875, -1.4347381591796875, -1.3834228515625, -1.3321075439453125, -1.280792236328125, -1.2294769287109375, -1.17816162109375, -1.1268463134765625, -1.075531005859375, -1.0242156982421875, -0.972900390625, -0.9215850830078125, -0.870269775390625, -0.8189544677734375, -0.76763916015625, -0.7163238525390625, -0.665008544921875, -0.6136932373046875, -0.5623779296875, -0.5110626220703125, -0.459747314453125, -0.4084320068359375, -0.35711669921875, -0.3058013916015625, -0.254486083984375, -0.2031707763671875, -0.15185546875, -0.1005401611328125, -0.049224853515625, 0.0020904541015625, 0.05340576171875, 0.1047210693359375, 0.156036376953125, 0.2073516845703125, 0.2586669921875, 0.3099822998046875, 0.361297607421875, 0.4126129150390625, 0.46392822265625, 0.5152435302734375, 0.566558837890625, 0.6178741455078125, 0.669189453125, 0.7205047607421875, 0.771820068359375, 0.8231353759765625, 0.87445068359375, 0.9257659912109375, 0.977081298828125, 1.0283966064453125, 1.0797119140625, 1.1310272216796875, 1.182342529296875, 1.2336578369140625, 1.28497314453125, 1.3362884521484375, 1.387603759765625, 1.4389190673828125, 1.490234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 4.0, 10.0, 5.0, 12.0, 18.0, 35.0, 34.0, 54.0, 104.0, 160.0, 276.0, 437.0, 785.0, 1411.0, 2662.0, 5300.0, 11376.0, 27112.0, 70291.0, 189485.0, 343318.0, 239927.0, 93128.0, 34570.0, 14338.0, 6574.0, 3171.0, 1723.0, 887.0, 525.0, 307.0, 168.0, 109.0, 58.0, 52.0, 34.0, 28.0, 22.0, 10.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.1294422149658203, -0.12521743774414062, -0.12099266052246094, -0.11676788330078125, -0.11254310607910156, -0.10831832885742188, -0.10409355163574219, -0.0998687744140625, -0.09564399719238281, -0.09141921997070312, -0.08719444274902344, -0.08296966552734375, -0.07874488830566406, -0.07452011108398438, -0.07029533386230469, -0.066070556640625, -0.06184577941894531, -0.057621002197265625, -0.05339622497558594, -0.04917144775390625, -0.04494667053222656, -0.040721893310546875, -0.03649711608886719, -0.0322723388671875, -0.028047561645507812, -0.023822784423828125, -0.019598007202148438, -0.01537322998046875, -0.011148452758789062, -0.006923675537109375, -0.0026988983154296875, 0.00152587890625, 0.0057506561279296875, 0.009975433349609375, 0.014200210571289062, 0.01842498779296875, 0.022649765014648438, 0.026874542236328125, 0.031099319458007812, 0.0353240966796875, 0.03954887390136719, 0.043773651123046875, 0.04799842834472656, 0.05222320556640625, 0.05644798278808594, 0.060672760009765625, 0.06489753723144531, 0.069122314453125, 0.07334709167480469, 0.07757186889648438, 0.08179664611816406, 0.08602142333984375, 0.09024620056152344, 0.09447097778320312, 0.09869575500488281, 0.1029205322265625, 0.10714530944824219, 0.11137008666992188, 0.11559486389160156, 0.11981964111328125, 0.12404441833496094, 0.12826919555664062, 0.1324939727783203, 0.13671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 15.0, 15.0, 18.0, 24.0, 43.0, 54.0, 90.0, 134.0, 145.0, 115.0, 104.0, 67.0, 56.0, 35.0, 26.0, 19.0, 9.0, 6.0, 6.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.334087371826172e-05, -8.860230445861816e-05, -8.386373519897461e-05, -7.912516593933105e-05, -7.43865966796875e-05, -6.964802742004395e-05, -6.490945816040039e-05, -6.0170888900756836e-05, -5.543231964111328e-05, -5.0693750381469727e-05, -4.595518112182617e-05, -4.121661186218262e-05, -3.647804260253906e-05, -3.173947334289551e-05, -2.7000904083251953e-05, -2.22623348236084e-05, -1.7523765563964844e-05, -1.2785196304321289e-05, -8.046627044677734e-06, -3.3080577850341797e-06, 1.430511474609375e-06, 6.16908073425293e-06, 1.0907649993896484e-05, 1.564621925354004e-05, 2.0384788513183594e-05, 2.512335777282715e-05, 2.9861927032470703e-05, 3.460049629211426e-05, 3.933906555175781e-05, 4.407763481140137e-05, 4.881620407104492e-05, 5.3554773330688477e-05, 5.829334259033203e-05, 6.303191184997559e-05, 6.777048110961914e-05, 7.25090503692627e-05, 7.724761962890625e-05, 8.19861888885498e-05, 8.672475814819336e-05, 9.146332740783691e-05, 9.620189666748047e-05, 0.00010094046592712402, 0.00010567903518676758, 0.00011041760444641113, 0.00011515617370605469, 0.00011989474296569824, 0.0001246333122253418, 0.00012937188148498535, 0.0001341104507446289, 0.00013884902000427246, 0.00014358758926391602, 0.00014832615852355957, 0.00015306472778320312, 0.00015780329704284668, 0.00016254186630249023, 0.0001672804355621338, 0.00017201900482177734, 0.0001767575740814209, 0.00018149614334106445, 0.000186234712600708, 0.00019097328186035156, 0.00019571185111999512, 0.00020045042037963867, 0.00020518898963928223, 0.00020992755889892578]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 6.0, 11.0, 15.0, 10.0, 9.0, 16.0, 24.0, 28.0, 36.0, 57.0, 77.0, 129.0, 243.0, 534.0, 1268.0, 4109.0, 17168.0, 97396.0, 495578.0, 356024.0, 59647.0, 11339.0, 2921.0, 927.0, 388.0, 200.0, 127.0, 73.0, 48.0, 27.0, 33.0, 19.0, 13.0, 14.0, 7.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2406005859375, -0.2328052520751953, -0.22500991821289062, -0.21721458435058594, -0.20941925048828125, -0.20162391662597656, -0.19382858276367188, -0.1860332489013672, -0.1782379150390625, -0.1704425811767578, -0.16264724731445312, -0.15485191345214844, -0.14705657958984375, -0.13926124572753906, -0.13146591186523438, -0.12367057800292969, -0.115875244140625, -0.10807991027832031, -0.10028457641601562, -0.09248924255371094, -0.08469390869140625, -0.07689857482910156, -0.06910324096679688, -0.06130790710449219, -0.0535125732421875, -0.04571723937988281, -0.037921905517578125, -0.030126571655273438, -0.02233123779296875, -0.014535903930664062, -0.006740570068359375, 0.0010547637939453125, 0.00885009765625, 0.016645431518554688, 0.024440765380859375, 0.03223609924316406, 0.04003143310546875, 0.04782676696777344, 0.055622100830078125, 0.06341743469238281, 0.0712127685546875, 0.07900810241699219, 0.08680343627929688, 0.09459877014160156, 0.10239410400390625, 0.11018943786621094, 0.11798477172851562, 0.1257801055908203, 0.133575439453125, 0.1413707733154297, 0.14916610717773438, 0.15696144104003906, 0.16475677490234375, 0.17255210876464844, 0.18034744262695312, 0.1881427764892578, 0.1959381103515625, 0.2037334442138672, 0.21152877807617188, 0.21932411193847656, 0.22711944580078125, 0.23491477966308594, 0.24271011352539062, 0.2505054473876953, 0.25830078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 6.0, 5.0, 18.0, 15.0, 22.0, 22.0, 40.0, 43.0, 54.0, 66.0, 50.0, 75.0, 69.0, 73.0, 59.0, 53.0, 60.0, 47.0, 50.0, 36.0, 23.0, 25.0, 17.0, 14.0, 15.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03460693359375, -0.03331613540649414, -0.03202533721923828, -0.030734539031982422, -0.029443740844726562, -0.028152942657470703, -0.026862144470214844, -0.025571346282958984, -0.024280548095703125, -0.022989749908447266, -0.021698951721191406, -0.020408153533935547, -0.019117355346679688, -0.017826557159423828, -0.01653575897216797, -0.01524496078491211, -0.01395416259765625, -0.01266336441040039, -0.011372566223144531, -0.010081768035888672, -0.008790969848632812, -0.007500171661376953, -0.006209373474121094, -0.004918575286865234, -0.003627777099609375, -0.0023369789123535156, -0.0010461807250976562, 0.0002446174621582031, 0.0015354156494140625, 0.002826213836669922, 0.004117012023925781, 0.005407810211181641, 0.0066986083984375, 0.00798940658569336, 0.009280204772949219, 0.010571002960205078, 0.011861801147460938, 0.013152599334716797, 0.014443397521972656, 0.015734195709228516, 0.017024993896484375, 0.018315792083740234, 0.019606590270996094, 0.020897388458251953, 0.022188186645507812, 0.023478984832763672, 0.02476978302001953, 0.02606058120727539, 0.02735137939453125, 0.02864217758178711, 0.02993297576904297, 0.031223773956298828, 0.03251457214355469, 0.03380537033081055, 0.035096168518066406, 0.036386966705322266, 0.037677764892578125, 0.038968563079833984, 0.040259361267089844, 0.0415501594543457, 0.04284095764160156, 0.04413175582885742, 0.04542255401611328, 0.04671335220336914, 0.048004150390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 22.0, 29.0, 47.0, 66.0, 118.0, 154.0, 163.0, 118.0, 105.0, 59.0, 43.0, 28.0, 19.0, 13.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8371949195861816, -1.770077109336853, -1.702959418296814, -1.6358416080474854, -1.5687239170074463, -1.5016061067581177, -1.434488296508789, -1.36737060546875, -1.3002527952194214, -1.2331349849700928, -1.1660172939300537, -1.098899483680725, -1.0317816734313965, -0.9646639823913574, -0.8975461721420288, -0.830428421497345, -0.7633106708526611, -0.6961929202079773, -0.6290751695632935, -0.5619573593139648, -0.494839608669281, -0.42772185802459717, -0.36060407757759094, -0.2934862971305847, -0.22636854648590088, -0.15925078094005585, -0.09213301539421082, -0.025015249848365784, 0.04210251569747925, 0.10922026634216309, 0.1763380467891693, 0.24345582723617554, 0.3105735778808594, 0.3776913285255432, 0.44480910897254944, 0.5119268894195557, 0.5790446400642395, 0.6461623907089233, 0.713280200958252, 0.7803979516029358, 0.8475157022476196, 0.9146334528923035, 0.9817512035369873, 1.048869013786316, 1.1159868240356445, 1.1831045150756836, 1.2502223253250122, 1.3173401355743408, 1.3844578266143799, 1.4515756368637085, 1.5186933279037476, 1.5858111381530762, 1.6529288291931152, 1.7200466394424438, 1.7871644496917725, 1.8542821407318115, 1.9213999509811401, 1.9885177612304688, 2.055635452270508, 2.122753143310547, 2.189871072769165, 2.256988763809204, 2.324106454849243, 2.3912243843078613, 2.4583420753479004]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 9.0, 7.0, 13.0, 12.0, 16.0, 13.0, 28.0, 27.0, 28.0, 31.0, 25.0, 47.0, 42.0, 48.0, 64.0, 55.0, 44.0, 30.0, 37.0, 49.0, 53.0, 48.0, 41.0, 34.0, 30.0, 29.0, 17.0, 32.0, 20.0, 13.0, 19.0, 11.0, 10.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0645387172698975, -1.0363905429840088, -1.0082424879074097, -0.9800943732261658, -0.9519462585449219, -0.923798143863678, -0.8956500291824341, -0.8675018548965454, -0.8393537998199463, -0.8112056851387024, -0.7830575704574585, -0.7549094557762146, -0.7267613410949707, -0.6986132264137268, -0.6704651117324829, -0.6423169374465942, -0.6141688227653503, -0.5860207080841064, -0.5578725934028625, -0.5297244787216187, -0.5015763640403748, -0.47342824935913086, -0.4452801048755646, -0.4171319901943207, -0.3889838755130768, -0.3608357608318329, -0.332687646150589, -0.3045395016670227, -0.2763913869857788, -0.2482432872056961, -0.22009515762329102, -0.19194704294204712, -0.16379886865615845, -0.13565075397491455, -0.10750263184309006, -0.07935450971126556, -0.05120639503002167, -0.02305828034877777, 0.005089849233627319, 0.033237963914871216, 0.06138607859611511, 0.08953419327735901, 0.1176823154091835, 0.145830437541008, 0.1739785522222519, 0.2021266669034958, 0.23027479648590088, 0.2584229111671448, 0.28657102584838867, 0.31471914052963257, 0.34286725521087646, 0.37101536989212036, 0.39916348457336426, 0.42731159925460815, 0.45545974373817444, 0.48360785841941833, 0.5117559432983398, 0.5399040579795837, 0.5680521726608276, 0.5962002873420715, 0.6243484020233154, 0.6524965167045593, 0.6806446313858032, 0.7087928056716919, 0.7369409203529358]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 17.0, 16.0, 29.0, 67.0, 144.0, 344.0, 871.0, 2515.0, 9087.0, 44085.0, 348635.0, 563134.0, 62600.0, 12135.0, 3125.0, 1034.0, 375.0, 155.0, 72.0, 41.0, 22.0, 13.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.29473876953125, -1.2486572265625, -1.20257568359375, -1.156494140625, -1.11041259765625, -1.0643310546875, -1.01824951171875, -0.97216796875, -0.92608642578125, -0.8800048828125, -0.83392333984375, -0.787841796875, -0.74176025390625, -0.6956787109375, -0.64959716796875, -0.603515625, -0.55743408203125, -0.5113525390625, -0.46527099609375, -0.419189453125, -0.37310791015625, -0.3270263671875, -0.28094482421875, -0.23486328125, -0.18878173828125, -0.1427001953125, -0.09661865234375, -0.050537109375, -0.00445556640625, 0.0416259765625, 0.08770751953125, 0.1337890625, 0.17987060546875, 0.2259521484375, 0.27203369140625, 0.318115234375, 0.36419677734375, 0.4102783203125, 0.45635986328125, 0.50244140625, 0.54852294921875, 0.5946044921875, 0.64068603515625, 0.686767578125, 0.73284912109375, 0.7789306640625, 0.82501220703125, 0.87109375, 0.91717529296875, 0.9632568359375, 1.00933837890625, 1.055419921875, 1.10150146484375, 1.1475830078125, 1.19366455078125, 1.23974609375, 1.28582763671875, 1.3319091796875, 1.37799072265625, 1.424072265625, 1.47015380859375, 1.5162353515625, 1.56231689453125, 1.6083984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 5.0, 13.0, 15.0, 14.0, 21.0, 24.0, 29.0, 20.0, 31.0, 27.0, 37.0, 45.0, 46.0, 59.0, 44.0, 55.0, 50.0, 48.0, 43.0, 45.0, 56.0, 28.0, 27.0, 19.0, 37.0, 23.0, 27.0, 21.0, 16.0, 11.0, 11.0, 7.0, 5.0, 8.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.48046875, -2.4150238037109375, -2.349578857421875, -2.2841339111328125, -2.21868896484375, -2.1532440185546875, -2.087799072265625, -2.0223541259765625, -1.9569091796875, -1.8914642333984375, -1.826019287109375, -1.7605743408203125, -1.69512939453125, -1.6296844482421875, -1.564239501953125, -1.4987945556640625, -1.433349609375, -1.3679046630859375, -1.302459716796875, -1.2370147705078125, -1.17156982421875, -1.1061248779296875, -1.040679931640625, -0.9752349853515625, -0.9097900390625, -0.8443450927734375, -0.778900146484375, -0.7134552001953125, -0.64801025390625, -0.5825653076171875, -0.517120361328125, -0.4516754150390625, -0.38623046875, -0.3207855224609375, -0.255340576171875, -0.1898956298828125, -0.12445068359375, -0.0590057373046875, 0.006439208984375, 0.0718841552734375, 0.1373291015625, 0.2027740478515625, 0.268218994140625, 0.3336639404296875, 0.39910888671875, 0.4645538330078125, 0.529998779296875, 0.5954437255859375, 0.660888671875, 0.7263336181640625, 0.791778564453125, 0.8572235107421875, 0.92266845703125, 0.9881134033203125, 1.053558349609375, 1.1190032958984375, 1.1844482421875, 1.2498931884765625, 1.315338134765625, 1.3807830810546875, 1.44622802734375, 1.5116729736328125, 1.577117919921875, 1.6425628662109375, 1.7080078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 8.0, 10.0, 13.0, 18.0, 23.0, 26.0, 36.0, 40.0, 47.0, 62.0, 65.0, 110.0, 2177.0, 1044149.0, 1311.0, 93.0, 55.0, 61.0, 52.0, 38.0, 36.0, 36.0, 16.0, 12.0, 14.0, 12.0, 10.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.640625, -14.249755859375, -13.85888671875, -13.468017578125, -13.0771484375, -12.686279296875, -12.29541015625, -11.904541015625, -11.513671875, -11.122802734375, -10.73193359375, -10.341064453125, -9.9501953125, -9.559326171875, -9.16845703125, -8.777587890625, -8.38671875, -7.995849609375, -7.60498046875, -7.214111328125, -6.8232421875, -6.432373046875, -6.04150390625, -5.650634765625, -5.259765625, -4.868896484375, -4.47802734375, -4.087158203125, -3.6962890625, -3.305419921875, -2.91455078125, -2.523681640625, -2.1328125, -1.741943359375, -1.35107421875, -0.960205078125, -0.5693359375, -0.178466796875, 0.21240234375, 0.603271484375, 0.994140625, 1.385009765625, 1.77587890625, 2.166748046875, 2.5576171875, 2.948486328125, 3.33935546875, 3.730224609375, 4.12109375, 4.511962890625, 4.90283203125, 5.293701171875, 5.6845703125, 6.075439453125, 6.46630859375, 6.857177734375, 7.248046875, 7.638916015625, 8.02978515625, 8.420654296875, 8.8115234375, 9.202392578125, 9.59326171875, 9.984130859375, 10.375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 8.0, 19.0, 24.0, 21.0, 31.0, 42.0, 27.0, 51.0, 60.0, 51.0, 61.0, 52.0, 60.0, 61.0, 50.0, 64.0, 49.0, 47.0, 36.0, 44.0, 26.0, 25.0, 11.0, 16.0, 11.0, 11.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.228515625, -3.14202880859375, -3.0555419921875, -2.96905517578125, -2.882568359375, -2.79608154296875, -2.7095947265625, -2.62310791015625, -2.53662109375, -2.45013427734375, -2.3636474609375, -2.27716064453125, -2.190673828125, -2.10418701171875, -2.0177001953125, -1.93121337890625, -1.8447265625, -1.75823974609375, -1.6717529296875, -1.58526611328125, -1.498779296875, -1.41229248046875, -1.3258056640625, -1.23931884765625, -1.15283203125, -1.06634521484375, -0.9798583984375, -0.89337158203125, -0.806884765625, -0.72039794921875, -0.6339111328125, -0.54742431640625, -0.4609375, -0.37445068359375, -0.2879638671875, -0.20147705078125, -0.114990234375, -0.02850341796875, 0.0579833984375, 0.14447021484375, 0.23095703125, 0.31744384765625, 0.4039306640625, 0.49041748046875, 0.576904296875, 0.66339111328125, 0.7498779296875, 0.83636474609375, 0.9228515625, 1.00933837890625, 1.0958251953125, 1.18231201171875, 1.268798828125, 1.35528564453125, 1.4417724609375, 1.52825927734375, 1.61474609375, 1.70123291015625, 1.7877197265625, 1.87420654296875, 1.960693359375, 2.04718017578125, 2.1336669921875, 2.22015380859375, 2.306640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 7.0, 7.0, 8.0, 10.0, 26.0, 32.0, 36.0, 43.0, 72.0, 132.0, 206.0, 459.0, 1139.0, 2995.0, 11154.0, 127677.0, 859749.0, 35227.0, 6117.0, 1901.0, 732.0, 331.0, 164.0, 91.0, 50.0, 47.0, 30.0, 20.0, 18.0, 19.0, 8.0, 6.0, 5.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8857421875, -0.8564987182617188, -0.8272552490234375, -0.7980117797851562, -0.768768310546875, -0.7395248413085938, -0.7102813720703125, -0.6810379028320312, -0.65179443359375, -0.6225509643554688, -0.5933074951171875, -0.5640640258789062, -0.534820556640625, -0.5055770874023438, -0.4763336181640625, -0.44709014892578125, -0.4178466796875, -0.38860321044921875, -0.3593597412109375, -0.33011627197265625, -0.300872802734375, -0.27162933349609375, -0.2423858642578125, -0.21314239501953125, -0.18389892578125, -0.15465545654296875, -0.1254119873046875, -0.09616851806640625, -0.066925048828125, -0.03768157958984375, -0.0084381103515625, 0.02080535888671875, 0.050048828125, 0.07929229736328125, 0.1085357666015625, 0.13777923583984375, 0.167022705078125, 0.19626617431640625, 0.2255096435546875, 0.25475311279296875, 0.28399658203125, 0.31324005126953125, 0.3424835205078125, 0.37172698974609375, 0.400970458984375, 0.43021392822265625, 0.4594573974609375, 0.48870086669921875, 0.5179443359375, 0.5471878051757812, 0.5764312744140625, 0.6056747436523438, 0.634918212890625, 0.6641616821289062, 0.6934051513671875, 0.7226486206054688, 0.75189208984375, 0.7811355590820312, 0.8103790283203125, 0.8396224975585938, 0.868865966796875, 0.8981094360351562, 0.9273529052734375, 0.9565963745117188, 0.98583984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 9.0, 13.0, 24.0, 34.0, 67.0, 170.0, 280.0, 187.0, 90.0, 35.0, 22.0, 9.0, 7.0, 6.0, 9.0, 1.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012004375457763672, -0.00011597760021686554, -0.00011191144585609436, -0.00010784529149532318, -0.000103779137134552, -9.971298277378082e-05, -9.564682841300964e-05, -9.158067405223846e-05, -8.751451969146729e-05, -8.34483653306961e-05, -7.938221096992493e-05, -7.531605660915375e-05, -7.124990224838257e-05, -6.718374788761139e-05, -6.311759352684021e-05, -5.905143916606903e-05, -5.498528480529785e-05, -5.091913044452667e-05, -4.685297608375549e-05, -4.2786821722984314e-05, -3.8720667362213135e-05, -3.4654513001441956e-05, -3.0588358640670776e-05, -2.6522204279899597e-05, -2.2456049919128418e-05, -1.838989555835724e-05, -1.432374119758606e-05, -1.025758683681488e-05, -6.191432476043701e-06, -2.125278115272522e-06, 1.9408762454986572e-06, 6.0070306062698364e-06, 1.0073184967041016e-05, 1.4139339327812195e-05, 1.8205493688583374e-05, 2.2271648049354553e-05, 2.6337802410125732e-05, 3.040395677089691e-05, 3.447011113166809e-05, 3.853626549243927e-05, 4.260241985321045e-05, 4.666857421398163e-05, 5.073472857475281e-05, 5.480088293552399e-05, 5.8867037296295166e-05, 6.293319165706635e-05, 6.699934601783752e-05, 7.10655003786087e-05, 7.513165473937988e-05, 7.919780910015106e-05, 8.326396346092224e-05, 8.733011782169342e-05, 9.13962721824646e-05, 9.546242654323578e-05, 9.952858090400696e-05, 0.00010359473526477814, 0.00010766088962554932, 0.0001117270439863205, 0.00011579319834709167, 0.00011985935270786285, 0.00012392550706863403, 0.0001279916614294052, 0.0001320578157901764, 0.00013612397015094757, 0.00014019012451171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 20.0, 38.0, 59.0, 99.0, 248.0, 621.0, 2089.0, 10859.0, 208391.0, 800501.0, 20892.0, 3223.0, 846.0, 327.0, 148.0, 77.0, 42.0, 19.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.1592559814453125, -1.123199462890625, -1.0871429443359375, -1.05108642578125, -1.0150299072265625, -0.978973388671875, -0.9429168701171875, -0.9068603515625, -0.8708038330078125, -0.834747314453125, -0.7986907958984375, -0.76263427734375, -0.7265777587890625, -0.690521240234375, -0.6544647216796875, -0.618408203125, -0.5823516845703125, -0.546295166015625, -0.5102386474609375, -0.47418212890625, -0.4381256103515625, -0.402069091796875, -0.3660125732421875, -0.3299560546875, -0.2938995361328125, -0.257843017578125, -0.2217864990234375, -0.18572998046875, -0.1496734619140625, -0.113616943359375, -0.0775604248046875, -0.04150390625, -0.0054473876953125, 0.030609130859375, 0.0666656494140625, 0.10272216796875, 0.1387786865234375, 0.174835205078125, 0.2108917236328125, 0.2469482421875, 0.2830047607421875, 0.319061279296875, 0.3551177978515625, 0.39117431640625, 0.4272308349609375, 0.463287353515625, 0.4993438720703125, 0.535400390625, 0.5714569091796875, 0.607513427734375, 0.6435699462890625, 0.67962646484375, 0.7156829833984375, 0.751739501953125, 0.7877960205078125, 0.8238525390625, 0.8599090576171875, 0.895965576171875, 0.9320220947265625, 0.96807861328125, 1.0041351318359375, 1.040191650390625, 1.0762481689453125, 1.1123046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 9.0, 15.0, 14.0, 17.0, 29.0, 33.0, 68.0, 104.0, 234.0, 220.0, 92.0, 53.0, 42.0, 23.0, 13.0, 7.0, 9.0, 6.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.4277763366699219, -0.41585540771484375, -0.4039344787597656, -0.3920135498046875, -0.3800926208496094, -0.36817169189453125, -0.3562507629394531, -0.344329833984375, -0.3324089050292969, -0.32048797607421875, -0.3085670471191406, -0.2966461181640625, -0.2847251892089844, -0.27280426025390625, -0.2608833312988281, -0.24896240234375, -0.23704147338867188, -0.22512054443359375, -0.21319961547851562, -0.2012786865234375, -0.18935775756835938, -0.17743682861328125, -0.16551589965820312, -0.153594970703125, -0.14167404174804688, -0.12975311279296875, -0.11783218383789062, -0.1059112548828125, -0.09399032592773438, -0.08206939697265625, -0.07014846801757812, -0.0582275390625, -0.046306610107421875, -0.03438568115234375, -0.022464752197265625, -0.0105438232421875, 0.001377105712890625, 0.01329803466796875, 0.025218963623046875, 0.037139892578125, 0.049060821533203125, 0.06098175048828125, 0.07290267944335938, 0.0848236083984375, 0.09674453735351562, 0.10866546630859375, 0.12058639526367188, 0.13250732421875, 0.14442825317382812, 0.15634918212890625, 0.16827011108398438, 0.1801910400390625, 0.19211196899414062, 0.20403289794921875, 0.21595382690429688, 0.227874755859375, 0.23979568481445312, 0.25171661376953125, 0.2636375427246094, 0.2755584716796875, 0.2874794006347656, 0.29940032958984375, 0.3113212585449219, 0.3232421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 15.0, 26.0, 71.0, 114.0, 199.0, 215.0, 164.0, 111.0, 50.0, 27.0, 9.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.747708559036255, -2.5428552627563477, -2.3380017280578613, -2.133148431777954, -1.9282951354980469, -1.72344172000885, -1.5185883045196533, -1.313735008239746, -1.1088815927505493, -0.9040282368659973, -0.6991748809814453, -0.49432146549224854, -0.28946810960769653, -0.08461475372314453, 0.12023866176605225, 0.3250919580459595, 0.5299453735351562, 0.7347987294197083, 0.9396520853042603, 1.144505500793457, 1.3493587970733643, 1.554212212562561, 1.7590656280517578, 1.963918924331665, 2.1687722206115723, 2.3736255168914795, 2.578479051589966, 2.783332347869873, 2.9881856441497803, 3.1930389404296875, 3.397892475128174, 3.602745771408081, 3.8075995445251465, 4.012453079223633, 4.217306137084961, 4.422159671783447, 4.627013206481934, 4.831866264343262, 5.036719799041748, 5.241573333740234, 5.4464263916015625, 5.651279926300049, 5.856132984161377, 6.060986518859863, 6.26584005355835, 6.470693111419678, 6.675546646118164, 6.880399703979492, 7.085253715515137, 7.290107250213623, 7.494960308074951, 7.6998138427734375, 7.904667377471924, 8.10952091217041, 8.314373970031738, 8.519227027893066, 8.724080085754395, 8.928933143615723, 9.133787155151367, 9.338640213012695, 9.543493270874023, 9.748347282409668, 9.953200340270996, 10.158053398132324, 10.362907409667969]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 6.0, 8.0, 9.0, 9.0, 6.0, 16.0, 18.0, 14.0, 20.0, 24.0, 30.0, 32.0, 26.0, 28.0, 43.0, 33.0, 40.0, 41.0, 43.0, 47.0, 44.0, 32.0, 43.0, 39.0, 41.0, 36.0, 28.0, 36.0, 22.0, 26.0, 31.0, 22.0, 20.0, 10.0, 13.0, 11.0, 11.0, 8.0, 12.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.525723457336426, -2.4319987297058105, -2.338273763656616, -2.244549036026001, -2.1508243083953857, -2.0570995807647705, -1.9633746147155762, -1.869649887084961, -1.7759251594543457, -1.682200312614441, -1.5884755849838257, -1.494750738143921, -1.4010260105133057, -1.3073011636734009, -1.213576316833496, -1.1198515892028809, -1.026126742362976, -0.9324019551277161, -0.838677167892456, -0.7449523210525513, -0.651227593421936, -0.5575027465820312, -0.46377795934677124, -0.37005317211151123, -0.2763283848762512, -0.1826035976409912, -0.08887879550457001, 0.004846006631851196, 0.0985707938671112, 0.19229558110237122, 0.2860203981399536, 0.3797451853752136, 0.47346997261047363, 0.5671947598457336, 0.6609195470809937, 0.7546443939208984, 0.8483691215515137, 0.9420939683914185, 1.0358188152313232, 1.1295435428619385, 1.2232682704925537, 1.3169931173324585, 1.4107178449630737, 1.5044426918029785, 1.5981674194335938, 1.6918922662734985, 1.7856171131134033, 1.8793418407440186, 1.9730666875839233, 2.066791534423828, 2.1605162620544434, 2.2542409896850586, 2.347965955734253, 2.441690683364868, 2.5354154109954834, 2.6291403770446777, 2.722865104675293, 2.816589832305908, 2.9103147983551025, 3.0040395259857178, 3.097764253616333, 3.1914889812469482, 3.2852139472961426, 3.378938674926758, 3.472663402557373]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 4.0, 7.0, 16.0, 15.0, 29.0, 20.0, 44.0, 49.0, 58.0, 101.0, 159.0, 320.0, 661.0, 1507.0, 4252.0, 15752.0, 96677.0, 906842.0, 2466325.0, 614956.0, 67528.0, 12890.0, 3449.0, 1323.0, 514.0, 277.0, 146.0, 104.0, 54.0, 51.0, 33.0, 27.0, 17.0, 12.0, 13.0, 6.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-2.537109375, -2.4654541015625, -2.393798828125, -2.3221435546875, -2.25048828125, -2.1788330078125, -2.107177734375, -2.0355224609375, -1.9638671875, -1.8922119140625, -1.820556640625, -1.7489013671875, -1.67724609375, -1.6055908203125, -1.533935546875, -1.4622802734375, -1.390625, -1.3189697265625, -1.247314453125, -1.1756591796875, -1.10400390625, -1.0323486328125, -0.960693359375, -0.8890380859375, -0.8173828125, -0.7457275390625, -0.674072265625, -0.6024169921875, -0.53076171875, -0.4591064453125, -0.387451171875, -0.3157958984375, -0.244140625, -0.1724853515625, -0.100830078125, -0.0291748046875, 0.04248046875, 0.1141357421875, 0.185791015625, 0.2574462890625, 0.3291015625, 0.4007568359375, 0.472412109375, 0.5440673828125, 0.61572265625, 0.6873779296875, 0.759033203125, 0.8306884765625, 0.90234375, 0.9739990234375, 1.045654296875, 1.1173095703125, 1.18896484375, 1.2606201171875, 1.332275390625, 1.4039306640625, 1.4755859375, 1.5472412109375, 1.618896484375, 1.6905517578125, 1.76220703125, 1.8338623046875, 1.905517578125, 1.9771728515625, 2.048828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 7.0, 7.0, 18.0, 10.0, 16.0, 16.0, 16.0, 28.0, 33.0, 27.0, 44.0, 48.0, 42.0, 45.0, 49.0, 56.0, 49.0, 54.0, 39.0, 41.0, 59.0, 46.0, 43.0, 33.0, 29.0, 23.0, 28.0, 19.0, 16.0, 11.0, 14.0, 9.0, 6.0, 7.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4609375, -1.4176788330078125, -1.374420166015625, -1.3311614990234375, -1.28790283203125, -1.2446441650390625, -1.201385498046875, -1.1581268310546875, -1.1148681640625, -1.0716094970703125, -1.028350830078125, -0.9850921630859375, -0.94183349609375, -0.8985748291015625, -0.855316162109375, -0.8120574951171875, -0.768798828125, -0.7255401611328125, -0.682281494140625, -0.6390228271484375, -0.59576416015625, -0.5525054931640625, -0.509246826171875, -0.4659881591796875, -0.4227294921875, -0.3794708251953125, -0.336212158203125, -0.2929534912109375, -0.24969482421875, -0.2064361572265625, -0.163177490234375, -0.1199188232421875, -0.07666015625, -0.0334014892578125, 0.009857177734375, 0.0531158447265625, 0.09637451171875, 0.1396331787109375, 0.182891845703125, 0.2261505126953125, 0.2694091796875, 0.3126678466796875, 0.355926513671875, 0.3991851806640625, 0.44244384765625, 0.4857025146484375, 0.528961181640625, 0.5722198486328125, 0.615478515625, 0.6587371826171875, 0.701995849609375, 0.7452545166015625, 0.78851318359375, 0.8317718505859375, 0.875030517578125, 0.9182891845703125, 0.9615478515625, 1.0048065185546875, 1.048065185546875, 1.0913238525390625, 1.13458251953125, 1.1778411865234375, 1.221099853515625, 1.2643585205078125, 1.3076171875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 20.0, 38.0, 57.0, 104.0, 159.0, 385.0, 2090.0, 138848.0, 4035556.0, 15477.0, 1028.0, 255.0, 104.0, 52.0, 27.0, 21.0, 17.0, 9.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.20367431640625, -7.9776611328125, -7.75164794921875, -7.525634765625, -7.29962158203125, -7.0736083984375, -6.84759521484375, -6.62158203125, -6.39556884765625, -6.1695556640625, -5.94354248046875, -5.717529296875, -5.49151611328125, -5.2655029296875, -5.03948974609375, -4.8134765625, -4.58746337890625, -4.3614501953125, -4.13543701171875, -3.909423828125, -3.68341064453125, -3.4573974609375, -3.23138427734375, -3.00537109375, -2.77935791015625, -2.5533447265625, -2.32733154296875, -2.101318359375, -1.87530517578125, -1.6492919921875, -1.42327880859375, -1.197265625, -0.97125244140625, -0.7452392578125, -0.51922607421875, -0.293212890625, -0.06719970703125, 0.1588134765625, 0.38482666015625, 0.61083984375, 0.83685302734375, 1.0628662109375, 1.28887939453125, 1.514892578125, 1.74090576171875, 1.9669189453125, 2.19293212890625, 2.4189453125, 2.64495849609375, 2.8709716796875, 3.09698486328125, 3.322998046875, 3.54901123046875, 3.7750244140625, 4.00103759765625, 4.22705078125, 4.45306396484375, 4.6790771484375, 4.90509033203125, 5.131103515625, 5.35711669921875, 5.5831298828125, 5.80914306640625, 6.03515625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 12.0, 11.0, 19.0, 10.0, 35.0, 42.0, 62.0, 99.0, 175.0, 236.0, 408.0, 574.0, 613.0, 595.0, 383.0, 228.0, 174.0, 99.0, 85.0, 59.0, 34.0, 29.0, 24.0, 21.0, 7.0, 12.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.8028106689453125, -0.781402587890625, -0.7599945068359375, -0.73858642578125, -0.7171783447265625, -0.695770263671875, -0.6743621826171875, -0.6529541015625, -0.6315460205078125, -0.610137939453125, -0.5887298583984375, -0.56732177734375, -0.5459136962890625, -0.524505615234375, -0.5030975341796875, -0.481689453125, -0.4602813720703125, -0.438873291015625, -0.4174652099609375, -0.39605712890625, -0.3746490478515625, -0.353240966796875, -0.3318328857421875, -0.3104248046875, -0.2890167236328125, -0.267608642578125, -0.2462005615234375, -0.22479248046875, -0.2033843994140625, -0.181976318359375, -0.1605682373046875, -0.13916015625, -0.1177520751953125, -0.096343994140625, -0.0749359130859375, -0.05352783203125, -0.0321197509765625, -0.010711669921875, 0.0106964111328125, 0.0321044921875, 0.0535125732421875, 0.074920654296875, 0.0963287353515625, 0.11773681640625, 0.1391448974609375, 0.160552978515625, 0.1819610595703125, 0.203369140625, 0.2247772216796875, 0.246185302734375, 0.2675933837890625, 0.28900146484375, 0.3104095458984375, 0.331817626953125, 0.3532257080078125, 0.3746337890625, 0.3960418701171875, 0.417449951171875, 0.4388580322265625, 0.46026611328125, 0.4816741943359375, 0.503082275390625, 0.5244903564453125, 0.5458984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 8.0, 7.0, 10.0, 11.0, 19.0, 25.0, 49.0, 55.0, 64.0, 77.0, 91.0, 95.0, 96.0, 82.0, 79.0, 54.0, 39.0, 43.0, 22.0, 29.0, 12.0, 8.0, 9.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.056018829345703, -1.9849971532821655, -1.913975477218628, -1.8429536819458008, -1.7719320058822632, -1.7009103298187256, -1.6298885345458984, -1.5588668584823608, -1.4878451824188232, -1.4168235063552856, -1.345801830291748, -1.274780035018921, -1.2037583589553833, -1.1327366828918457, -1.0617148876190186, -0.990693211555481, -0.9196715354919434, -0.8486498594284058, -0.7776281237602234, -0.706606388092041, -0.6355847120285034, -0.5645630359649658, -0.49354130029678345, -0.42251959443092346, -0.3514978885650635, -0.2804761826992035, -0.2094544768333435, -0.13843277096748352, -0.06741106510162354, 0.00361064076423645, 0.07463234663009644, 0.14565405249595642, 0.2166755199432373, 0.2876972258090973, 0.3587189316749573, 0.42974063754081726, 0.5007623434066772, 0.5717840194702148, 0.6428057551383972, 0.7138274908065796, 0.7848491668701172, 0.8558708429336548, 0.9268925786018372, 0.9979143142700195, 1.0689359903335571, 1.1399576663970947, 1.2109794616699219, 1.2820011377334595, 1.353022813796997, 1.4240444898605347, 1.4950661659240723, 1.5660879611968994, 1.637109637260437, 1.7081313133239746, 1.7791531085968018, 1.8501747846603394, 1.921196460723877, 1.9922181367874146, 2.063239812850952, 2.1342616081237793, 2.2052831649780273, 2.2763049602508545, 2.3473267555236816, 2.4183483123779297, 2.489370107650757]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 8.0, 8.0, 11.0, 13.0, 10.0, 19.0, 18.0, 21.0, 21.0, 38.0, 30.0, 30.0, 37.0, 30.0, 36.0, 49.0, 37.0, 48.0, 36.0, 27.0, 34.0, 36.0, 44.0, 40.0, 35.0, 49.0, 20.0, 33.0, 30.0, 15.0, 22.0, 20.0, 11.0, 12.0, 16.0, 11.0, 7.0, 10.0, 5.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.21942138671875, -1.1815359592437744, -1.1436506509780884, -1.1057652235031128, -1.0678799152374268, -1.0299944877624512, -0.9921091198921204, -0.9542237520217896, -0.9163383841514587, -0.8784530162811279, -0.8405676484107971, -0.8026822805404663, -0.7647968530654907, -0.7269115447998047, -0.6890261173248291, -0.6511407494544983, -0.6132553815841675, -0.5753700137138367, -0.5374846458435059, -0.49959924817085266, -0.46171388030052185, -0.42382851243019104, -0.38594311475753784, -0.34805774688720703, -0.3101723790168762, -0.2722870111465454, -0.2344016283750534, -0.1965162456035614, -0.1586308777332306, -0.12074550986289978, -0.08286012709140778, -0.04497474431991577, -0.007089376449584961, 0.030795998871326447, 0.06868137419223785, 0.10656674951314926, 0.14445212483406067, 0.18233749270439148, 0.22022287547588348, 0.2581082582473755, 0.2959936261177063, 0.3338789939880371, 0.3717643618583679, 0.4096497595310211, 0.44753512740135193, 0.48542049527168274, 0.5233058929443359, 0.5611912608146667, 0.5990766286849976, 0.6369619965553284, 0.6748473644256592, 0.71273273229599, 0.7506181001663208, 0.7885035276412964, 0.8263888955116272, 0.864274263381958, 0.9021596312522888, 0.9400449991226196, 0.9779303669929504, 1.0158157348632812, 1.0537011623382568, 1.0915864706039429, 1.1294718980789185, 1.1673572063446045, 1.20524263381958]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 14.0, 5.0, 11.0, 12.0, 16.0, 25.0, 41.0, 68.0, 103.0, 217.0, 350.0, 933.0, 2190.0, 7112.0, 29072.0, 153614.0, 527577.0, 262042.0, 48688.0, 11031.0, 3182.0, 1213.0, 475.0, 217.0, 123.0, 70.0, 41.0, 23.0, 22.0, 10.0, 10.0, 11.0, 2.0, 3.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0], "bins": [-0.9111328125, -0.8887252807617188, -0.8663177490234375, -0.8439102172851562, -0.821502685546875, -0.7990951538085938, -0.7766876220703125, -0.7542800903320312, -0.73187255859375, -0.7094650268554688, -0.6870574951171875, -0.6646499633789062, -0.642242431640625, -0.6198348999023438, -0.5974273681640625, -0.5750198364257812, -0.5526123046875, -0.5302047729492188, -0.5077972412109375, -0.48538970947265625, -0.462982177734375, -0.44057464599609375, -0.4181671142578125, -0.39575958251953125, -0.37335205078125, -0.35094451904296875, -0.3285369873046875, -0.30612945556640625, -0.283721923828125, -0.26131439208984375, -0.2389068603515625, -0.21649932861328125, -0.194091796875, -0.17168426513671875, -0.1492767333984375, -0.12686920166015625, -0.104461669921875, -0.08205413818359375, -0.0596466064453125, -0.03723907470703125, -0.01483154296875, 0.00757598876953125, 0.0299835205078125, 0.05239105224609375, 0.074798583984375, 0.09720611572265625, 0.1196136474609375, 0.14202117919921875, 0.1644287109375, 0.18683624267578125, 0.2092437744140625, 0.23165130615234375, 0.254058837890625, 0.27646636962890625, 0.2988739013671875, 0.32128143310546875, 0.34368896484375, 0.36609649658203125, 0.3885040283203125, 0.41091156005859375, 0.433319091796875, 0.45572662353515625, 0.4781341552734375, 0.5005416870117188, 0.52294921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 7.0, 20.0, 21.0, 42.0, 41.0, 58.0, 75.0, 92.0, 96.0, 89.0, 112.0, 80.0, 82.0, 54.0, 46.0, 33.0, 29.0, 11.0, 10.0, 6.0, 0.0, 5.0, 2.0], "bins": [-2.63671875, -2.5844573974609375, -2.532196044921875, -2.4799346923828125, -2.42767333984375, -2.3754119873046875, -2.323150634765625, -2.2708892822265625, -2.2186279296875, -2.1663665771484375, -2.114105224609375, -2.0618438720703125, -2.00958251953125, -1.9573211669921875, -1.905059814453125, -1.8527984619140625, -1.800537109375, -1.7482757568359375, -1.696014404296875, -1.6437530517578125, -1.59149169921875, -1.5392303466796875, -1.486968994140625, -1.4347076416015625, -1.3824462890625, -1.3301849365234375, -1.277923583984375, -1.2256622314453125, -1.17340087890625, -1.1211395263671875, -1.068878173828125, -1.0166168212890625, -0.96435546875, -0.9120941162109375, -0.859832763671875, -0.8075714111328125, -0.75531005859375, -0.7030487060546875, -0.650787353515625, -0.5985260009765625, -0.5462646484375, -0.4940032958984375, -0.441741943359375, -0.3894805908203125, -0.33721923828125, -0.2849578857421875, -0.232696533203125, -0.1804351806640625, -0.128173828125, -0.0759124755859375, -0.023651123046875, 0.0286102294921875, 0.08087158203125, 0.1331329345703125, 0.185394287109375, 0.2376556396484375, 0.2899169921875, 0.3421783447265625, 0.394439697265625, 0.4467010498046875, 0.49896240234375, 0.5512237548828125, 0.603485107421875, 0.6557464599609375, 0.7080078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 6.0, 3.0, 7.0, 9.0, 11.0, 8.0, 20.0, 38.0, 34.0, 49.0, 92.0, 98.0, 166.0, 275.0, 481.0, 796.0, 1439.0, 2591.0, 5263.0, 11056.0, 25290.0, 60462.0, 141791.0, 264817.0, 270761.0, 149146.0, 63737.0, 26620.0, 11640.0, 5435.0, 2755.0, 1477.0, 819.0, 504.0, 293.0, 187.0, 107.0, 70.0, 61.0, 40.0, 24.0, 23.0, 14.0, 5.0, 8.0, 3.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.343994140625, -0.33358001708984375, -0.3231658935546875, -0.31275177001953125, -0.302337646484375, -0.29192352294921875, -0.2815093994140625, -0.27109527587890625, -0.26068115234375, -0.25026702880859375, -0.2398529052734375, -0.22943878173828125, -0.219024658203125, -0.20861053466796875, -0.1981964111328125, -0.18778228759765625, -0.1773681640625, -0.16695404052734375, -0.1565399169921875, -0.14612579345703125, -0.135711669921875, -0.12529754638671875, -0.1148834228515625, -0.10446929931640625, -0.09405517578125, -0.08364105224609375, -0.0732269287109375, -0.06281280517578125, -0.052398681640625, -0.04198455810546875, -0.0315704345703125, -0.02115631103515625, -0.0107421875, -0.00032806396484375, 0.0100860595703125, 0.02050018310546875, 0.030914306640625, 0.04132843017578125, 0.0517425537109375, 0.06215667724609375, 0.07257080078125, 0.08298492431640625, 0.0933990478515625, 0.10381317138671875, 0.114227294921875, 0.12464141845703125, 0.1350555419921875, 0.14546966552734375, 0.1558837890625, 0.16629791259765625, 0.1767120361328125, 0.18712615966796875, 0.197540283203125, 0.20795440673828125, 0.2183685302734375, 0.22878265380859375, 0.23919677734375, 0.24961090087890625, 0.2600250244140625, 0.27043914794921875, 0.280853271484375, 0.29126739501953125, 0.3016815185546875, 0.31209564208984375, 0.322509765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 2.0, 8.0, 6.0, 17.0, 11.0, 17.0, 27.0, 17.0, 36.0, 48.0, 71.0, 54.0, 67.0, 66.0, 72.0, 56.0, 65.0, 54.0, 54.0, 38.0, 40.0, 30.0, 21.0, 35.0, 18.0, 12.0, 13.0, 16.0, 3.0, 5.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8095703125, -1.7507476806640625, -1.691925048828125, -1.6331024169921875, -1.57427978515625, -1.5154571533203125, -1.456634521484375, -1.3978118896484375, -1.3389892578125, -1.2801666259765625, -1.221343994140625, -1.1625213623046875, -1.10369873046875, -1.0448760986328125, -0.986053466796875, -0.9272308349609375, -0.868408203125, -0.8095855712890625, -0.750762939453125, -0.6919403076171875, -0.63311767578125, -0.5742950439453125, -0.515472412109375, -0.4566497802734375, -0.3978271484375, -0.3390045166015625, -0.280181884765625, -0.2213592529296875, -0.16253662109375, -0.1037139892578125, -0.044891357421875, 0.0139312744140625, 0.07275390625, 0.1315765380859375, 0.190399169921875, 0.2492218017578125, 0.30804443359375, 0.3668670654296875, 0.425689697265625, 0.4845123291015625, 0.5433349609375, 0.6021575927734375, 0.660980224609375, 0.7198028564453125, 0.77862548828125, 0.8374481201171875, 0.896270751953125, 0.9550933837890625, 1.013916015625, 1.0727386474609375, 1.131561279296875, 1.1903839111328125, 1.24920654296875, 1.3080291748046875, 1.366851806640625, 1.4256744384765625, 1.4844970703125, 1.5433197021484375, 1.602142333984375, 1.6609649658203125, 1.71978759765625, 1.7786102294921875, 1.837432861328125, 1.8962554931640625, 1.955078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 6.0, 13.0, 9.0, 26.0, 28.0, 44.0, 58.0, 96.0, 134.0, 226.0, 388.0, 682.0, 1085.0, 2111.0, 3978.0, 8045.0, 17870.0, 43395.0, 116024.0, 290539.0, 326700.0, 143281.0, 52800.0, 21039.0, 9644.0, 4725.0, 2322.0, 1297.0, 750.0, 452.0, 265.0, 169.0, 101.0, 66.0, 52.0, 29.0, 29.0, 23.0, 12.0, 8.0, 5.0, 9.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10400390625, -0.10016632080078125, -0.0963287353515625, -0.09249114990234375, -0.088653564453125, -0.08481597900390625, -0.0809783935546875, -0.07714080810546875, -0.07330322265625, -0.06946563720703125, -0.0656280517578125, -0.06179046630859375, -0.057952880859375, -0.05411529541015625, -0.0502777099609375, -0.04644012451171875, -0.0426025390625, -0.03876495361328125, -0.0349273681640625, -0.03108978271484375, -0.027252197265625, -0.02341461181640625, -0.0195770263671875, -0.01573944091796875, -0.01190185546875, -0.00806427001953125, -0.0042266845703125, -0.00038909912109375, 0.003448486328125, 0.00728607177734375, 0.0111236572265625, 0.01496124267578125, 0.018798828125, 0.02263641357421875, 0.0264739990234375, 0.03031158447265625, 0.034149169921875, 0.03798675537109375, 0.0418243408203125, 0.04566192626953125, 0.04949951171875, 0.05333709716796875, 0.0571746826171875, 0.06101226806640625, 0.064849853515625, 0.06868743896484375, 0.0725250244140625, 0.07636260986328125, 0.0802001953125, 0.08403778076171875, 0.0878753662109375, 0.09171295166015625, 0.095550537109375, 0.09938812255859375, 0.1032257080078125, 0.10706329345703125, 0.11090087890625, 0.11473846435546875, 0.1185760498046875, 0.12241363525390625, 0.126251220703125, 0.13008880615234375, 0.1339263916015625, 0.13776397705078125, 0.1416015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 2.0, 5.0, 7.0, 10.0, 7.0, 17.0, 22.0, 34.0, 48.0, 63.0, 91.0, 92.0, 108.0, 88.0, 94.0, 74.0, 62.0, 50.0, 33.0, 23.0, 22.0, 16.0, 10.0, 4.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.745359420776367e-05, -9.451154619455338e-05, -9.156949818134308e-05, -8.862745016813278e-05, -8.568540215492249e-05, -8.274335414171219e-05, -7.980130612850189e-05, -7.68592581152916e-05, -7.39172101020813e-05, -7.0975162088871e-05, -6.80331140756607e-05, -6.509106606245041e-05, -6.214901804924011e-05, -5.9206970036029816e-05, -5.626492202281952e-05, -5.332287400960922e-05, -5.0380825996398926e-05, -4.743877798318863e-05, -4.449672996997833e-05, -4.1554681956768036e-05, -3.861263394355774e-05, -3.567058593034744e-05, -3.2728537917137146e-05, -2.978648990392685e-05, -2.6844441890716553e-05, -2.3902393877506256e-05, -2.096034586429596e-05, -1.8018297851085663e-05, -1.5076249837875366e-05, -1.213420182466507e-05, -9.192153811454773e-06, -6.250105798244476e-06, -3.3080577850341797e-06, -3.6600977182388306e-07, 2.5760382413864136e-06, 5.51808625459671e-06, 8.460134267807007e-06, 1.1402182281017303e-05, 1.43442302942276e-05, 1.7286278307437897e-05, 2.0228326320648193e-05, 2.317037433385849e-05, 2.6112422347068787e-05, 2.9054470360279083e-05, 3.199651837348938e-05, 3.4938566386699677e-05, 3.788061439990997e-05, 4.082266241312027e-05, 4.3764710426330566e-05, 4.670675843954086e-05, 4.964880645275116e-05, 5.2590854465961456e-05, 5.553290247917175e-05, 5.847495049238205e-05, 6.141699850559235e-05, 6.435904651880264e-05, 6.730109453201294e-05, 7.024314254522324e-05, 7.318519055843353e-05, 7.612723857164383e-05, 7.906928658485413e-05, 8.201133459806442e-05, 8.495338261127472e-05, 8.789543062448502e-05, 9.083747863769531e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 7.0, 9.0, 12.0, 25.0, 14.0, 23.0, 48.0, 53.0, 72.0, 157.0, 284.0, 601.0, 1377.0, 3568.0, 10683.0, 36506.0, 155950.0, 514478.0, 246712.0, 54585.0, 15022.0, 4925.0, 1794.0, 746.0, 342.0, 207.0, 100.0, 48.0, 51.0, 40.0, 17.0, 21.0, 15.0, 13.0, 14.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.23583984375, -0.22940444946289062, -0.22296905517578125, -0.21653366088867188, -0.2100982666015625, -0.20366287231445312, -0.19722747802734375, -0.19079208374023438, -0.184356689453125, -0.17792129516601562, -0.17148590087890625, -0.16505050659179688, -0.1586151123046875, -0.15217971801757812, -0.14574432373046875, -0.13930892944335938, -0.13287353515625, -0.12643814086914062, -0.12000274658203125, -0.11356735229492188, -0.1071319580078125, -0.10069656372070312, -0.09426116943359375, -0.08782577514648438, -0.081390380859375, -0.07495498657226562, -0.06851959228515625, -0.062084197998046875, -0.0556488037109375, -0.049213409423828125, -0.04277801513671875, -0.036342620849609375, -0.0299072265625, -0.023471832275390625, -0.01703643798828125, -0.010601043701171875, -0.0041656494140625, 0.002269744873046875, 0.00870513916015625, 0.015140533447265625, 0.021575927734375, 0.028011322021484375, 0.03444671630859375, 0.040882110595703125, 0.0473175048828125, 0.053752899169921875, 0.06018829345703125, 0.06662368774414062, 0.07305908203125, 0.07949447631835938, 0.08592987060546875, 0.09236526489257812, 0.0988006591796875, 0.10523605346679688, 0.11167144775390625, 0.11810684204101562, 0.124542236328125, 0.13097763061523438, 0.13741302490234375, 0.14384841918945312, 0.1502838134765625, 0.15671920776367188, 0.16315460205078125, 0.16958999633789062, 0.176025390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 7.0, 3.0, 10.0, 16.0, 9.0, 26.0, 19.0, 25.0, 34.0, 37.0, 53.0, 60.0, 76.0, 76.0, 84.0, 82.0, 71.0, 51.0, 39.0, 52.0, 31.0, 26.0, 19.0, 19.0, 8.0, 12.0, 15.0, 7.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.038238525390625, -0.0369720458984375, -0.03570556640625, -0.0344390869140625, -0.033172607421875, -0.0319061279296875, -0.0306396484375, -0.0293731689453125, -0.028106689453125, -0.0268402099609375, -0.02557373046875, -0.0243072509765625, -0.023040771484375, -0.0217742919921875, -0.0205078125, -0.0192413330078125, -0.017974853515625, -0.0167083740234375, -0.01544189453125, -0.0141754150390625, -0.012908935546875, -0.0116424560546875, -0.0103759765625, -0.0091094970703125, -0.007843017578125, -0.0065765380859375, -0.00531005859375, -0.0040435791015625, -0.002777099609375, -0.0015106201171875, -0.000244140625, 0.0010223388671875, 0.002288818359375, 0.0035552978515625, 0.00482177734375, 0.0060882568359375, 0.007354736328125, 0.0086212158203125, 0.0098876953125, 0.0111541748046875, 0.012420654296875, 0.0136871337890625, 0.01495361328125, 0.0162200927734375, 0.017486572265625, 0.0187530517578125, 0.02001953125, 0.0212860107421875, 0.022552490234375, 0.0238189697265625, 0.02508544921875, 0.0263519287109375, 0.027618408203125, 0.0288848876953125, 0.0301513671875, 0.0314178466796875, 0.032684326171875, 0.0339508056640625, 0.03521728515625, 0.0364837646484375, 0.037750244140625, 0.0390167236328125, 0.040283203125, 0.0415496826171875, 0.042816162109375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 25.0, 36.0, 72.0, 78.0, 105.0, 144.0, 140.0, 111.0, 96.0, 49.0, 44.0, 28.0, 19.0, 18.0, 6.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5933345556259155, -1.5387074947357178, -1.48408043384552, -1.4294533729553223, -1.374826192855835, -1.3201992511749268, -1.2655720710754395, -1.2109450101852417, -1.156317949295044, -1.1016908884048462, -1.0470638275146484, -0.9924367070198059, -0.9378096461296082, -0.8831825852394104, -0.8285554647445679, -0.7739284038543701, -0.7193013429641724, -0.6646742820739746, -0.6100472211837769, -0.5554201006889343, -0.5007930397987366, -0.4461659789085388, -0.3915388882160187, -0.33691179752349854, -0.2822847366333008, -0.22765766084194183, -0.17303058505058289, -0.11840350925922394, -0.06377643346786499, -0.009149372577667236, 0.045477718114852905, 0.10010480880737305, 0.15473198890686035, 0.2093590646982193, 0.26398614048957825, 0.3186132311820984, 0.37324029207229614, 0.4278673529624939, 0.48249444365501404, 0.5371215343475342, 0.5917485952377319, 0.6463756561279297, 0.7010027170181274, 0.75562983751297, 0.8102568984031677, 0.8648839592933655, 0.919511079788208, 0.9741381406784058, 1.0287652015686035, 1.0833922624588013, 1.138019323348999, 1.1926463842391968, 1.2472734451293945, 1.3019006252288818, 1.3565276861190796, 1.4111547470092773, 1.465781807899475, 1.5204088687896729, 1.5750359296798706, 1.6296629905700684, 1.6842901706695557, 1.7389171123504639, 1.7935442924499512, 1.848171353340149, 1.9027984142303467]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 7.0, 21.0, 19.0, 24.0, 30.0, 39.0, 53.0, 69.0, 63.0, 71.0, 79.0, 61.0, 68.0, 88.0, 62.0, 54.0, 52.0, 34.0, 28.0, 24.0, 19.0, 11.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6685205698013306, -1.629874348640442, -1.5912282466888428, -1.552582025527954, -1.513935923576355, -1.4752897024154663, -1.4366436004638672, -1.3979973793029785, -1.3593511581420898, -1.3207049369812012, -1.282058835029602, -1.2434126138687134, -1.2047665119171143, -1.1661202907562256, -1.1274741888046265, -1.0888279676437378, -1.0501818656921387, -1.01153564453125, -0.9728895425796509, -0.934243381023407, -0.8955972194671631, -0.8569509983062744, -0.8183048367500305, -0.7796586751937866, -0.7410125136375427, -0.7023663520812988, -0.6637201905250549, -0.625074028968811, -0.5864278078079224, -0.5477817058563232, -0.5091354846954346, -0.4704893231391907, -0.43184322118759155, -0.39319705963134766, -0.35455089807510376, -0.3159047067165375, -0.2772585451602936, -0.23861238360404968, -0.1999662071466446, -0.1613200306892395, -0.1226738691329956, -0.08402770012617111, -0.04538153111934662, -0.006735362112522125, 0.03191080689430237, 0.07055696845054626, 0.10920314490795135, 0.14784932136535645, 0.18649548292160034, 0.22514164447784424, 0.26378780603408813, 0.3024339973926544, 0.3410801589488983, 0.3797263205051422, 0.4183725118637085, 0.4570186734199524, 0.4956648349761963, 0.5343109965324402, 0.5729571580886841, 0.611603319644928, 0.6502494812011719, 0.6888957023620605, 0.7275418639183044, 0.7661880254745483, 0.8048341870307922]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 4.0, 14.0, 10.0, 24.0, 24.0, 46.0, 75.0, 173.0, 343.0, 845.0, 2131.0, 5614.0, 17462.0, 76559.0, 474037.0, 387887.0, 60359.0, 14761.0, 4928.0, 1866.0, 722.0, 312.0, 149.0, 81.0, 41.0, 19.0, 15.0, 9.0, 9.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2568359375, -1.21484375, -1.1728515625, -1.130859375, -1.0888671875, -1.046875, -1.0048828125, -0.962890625, -0.9208984375, -0.87890625, -0.8369140625, -0.794921875, -0.7529296875, -0.7109375, -0.6689453125, -0.626953125, -0.5849609375, -0.54296875, -0.5009765625, -0.458984375, -0.4169921875, -0.375, -0.3330078125, -0.291015625, -0.2490234375, -0.20703125, -0.1650390625, -0.123046875, -0.0810546875, -0.0390625, 0.0029296875, 0.044921875, 0.0869140625, 0.12890625, 0.1708984375, 0.212890625, 0.2548828125, 0.296875, 0.3388671875, 0.380859375, 0.4228515625, 0.46484375, 0.5068359375, 0.548828125, 0.5908203125, 0.6328125, 0.6748046875, 0.716796875, 0.7587890625, 0.80078125, 0.8427734375, 0.884765625, 0.9267578125, 0.96875, 1.0107421875, 1.052734375, 1.0947265625, 1.13671875, 1.1787109375, 1.220703125, 1.2626953125, 1.3046875, 1.3466796875, 1.388671875, 1.4306640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 3.0, 9.0, 9.0, 15.0, 23.0, 23.0, 37.0, 50.0, 39.0, 59.0, 62.0, 54.0, 71.0, 47.0, 69.0, 59.0, 63.0, 65.0, 44.0, 33.0, 43.0, 22.0, 25.0, 21.0, 14.0, 11.0, 9.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0], "bins": [-3.02734375, -2.9594573974609375, -2.891571044921875, -2.8236846923828125, -2.75579833984375, -2.6879119873046875, -2.620025634765625, -2.5521392822265625, -2.4842529296875, -2.4163665771484375, -2.348480224609375, -2.2805938720703125, -2.21270751953125, -2.1448211669921875, -2.076934814453125, -2.0090484619140625, -1.941162109375, -1.8732757568359375, -1.805389404296875, -1.7375030517578125, -1.66961669921875, -1.6017303466796875, -1.533843994140625, -1.4659576416015625, -1.3980712890625, -1.3301849365234375, -1.262298583984375, -1.1944122314453125, -1.12652587890625, -1.0586395263671875, -0.990753173828125, -0.9228668212890625, -0.85498046875, -0.7870941162109375, -0.719207763671875, -0.6513214111328125, -0.58343505859375, -0.5155487060546875, -0.447662353515625, -0.3797760009765625, -0.3118896484375, -0.2440032958984375, -0.176116943359375, -0.1082305908203125, -0.04034423828125, 0.0275421142578125, 0.095428466796875, 0.1633148193359375, 0.231201171875, 0.2990875244140625, 0.366973876953125, 0.4348602294921875, 0.50274658203125, 0.5706329345703125, 0.638519287109375, 0.7064056396484375, 0.7742919921875, 0.8421783447265625, 0.910064697265625, 0.9779510498046875, 1.04583740234375, 1.1137237548828125, 1.181610107421875, 1.2494964599609375, 1.3173828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 3.0, 9.0, 6.0, 5.0, 11.0, 10.0, 14.0, 12.0, 18.0, 18.0, 20.0, 22.0, 28.0, 37.0, 62.0, 57.0, 106.0, 156.0, 349.0, 2876.0, 422156.0, 618118.0, 3467.0, 350.0, 180.0, 101.0, 68.0, 48.0, 32.0, 27.0, 29.0, 29.0, 18.0, 16.0, 14.0, 11.0, 14.0, 13.0, 7.0, 7.0, 13.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.4609375, -4.31719970703125, -4.1734619140625, -4.02972412109375, -3.885986328125, -3.74224853515625, -3.5985107421875, -3.45477294921875, -3.31103515625, -3.16729736328125, -3.0235595703125, -2.87982177734375, -2.736083984375, -2.59234619140625, -2.4486083984375, -2.30487060546875, -2.1611328125, -2.01739501953125, -1.8736572265625, -1.72991943359375, -1.586181640625, -1.44244384765625, -1.2987060546875, -1.15496826171875, -1.01123046875, -0.86749267578125, -0.7237548828125, -0.58001708984375, -0.436279296875, -0.29254150390625, -0.1488037109375, -0.00506591796875, 0.138671875, 0.28240966796875, 0.4261474609375, 0.56988525390625, 0.713623046875, 0.85736083984375, 1.0010986328125, 1.14483642578125, 1.28857421875, 1.43231201171875, 1.5760498046875, 1.71978759765625, 1.863525390625, 2.00726318359375, 2.1510009765625, 2.29473876953125, 2.4384765625, 2.58221435546875, 2.7259521484375, 2.86968994140625, 3.013427734375, 3.15716552734375, 3.3009033203125, 3.44464111328125, 3.58837890625, 3.73211669921875, 3.8758544921875, 4.01959228515625, 4.163330078125, 4.30706787109375, 4.4508056640625, 4.59454345703125, 4.73828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 9.0, 9.0, 11.0, 13.0, 10.0, 13.0, 19.0, 22.0, 23.0, 32.0, 31.0, 37.0, 40.0, 35.0, 36.0, 44.0, 43.0, 38.0, 32.0, 38.0, 41.0, 43.0, 31.0, 31.0, 38.0, 23.0, 32.0, 28.0, 26.0, 23.0, 23.0, 15.0, 7.0, 8.0, 10.0, 15.0, 10.0, 11.0, 10.0, 2.0, 8.0, 0.0, 8.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4287109375, -1.3848419189453125, -1.340972900390625, -1.2971038818359375, -1.25323486328125, -1.2093658447265625, -1.165496826171875, -1.1216278076171875, -1.0777587890625, -1.0338897705078125, -0.990020751953125, -0.9461517333984375, -0.90228271484375, -0.8584136962890625, -0.814544677734375, -0.7706756591796875, -0.726806640625, -0.6829376220703125, -0.639068603515625, -0.5951995849609375, -0.55133056640625, -0.5074615478515625, -0.463592529296875, -0.4197235107421875, -0.3758544921875, -0.3319854736328125, -0.288116455078125, -0.2442474365234375, -0.20037841796875, -0.1565093994140625, -0.112640380859375, -0.0687713623046875, -0.02490234375, 0.0189666748046875, 0.062835693359375, 0.1067047119140625, 0.15057373046875, 0.1944427490234375, 0.238311767578125, 0.2821807861328125, 0.3260498046875, 0.3699188232421875, 0.413787841796875, 0.4576568603515625, 0.50152587890625, 0.5453948974609375, 0.589263916015625, 0.6331329345703125, 0.677001953125, 0.7208709716796875, 0.764739990234375, 0.8086090087890625, 0.85247802734375, 0.8963470458984375, 0.940216064453125, 0.9840850830078125, 1.0279541015625, 1.0718231201171875, 1.115692138671875, 1.1595611572265625, 1.20343017578125, 1.2472991943359375, 1.291168212890625, 1.3350372314453125, 1.37890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 16.0, 14.0, 24.0, 27.0, 33.0, 32.0, 54.0, 62.0, 85.0, 161.0, 271.0, 542.0, 987.0, 2253.0, 6041.0, 18878.0, 75500.0, 367460.0, 443502.0, 97167.0, 23087.0, 7081.0, 2600.0, 1139.0, 587.0, 321.0, 181.0, 115.0, 80.0, 61.0, 42.0, 34.0, 28.0, 21.0, 19.0, 8.0, 11.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.263671875, -0.25518798828125, -0.2467041015625, -0.23822021484375, -0.229736328125, -0.22125244140625, -0.2127685546875, -0.20428466796875, -0.19580078125, -0.18731689453125, -0.1788330078125, -0.17034912109375, -0.161865234375, -0.15338134765625, -0.1448974609375, -0.13641357421875, -0.1279296875, -0.11944580078125, -0.1109619140625, -0.10247802734375, -0.093994140625, -0.08551025390625, -0.0770263671875, -0.06854248046875, -0.06005859375, -0.05157470703125, -0.0430908203125, -0.03460693359375, -0.026123046875, -0.01763916015625, -0.0091552734375, -0.00067138671875, 0.0078125, 0.01629638671875, 0.0247802734375, 0.03326416015625, 0.041748046875, 0.05023193359375, 0.0587158203125, 0.06719970703125, 0.07568359375, 0.08416748046875, 0.0926513671875, 0.10113525390625, 0.109619140625, 0.11810302734375, 0.1265869140625, 0.13507080078125, 0.1435546875, 0.15203857421875, 0.1605224609375, 0.16900634765625, 0.177490234375, 0.18597412109375, 0.1944580078125, 0.20294189453125, 0.21142578125, 0.21990966796875, 0.2283935546875, 0.23687744140625, 0.245361328125, 0.25384521484375, 0.2623291015625, 0.27081298828125, 0.279296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 5.0, 8.0, 18.0, 14.0, 20.0, 23.0, 22.0, 41.0, 39.0, 66.0, 88.0, 87.0, 73.0, 88.0, 76.0, 70.0, 42.0, 38.0, 29.0, 22.0, 24.0, 18.0, 13.0, 13.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.49879264831543e-05, -3.3809803426265717e-05, -3.2631680369377136e-05, -3.1453557312488556e-05, -3.0275434255599976e-05, -2.9097311198711395e-05, -2.7919188141822815e-05, -2.6741065084934235e-05, -2.5562942028045654e-05, -2.4384818971157074e-05, -2.3206695914268494e-05, -2.2028572857379913e-05, -2.0850449800491333e-05, -1.9672326743602753e-05, -1.8494203686714172e-05, -1.7316080629825592e-05, -1.6137957572937012e-05, -1.4959834516048431e-05, -1.3781711459159851e-05, -1.260358840227127e-05, -1.142546534538269e-05, -1.024734228849411e-05, -9.06921923160553e-06, -7.89109617471695e-06, -6.712973117828369e-06, -5.534850060939789e-06, -4.3567270040512085e-06, -3.178603947162628e-06, -2.000480890274048e-06, -8.223578333854675e-07, 3.557652235031128e-07, 1.5338882803916931e-06, 2.7120113372802734e-06, 3.890134394168854e-06, 5.068257451057434e-06, 6.246380507946014e-06, 7.424503564834595e-06, 8.602626621723175e-06, 9.780749678611755e-06, 1.0958872735500336e-05, 1.2136995792388916e-05, 1.3315118849277496e-05, 1.4493241906166077e-05, 1.5671364963054657e-05, 1.6849488019943237e-05, 1.8027611076831818e-05, 1.9205734133720398e-05, 2.0383857190608978e-05, 2.156198024749756e-05, 2.274010330438614e-05, 2.391822636127472e-05, 2.50963494181633e-05, 2.627447247505188e-05, 2.745259553194046e-05, 2.863071858882904e-05, 2.980884164571762e-05, 3.09869647026062e-05, 3.216508775949478e-05, 3.334321081638336e-05, 3.452133387327194e-05, 3.569945693016052e-05, 3.68775799870491e-05, 3.805570304393768e-05, 3.9233826100826263e-05, 4.0411949157714844e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 10.0, 11.0, 9.0, 20.0, 23.0, 22.0, 41.0, 61.0, 100.0, 188.0, 286.0, 623.0, 1237.0, 3090.0, 9261.0, 35114.0, 187433.0, 585194.0, 177697.0, 33556.0, 8902.0, 3078.0, 1246.0, 544.0, 305.0, 167.0, 98.0, 62.0, 51.0, 28.0, 22.0, 16.0, 15.0, 8.0, 10.0, 2.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.327392578125, -0.31731414794921875, -0.3072357177734375, -0.29715728759765625, -0.287078857421875, -0.27700042724609375, -0.2669219970703125, -0.25684356689453125, -0.24676513671875, -0.23668670654296875, -0.2266082763671875, -0.21652984619140625, -0.206451416015625, -0.19637298583984375, -0.1862945556640625, -0.17621612548828125, -0.1661376953125, -0.15605926513671875, -0.1459808349609375, -0.13590240478515625, -0.125823974609375, -0.11574554443359375, -0.1056671142578125, -0.09558868408203125, -0.08551025390625, -0.07543182373046875, -0.0653533935546875, -0.05527496337890625, -0.045196533203125, -0.03511810302734375, -0.0250396728515625, -0.01496124267578125, -0.0048828125, 0.00519561767578125, 0.0152740478515625, 0.02535247802734375, 0.035430908203125, 0.04550933837890625, 0.0555877685546875, 0.06566619873046875, 0.07574462890625, 0.08582305908203125, 0.0959014892578125, 0.10597991943359375, 0.116058349609375, 0.12613677978515625, 0.1362152099609375, 0.14629364013671875, 0.1563720703125, 0.16645050048828125, 0.1765289306640625, 0.18660736083984375, 0.196685791015625, 0.20676422119140625, 0.2168426513671875, 0.22692108154296875, 0.23699951171875, 0.24707794189453125, 0.2571563720703125, 0.26723480224609375, 0.277313232421875, 0.28739166259765625, 0.2974700927734375, 0.30754852294921875, 0.317626953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 10.0, 13.0, 17.0, 14.0, 21.0, 31.0, 29.0, 28.0, 36.0, 33.0, 46.0, 49.0, 59.0, 54.0, 48.0, 50.0, 49.0, 49.0, 49.0, 39.0, 40.0, 29.0, 38.0, 27.0, 25.0, 23.0, 14.0, 20.0, 8.0, 4.0, 4.0, 9.0, 1.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0794677734375, -0.07685089111328125, -0.0742340087890625, -0.07161712646484375, -0.069000244140625, -0.06638336181640625, -0.0637664794921875, -0.06114959716796875, -0.05853271484375, -0.05591583251953125, -0.0532989501953125, -0.05068206787109375, -0.048065185546875, -0.04544830322265625, -0.0428314208984375, -0.04021453857421875, -0.03759765625, -0.03498077392578125, -0.0323638916015625, -0.02974700927734375, -0.027130126953125, -0.02451324462890625, -0.0218963623046875, -0.01927947998046875, -0.01666259765625, -0.01404571533203125, -0.0114288330078125, -0.00881195068359375, -0.006195068359375, -0.00357818603515625, -0.0009613037109375, 0.00165557861328125, 0.0042724609375, 0.00688934326171875, 0.0095062255859375, 0.01212310791015625, 0.014739990234375, 0.01735687255859375, 0.0199737548828125, 0.02259063720703125, 0.02520751953125, 0.02782440185546875, 0.0304412841796875, 0.03305816650390625, 0.035675048828125, 0.03829193115234375, 0.0409088134765625, 0.04352569580078125, 0.046142578125, 0.04875946044921875, 0.0513763427734375, 0.05399322509765625, 0.056610107421875, 0.05922698974609375, 0.0618438720703125, 0.06446075439453125, 0.06707763671875, 0.06969451904296875, 0.0723114013671875, 0.07492828369140625, 0.077545166015625, 0.08016204833984375, 0.0827789306640625, 0.08539581298828125, 0.0880126953125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 33.0, 181.0, 447.0, 248.0, 76.0, 15.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.67369270324707, -20.302457809448242, -19.931224822998047, -19.55998992919922, -19.18875503540039, -18.817520141601562, -18.446287155151367, -18.07505226135254, -17.70381736755371, -17.332582473754883, -16.961349487304688, -16.59011459350586, -16.21887969970703, -15.84764575958252, -15.476411819458008, -15.10517692565918, -14.733943939208984, -14.362709999084473, -13.991475105285645, -13.620241165161133, -13.249006271362305, -12.877772331237793, -12.506538391113281, -12.135303497314453, -11.764068603515625, -11.392834663391113, -11.021599769592285, -10.650365829467773, -10.279130935668945, -9.907896995544434, -9.536663055419922, -9.165428161621094, -8.794193267822266, -8.422959327697754, -8.051724433898926, -7.680490493774414, -7.309256076812744, -6.938021659851074, -6.566787242889404, -6.195552825927734, -5.824318885803223, -5.453084468841553, -5.081850051879883, -4.710616111755371, -4.339381694793701, -3.9681472778320312, -3.5969128608703613, -3.2256786823272705, -2.8544442653656006, -2.4832098484039307, -2.11197566986084, -1.74074125289917, -1.3695069551467896, -0.9982726573944092, -0.6270382404327393, -0.25580406188964844, 0.11543035507202148, 0.48666468262672424, 0.857899010181427, 1.2291333675384521, 1.6003676652908325, 1.971601963043213, 2.342836380004883, 2.7140705585479736, 3.0853049755096436]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 10.0, 13.0, 12.0, 3.0, 10.0, 11.0, 16.0, 21.0, 24.0, 26.0, 41.0, 41.0, 41.0, 41.0, 35.0, 58.0, 38.0, 48.0, 39.0, 46.0, 49.0, 39.0, 44.0, 38.0, 33.0, 28.0, 34.0, 21.0, 15.0, 23.0, 12.0, 20.0, 8.0, 13.0, 11.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0], "bins": [-2.831918239593506, -2.7496049404144287, -2.6672916412353516, -2.5849781036376953, -2.502664804458618, -2.420351505279541, -2.3380379676818848, -2.2557246685028076, -2.1734113693237305, -2.0910980701446533, -2.008784770965576, -1.92647123336792, -1.8441579341888428, -1.7618446350097656, -1.679531216621399, -1.5972177982330322, -1.514904499053955, -1.432591199874878, -1.3502777814865112, -1.2679643630981445, -1.1856510639190674, -1.1033377647399902, -1.0210243463516235, -0.9387109875679016, -0.8563976287841797, -0.7740842700004578, -0.6917709112167358, -0.6094575524330139, -0.527144193649292, -0.44483083486557007, -0.36251747608184814, -0.2802041172981262, -0.1978909969329834, -0.11557763814926147, -0.03326427936553955, 0.04904907941818237, 0.1313624382019043, 0.21367579698562622, 0.29598915576934814, 0.37830251455307007, 0.460615873336792, 0.5429292321205139, 0.6252425909042358, 0.7075559496879578, 0.7898693084716797, 0.8721826672554016, 0.9544960260391235, 1.0368094444274902, 1.1191227436065674, 1.2014360427856445, 1.2837494611740112, 1.366062879562378, 1.448376178741455, 1.5306894779205322, 1.613002896308899, 1.6953163146972656, 1.7776296138763428, 1.85994291305542, 1.9422563314437866, 2.0245697498321533, 2.1068830490112305, 2.1891963481903076, 2.2715096473693848, 2.353823184967041, 2.436136484146118]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 7.0, 15.0, 25.0, 37.0, 65.0, 123.0, 290.0, 770.0, 2743.0, 14266.0, 206653.0, 2996335.0, 923117.0, 42328.0, 5465.0, 1281.0, 383.0, 159.0, 98.0, 48.0, 36.0, 17.0, 12.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.5738525390625, -1.479736328125, -1.3856201171875, -1.29150390625, -1.1973876953125, -1.103271484375, -1.0091552734375, -0.9150390625, -0.8209228515625, -0.726806640625, -0.6326904296875, -0.53857421875, -0.4444580078125, -0.350341796875, -0.2562255859375, -0.162109375, -0.0679931640625, 0.026123046875, 0.1202392578125, 0.21435546875, 0.3084716796875, 0.402587890625, 0.4967041015625, 0.5908203125, 0.6849365234375, 0.779052734375, 0.8731689453125, 0.96728515625, 1.0614013671875, 1.155517578125, 1.2496337890625, 1.34375, 1.4378662109375, 1.531982421875, 1.6260986328125, 1.72021484375, 1.8143310546875, 1.908447265625, 2.0025634765625, 2.0966796875, 2.1907958984375, 2.284912109375, 2.3790283203125, 2.47314453125, 2.5672607421875, 2.661376953125, 2.7554931640625, 2.849609375, 2.9437255859375, 3.037841796875, 3.1319580078125, 3.22607421875, 3.3201904296875, 3.414306640625, 3.5084228515625, 3.6025390625, 3.6966552734375, 3.790771484375, 3.8848876953125, 3.97900390625, 4.0731201171875, 4.167236328125, 4.2613525390625, 4.35546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 9.0, 12.0, 14.0, 16.0, 16.0, 28.0, 32.0, 27.0, 24.0, 46.0, 46.0, 52.0, 38.0, 47.0, 64.0, 37.0, 41.0, 46.0, 47.0, 38.0, 41.0, 34.0, 41.0, 44.0, 19.0, 14.0, 17.0, 18.0, 13.0, 13.0, 10.0, 5.0, 8.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1470489501953125, -1.111480712890625, -1.0759124755859375, -1.04034423828125, -1.0047760009765625, -0.969207763671875, -0.9336395263671875, -0.8980712890625, -0.8625030517578125, -0.826934814453125, -0.7913665771484375, -0.75579833984375, -0.7202301025390625, -0.684661865234375, -0.6490936279296875, -0.613525390625, -0.5779571533203125, -0.542388916015625, -0.5068206787109375, -0.47125244140625, -0.4356842041015625, -0.400115966796875, -0.3645477294921875, -0.3289794921875, -0.2934112548828125, -0.257843017578125, -0.2222747802734375, -0.18670654296875, -0.1511383056640625, -0.115570068359375, -0.0800018310546875, -0.04443359375, -0.0088653564453125, 0.026702880859375, 0.0622711181640625, 0.09783935546875, 0.1334075927734375, 0.168975830078125, 0.2045440673828125, 0.2401123046875, 0.2756805419921875, 0.311248779296875, 0.3468170166015625, 0.38238525390625, 0.4179534912109375, 0.453521728515625, 0.4890899658203125, 0.524658203125, 0.5602264404296875, 0.595794677734375, 0.6313629150390625, 0.66693115234375, 0.7024993896484375, 0.738067626953125, 0.7736358642578125, 0.8092041015625, 0.8447723388671875, 0.880340576171875, 0.9159088134765625, 0.95147705078125, 0.9870452880859375, 1.022613525390625, 1.0581817626953125, 1.09375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 4.0, 7.0, 5.0, 13.0, 3.0, 16.0, 24.0, 34.0, 43.0, 52.0, 75.0, 89.0, 156.0, 293.0, 806.0, 5551.0, 592278.0, 3577568.0, 15018.0, 1267.0, 411.0, 182.0, 108.0, 67.0, 53.0, 40.0, 33.0, 19.0, 19.0, 13.0, 6.0, 11.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.22711181640625, -4.0714111328125, -3.91571044921875, -3.760009765625, -3.60430908203125, -3.4486083984375, -3.29290771484375, -3.13720703125, -2.98150634765625, -2.8258056640625, -2.67010498046875, -2.514404296875, -2.35870361328125, -2.2030029296875, -2.04730224609375, -1.8916015625, -1.73590087890625, -1.5802001953125, -1.42449951171875, -1.268798828125, -1.11309814453125, -0.9573974609375, -0.80169677734375, -0.64599609375, -0.49029541015625, -0.3345947265625, -0.17889404296875, -0.023193359375, 0.13250732421875, 0.2882080078125, 0.44390869140625, 0.599609375, 0.75531005859375, 0.9110107421875, 1.06671142578125, 1.222412109375, 1.37811279296875, 1.5338134765625, 1.68951416015625, 1.84521484375, 2.00091552734375, 2.1566162109375, 2.31231689453125, 2.468017578125, 2.62371826171875, 2.7794189453125, 2.93511962890625, 3.0908203125, 3.24652099609375, 3.4022216796875, 3.55792236328125, 3.713623046875, 3.86932373046875, 4.0250244140625, 4.18072509765625, 4.33642578125, 4.49212646484375, 4.6478271484375, 4.80352783203125, 4.959228515625, 5.11492919921875, 5.2706298828125, 5.42633056640625, 5.58203125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 4.0, 13.0, 8.0, 23.0, 33.0, 47.0, 41.0, 78.0, 103.0, 165.0, 237.0, 318.0, 424.0, 486.0, 537.0, 427.0, 363.0, 191.0, 159.0, 130.0, 70.0, 56.0, 46.0, 25.0, 23.0, 17.0, 9.0, 13.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.61224365234375, -0.5965576171875, -0.58087158203125, -0.565185546875, -0.54949951171875, -0.5338134765625, -0.51812744140625, -0.50244140625, -0.48675537109375, -0.4710693359375, -0.45538330078125, -0.439697265625, -0.42401123046875, -0.4083251953125, -0.39263916015625, -0.376953125, -0.36126708984375, -0.3455810546875, -0.32989501953125, -0.314208984375, -0.29852294921875, -0.2828369140625, -0.26715087890625, -0.25146484375, -0.23577880859375, -0.2200927734375, -0.20440673828125, -0.188720703125, -0.17303466796875, -0.1573486328125, -0.14166259765625, -0.1259765625, -0.11029052734375, -0.0946044921875, -0.07891845703125, -0.063232421875, -0.04754638671875, -0.0318603515625, -0.01617431640625, -0.00048828125, 0.01519775390625, 0.0308837890625, 0.04656982421875, 0.062255859375, 0.07794189453125, 0.0936279296875, 0.10931396484375, 0.125, 0.14068603515625, 0.1563720703125, 0.17205810546875, 0.187744140625, 0.20343017578125, 0.2191162109375, 0.23480224609375, 0.25048828125, 0.26617431640625, 0.2818603515625, 0.29754638671875, 0.313232421875, 0.32891845703125, 0.3446044921875, 0.36029052734375, 0.3759765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 24.0, 25.0, 39.0, 43.0, 68.0, 92.0, 100.0, 108.0, 104.0, 95.0, 86.0, 63.0, 50.0, 30.0, 16.0, 20.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9770522117614746, -1.9064325094223022, -1.8358129262924194, -1.765193223953247, -1.6945736408233643, -1.623953938484192, -1.5533342361450195, -1.4827146530151367, -1.4120949506759644, -1.341475248336792, -1.2708556652069092, -1.2002359628677368, -1.1296162605285645, -1.0589966773986816, -0.9883769750595093, -0.9177573323249817, -0.8471376895904541, -0.7765180468559265, -0.7058984041213989, -0.6352787017822266, -0.564659059047699, -0.4940394163131714, -0.4234197437763214, -0.35280007123947144, -0.28218042850494385, -0.21156077086925507, -0.14094111323356628, -0.0703214555978775, 0.0002982020378112793, 0.07091784477233887, 0.14153751730918884, 0.21215718984603882, 0.2827770709991455, 0.3533967137336731, 0.42401638627052307, 0.49463605880737305, 0.5652557015419006, 0.6358753442764282, 0.7064950466156006, 0.7771146893501282, 0.8477343320846558, 0.9183539748191833, 0.9889736175537109, 1.0595933198928833, 1.1302130222320557, 1.2008326053619385, 1.2714523077011108, 1.3420720100402832, 1.412691593170166, 1.4833112955093384, 1.5539308786392212, 1.6245505809783936, 1.6951701641082764, 1.7657898664474487, 1.836409568786621, 1.907029151916504, 1.9776488542556763, 2.0482685565948486, 2.1188881397247314, 2.1895077228546143, 2.260127544403076, 2.330747127532959, 2.401366710662842, 2.4719865322113037, 2.5426061153411865]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 11.0, 6.0, 7.0, 7.0, 10.0, 14.0, 19.0, 19.0, 29.0, 34.0, 39.0, 40.0, 33.0, 39.0, 41.0, 37.0, 53.0, 30.0, 32.0, 64.0, 33.0, 37.0, 43.0, 40.0, 35.0, 45.0, 30.0, 27.0, 24.0, 21.0, 13.0, 19.0, 17.0, 10.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2569193840026855, -1.2209765911102295, -1.1850337982177734, -1.1490910053253174, -1.1131482124328613, -1.0772054195404053, -1.0412626266479492, -1.0053198337554932, -0.9693770408630371, -0.933434247970581, -0.897491455078125, -0.861548662185669, -0.8256058692932129, -0.7896630764007568, -0.7537202835083008, -0.7177774906158447, -0.6818346977233887, -0.6458919048309326, -0.6099491119384766, -0.5740063190460205, -0.5380635261535645, -0.5021207332611084, -0.46617794036865234, -0.4302351474761963, -0.39429235458374023, -0.3583495616912842, -0.3224067687988281, -0.28646397590637207, -0.250521183013916, -0.21457839012145996, -0.1786355972290039, -0.14269280433654785, -0.10675013065338135, -0.07080733776092529, -0.03486454486846924, 0.0010782480239868164, 0.03702104091644287, 0.07296383380889893, 0.10890662670135498, 0.14484941959381104, 0.1807922124862671, 0.21673500537872314, 0.2526777982711792, 0.28862059116363525, 0.3245633840560913, 0.36050617694854736, 0.3964489698410034, 0.4323917627334595, 0.4683345556259155, 0.5042773485183716, 0.5402201414108276, 0.5761629343032837, 0.6121057271957397, 0.6480485200881958, 0.6839913129806519, 0.7199341058731079, 0.755876898765564, 0.79181969165802, 0.8277624845504761, 0.8637052774429321, 0.8996480703353882, 0.9355908632278442, 0.9715336561203003, 1.0074764490127563, 1.0434192419052124]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 15.0, 12.0, 9.0, 9.0, 24.0, 21.0, 24.0, 41.0, 57.0, 102.0, 180.0, 317.0, 668.0, 1688.0, 4610.0, 15103.0, 63299.0, 274362.0, 475601.0, 161173.0, 36379.0, 9496.0, 3035.0, 1140.0, 511.0, 260.0, 155.0, 72.0, 46.0, 28.0, 20.0, 22.0, 10.0, 9.0, 11.0, 9.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.462158203125, -0.4486885070800781, -0.43521881103515625, -0.4217491149902344, -0.4082794189453125, -0.3948097229003906, -0.38134002685546875, -0.3678703308105469, -0.354400634765625, -0.3409309387207031, -0.32746124267578125, -0.3139915466308594, -0.3005218505859375, -0.2870521545410156, -0.27358245849609375, -0.2601127624511719, -0.24664306640625, -0.23317337036132812, -0.21970367431640625, -0.20623397827148438, -0.1927642822265625, -0.17929458618164062, -0.16582489013671875, -0.15235519409179688, -0.138885498046875, -0.12541580200195312, -0.11194610595703125, -0.09847640991210938, -0.0850067138671875, -0.07153701782226562, -0.05806732177734375, -0.044597625732421875, -0.0311279296875, -0.017658233642578125, -0.00418853759765625, 0.009281158447265625, 0.0227508544921875, 0.036220550537109375, 0.04969024658203125, 0.06315994262695312, 0.076629638671875, 0.09009933471679688, 0.10356903076171875, 0.11703872680664062, 0.1305084228515625, 0.14397811889648438, 0.15744781494140625, 0.17091751098632812, 0.18438720703125, 0.19785690307617188, 0.21132659912109375, 0.22479629516601562, 0.2382659912109375, 0.2517356872558594, 0.26520538330078125, 0.2786750793457031, 0.292144775390625, 0.3056144714355469, 0.31908416748046875, 0.3325538635253906, 0.3460235595703125, 0.3594932556152344, 0.37296295166015625, 0.3864326477050781, 0.39990234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 9.0, 13.0, 11.0, 25.0, 28.0, 47.0, 39.0, 48.0, 49.0, 63.0, 45.0, 51.0, 57.0, 56.0, 59.0, 54.0, 53.0, 46.0, 39.0, 41.0, 25.0, 35.0, 20.0, 13.0, 11.0, 6.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9241714477539062, -0.8957061767578125, -0.8672409057617188, -0.838775634765625, -0.8103103637695312, -0.7818450927734375, -0.7533798217773438, -0.72491455078125, -0.6964492797851562, -0.6679840087890625, -0.6395187377929688, -0.611053466796875, -0.5825881958007812, -0.5541229248046875, -0.5256576538085938, -0.4971923828125, -0.46872711181640625, -0.4402618408203125, -0.41179656982421875, -0.383331298828125, -0.35486602783203125, -0.3264007568359375, -0.29793548583984375, -0.26947021484375, -0.24100494384765625, -0.2125396728515625, -0.18407440185546875, -0.155609130859375, -0.12714385986328125, -0.0986785888671875, -0.07021331787109375, -0.041748046875, -0.01328277587890625, 0.0151824951171875, 0.04364776611328125, 0.072113037109375, 0.10057830810546875, 0.1290435791015625, 0.15750885009765625, 0.18597412109375, 0.21443939208984375, 0.2429046630859375, 0.27136993408203125, 0.299835205078125, 0.32830047607421875, 0.3567657470703125, 0.38523101806640625, 0.4136962890625, 0.44216156005859375, 0.4706268310546875, 0.49909210205078125, 0.527557373046875, 0.5560226440429688, 0.5844879150390625, 0.6129531860351562, 0.64141845703125, 0.6698837280273438, 0.6983489990234375, 0.7268142700195312, 0.755279541015625, 0.7837448120117188, 0.8122100830078125, 0.8406753540039062, 0.869140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 10.0, 10.0, 9.0, 15.0, 20.0, 19.0, 55.0, 66.0, 83.0, 173.0, 371.0, 685.0, 1391.0, 3199.0, 7729.0, 21576.0, 66657.0, 201881.0, 373968.0, 242594.0, 84112.0, 27080.0, 9630.0, 3794.0, 1634.0, 794.0, 408.0, 225.0, 113.0, 81.0, 53.0, 37.0, 19.0, 18.0, 12.0, 7.0, 2.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29344940185546875, -0.2831878662109375, -0.27292633056640625, -0.262664794921875, -0.25240325927734375, -0.2421417236328125, -0.23188018798828125, -0.22161865234375, -0.21135711669921875, -0.2010955810546875, -0.19083404541015625, -0.180572509765625, -0.17031097412109375, -0.1600494384765625, -0.14978790283203125, -0.1395263671875, -0.12926483154296875, -0.1190032958984375, -0.10874176025390625, -0.098480224609375, -0.08821868896484375, -0.0779571533203125, -0.06769561767578125, -0.05743408203125, -0.04717254638671875, -0.0369110107421875, -0.02664947509765625, -0.016387939453125, -0.00612640380859375, 0.0041351318359375, 0.01439666748046875, 0.024658203125, 0.03491973876953125, 0.0451812744140625, 0.05544281005859375, 0.065704345703125, 0.07596588134765625, 0.0862274169921875, 0.09648895263671875, 0.10675048828125, 0.11701202392578125, 0.1272735595703125, 0.13753509521484375, 0.147796630859375, 0.15805816650390625, 0.1683197021484375, 0.17858123779296875, 0.1888427734375, 0.19910430908203125, 0.2093658447265625, 0.21962738037109375, 0.229888916015625, 0.24015045166015625, 0.2504119873046875, 0.26067352294921875, 0.27093505859375, 0.28119659423828125, 0.2914581298828125, 0.30171966552734375, 0.311981201171875, 0.32224273681640625, 0.3325042724609375, 0.34276580810546875, 0.35302734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 13.0, 14.0, 22.0, 19.0, 28.0, 24.0, 28.0, 29.0, 36.0, 45.0, 49.0, 53.0, 60.0, 47.0, 40.0, 48.0, 40.0, 43.0, 42.0, 40.0, 32.0, 28.0, 30.0, 26.0, 15.0, 20.0, 16.0, 20.0, 12.0, 10.0, 6.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.283203125, -1.2394866943359375, -1.195770263671875, -1.1520538330078125, -1.10833740234375, -1.0646209716796875, -1.020904541015625, -0.9771881103515625, -0.9334716796875, -0.8897552490234375, -0.846038818359375, -0.8023223876953125, -0.75860595703125, -0.7148895263671875, -0.671173095703125, -0.6274566650390625, -0.583740234375, -0.5400238037109375, -0.496307373046875, -0.4525909423828125, -0.40887451171875, -0.3651580810546875, -0.321441650390625, -0.2777252197265625, -0.2340087890625, -0.1902923583984375, -0.146575927734375, -0.1028594970703125, -0.05914306640625, -0.0154266357421875, 0.028289794921875, 0.0720062255859375, 0.11572265625, 0.1594390869140625, 0.203155517578125, 0.2468719482421875, 0.29058837890625, 0.3343048095703125, 0.378021240234375, 0.4217376708984375, 0.4654541015625, 0.5091705322265625, 0.552886962890625, 0.5966033935546875, 0.64031982421875, 0.6840362548828125, 0.727752685546875, 0.7714691162109375, 0.815185546875, 0.8589019775390625, 0.902618408203125, 0.9463348388671875, 0.99005126953125, 1.0337677001953125, 1.077484130859375, 1.1212005615234375, 1.1649169921875, 1.2086334228515625, 1.252349853515625, 1.2960662841796875, 1.33978271484375, 1.3834991455078125, 1.427215576171875, 1.4709320068359375, 1.5146484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 21.0, 26.0, 56.0, 58.0, 95.0, 143.0, 262.0, 431.0, 776.0, 1520.0, 2999.0, 6825.0, 17509.0, 50591.0, 161311.0, 370968.0, 284003.0, 98259.0, 31427.0, 11446.0, 4850.0, 2290.0, 1168.0, 611.0, 326.0, 196.0, 129.0, 81.0, 49.0, 30.0, 18.0, 23.0, 12.0, 6.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08392333984375, -0.0810079574584961, -0.07809257507324219, -0.07517719268798828, -0.07226181030273438, -0.06934642791748047, -0.06643104553222656, -0.06351566314697266, -0.06060028076171875, -0.057684898376464844, -0.05476951599121094, -0.05185413360595703, -0.048938751220703125, -0.04602336883544922, -0.04310798645019531, -0.040192604064941406, -0.0372772216796875, -0.034361839294433594, -0.03144645690917969, -0.02853107452392578, -0.025615692138671875, -0.02270030975341797, -0.019784927368164062, -0.016869544982910156, -0.01395416259765625, -0.011038780212402344, -0.008123397827148438, -0.005208015441894531, -0.002292633056640625, 0.0006227493286132812, 0.0035381317138671875, 0.006453514099121094, 0.009368896484375, 0.012284278869628906, 0.015199661254882812, 0.01811504364013672, 0.021030426025390625, 0.02394580841064453, 0.026861190795898438, 0.029776573181152344, 0.03269195556640625, 0.035607337951660156, 0.03852272033691406, 0.04143810272216797, 0.044353485107421875, 0.04726886749267578, 0.05018424987792969, 0.053099632263183594, 0.0560150146484375, 0.058930397033691406, 0.06184577941894531, 0.06476116180419922, 0.06767654418945312, 0.07059192657470703, 0.07350730895996094, 0.07642269134521484, 0.07933807373046875, 0.08225345611572266, 0.08516883850097656, 0.08808422088623047, 0.09099960327148438, 0.09391498565673828, 0.09683036804199219, 0.0997457504272461, 0.1026611328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 12.0, 16.0, 22.0, 36.0, 52.0, 40.0, 91.0, 82.0, 103.0, 102.0, 85.0, 75.0, 62.0, 64.0, 36.0, 34.0, 22.0, 19.0, 10.0, 9.0, 4.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-8.082389831542969e-05, -7.886812090873718e-05, -7.691234350204468e-05, -7.495656609535217e-05, -7.300078868865967e-05, -7.104501128196716e-05, -6.908923387527466e-05, -6.713345646858215e-05, -6.517767906188965e-05, -6.322190165519714e-05, -6.126612424850464e-05, -5.9310346841812134e-05, -5.735456943511963e-05, -5.5398792028427124e-05, -5.344301462173462e-05, -5.1487237215042114e-05, -4.953145980834961e-05, -4.7575682401657104e-05, -4.56199049949646e-05, -4.3664127588272095e-05, -4.170835018157959e-05, -3.9752572774887085e-05, -3.779679536819458e-05, -3.5841017961502075e-05, -3.388524055480957e-05, -3.1929463148117065e-05, -2.997368574142456e-05, -2.8017908334732056e-05, -2.606213092803955e-05, -2.4106353521347046e-05, -2.215057611465454e-05, -2.0194798707962036e-05, -1.823902130126953e-05, -1.6283243894577026e-05, -1.4327466487884521e-05, -1.2371689081192017e-05, -1.0415911674499512e-05, -8.460134267807007e-06, -6.504356861114502e-06, -4.548579454421997e-06, -2.592802047729492e-06, -6.370246410369873e-07, 1.3187527656555176e-06, 3.2745301723480225e-06, 5.230307579040527e-06, 7.186084985733032e-06, 9.141862392425537e-06, 1.1097639799118042e-05, 1.3053417205810547e-05, 1.5009194612503052e-05, 1.6964972019195557e-05, 1.892074942588806e-05, 2.0876526832580566e-05, 2.283230423927307e-05, 2.4788081645965576e-05, 2.674385905265808e-05, 2.8699636459350586e-05, 3.065541386604309e-05, 3.2611191272735596e-05, 3.45669686794281e-05, 3.6522746086120605e-05, 3.847852349281311e-05, 4.0434300899505615e-05, 4.239007830619812e-05, 4.4345855712890625e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 7.0, 10.0, 23.0, 27.0, 24.0, 43.0, 81.0, 110.0, 204.0, 426.0, 1158.0, 3053.0, 11306.0, 53552.0, 299702.0, 517862.0, 127753.0, 24180.0, 5844.0, 1756.0, 688.0, 296.0, 142.0, 91.0, 60.0, 22.0, 33.0, 27.0, 12.0, 12.0, 9.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1424560546875, -0.13789749145507812, -0.13333892822265625, -0.12878036499023438, -0.1242218017578125, -0.11966323852539062, -0.11510467529296875, -0.11054611206054688, -0.105987548828125, -0.10142898559570312, -0.09687042236328125, -0.09231185913085938, -0.0877532958984375, -0.08319473266601562, -0.07863616943359375, -0.07407760620117188, -0.06951904296875, -0.06496047973632812, -0.06040191650390625, -0.055843353271484375, -0.0512847900390625, -0.046726226806640625, -0.04216766357421875, -0.037609100341796875, -0.033050537109375, -0.028491973876953125, -0.02393341064453125, -0.019374847412109375, -0.0148162841796875, -0.010257720947265625, -0.00569915771484375, -0.001140594482421875, 0.00341796875, 0.007976531982421875, 0.01253509521484375, 0.017093658447265625, 0.0216522216796875, 0.026210784912109375, 0.03076934814453125, 0.035327911376953125, 0.039886474609375, 0.044445037841796875, 0.04900360107421875, 0.053562164306640625, 0.0581207275390625, 0.06267929077148438, 0.06723785400390625, 0.07179641723632812, 0.07635498046875, 0.08091354370117188, 0.08547210693359375, 0.09003067016601562, 0.0945892333984375, 0.09914779663085938, 0.10370635986328125, 0.10826492309570312, 0.112823486328125, 0.11738204956054688, 0.12194061279296875, 0.12649917602539062, 0.1310577392578125, 0.13561630249023438, 0.14017486572265625, 0.14473342895507812, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 5.0, 13.0, 9.0, 14.0, 12.0, 16.0, 15.0, 22.0, 50.0, 37.0, 42.0, 57.0, 65.0, 63.0, 80.0, 66.0, 67.0, 65.0, 65.0, 48.0, 42.0, 34.0, 31.0, 17.0, 16.0, 12.0, 12.0, 3.0, 6.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.029449462890625, -0.028606176376342773, -0.027762889862060547, -0.02691960334777832, -0.026076316833496094, -0.025233030319213867, -0.02438974380493164, -0.023546457290649414, -0.022703170776367188, -0.02185988426208496, -0.021016597747802734, -0.020173311233520508, -0.01933002471923828, -0.018486738204956055, -0.017643451690673828, -0.0168001651763916, -0.015956878662109375, -0.015113592147827148, -0.014270305633544922, -0.013427019119262695, -0.012583732604980469, -0.011740446090698242, -0.010897159576416016, -0.010053873062133789, -0.009210586547851562, -0.008367300033569336, -0.007524013519287109, -0.006680727005004883, -0.005837440490722656, -0.00499415397644043, -0.004150867462158203, -0.0033075809478759766, -0.00246429443359375, -0.0016210079193115234, -0.0007777214050292969, 6.556510925292969e-05, 0.0009088516235351562, 0.0017521381378173828, 0.0025954246520996094, 0.003438711166381836, 0.0042819976806640625, 0.005125284194946289, 0.005968570709228516, 0.006811857223510742, 0.007655143737792969, 0.008498430252075195, 0.009341716766357422, 0.010185003280639648, 0.011028289794921875, 0.011871576309204102, 0.012714862823486328, 0.013558149337768555, 0.014401435852050781, 0.015244722366333008, 0.016088008880615234, 0.01693129539489746, 0.017774581909179688, 0.018617868423461914, 0.01946115493774414, 0.020304441452026367, 0.021147727966308594, 0.02199101448059082, 0.022834300994873047, 0.023677587509155273, 0.0245208740234375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 15.0, 21.0, 63.0, 66.0, 111.0, 137.0, 172.0, 142.0, 108.0, 58.0, 42.0, 22.0, 13.0, 11.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6638085842132568, -1.6052571535110474, -1.546705722808838, -1.4881542921066284, -1.429602861404419, -1.371051549911499, -1.3125001192092896, -1.25394868850708, -1.1953972578048706, -1.1368458271026611, -1.0782943964004517, -1.0197429656982422, -0.9611915946006775, -0.902640163898468, -0.8440887928009033, -0.7855373620986938, -0.7269859313964844, -0.6684345006942749, -0.6098830699920654, -0.5513316988945007, -0.49278026819229126, -0.4342288374900818, -0.3756774365901947, -0.3171260356903076, -0.25857460498809814, -0.20002318918704987, -0.1414717733860016, -0.08292035758495331, -0.02436894178390503, 0.03418248891830444, 0.09273388981819153, 0.1512852907180786, 0.20983672142028809, 0.26838815212249756, 0.32693955302238464, 0.38549095392227173, 0.4440423846244812, 0.5025938153266907, 0.5611451864242554, 0.6196966171264648, 0.6782480478286743, 0.7367994785308838, 0.7953509092330933, 0.853902280330658, 0.9124537110328674, 0.9710051417350769, 1.0295565128326416, 1.088107943534851, 1.1466593742370605, 1.20521080493927, 1.2637622356414795, 1.322313666343689, 1.3808650970458984, 1.4394164085388184, 1.4979678392410278, 1.5565192699432373, 1.6150707006454468, 1.6736221313476562, 1.7321735620498657, 1.7907249927520752, 1.8492763042449951, 1.9078278541564941, 1.966379165649414, 2.024930477142334, 2.083482027053833]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 2.0, 7.0, 10.0, 9.0, 10.0, 10.0, 13.0, 25.0, 29.0, 42.0, 35.0, 58.0, 41.0, 58.0, 47.0, 43.0, 57.0, 51.0, 53.0, 55.0, 49.0, 38.0, 53.0, 45.0, 29.0, 28.0, 23.0, 15.0, 25.0, 11.0, 7.0, 7.0, 10.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9053064584732056, -0.8786220550537109, -0.8519375920295715, -0.8252531886100769, -0.7985687255859375, -0.7718843221664429, -0.7451999187469482, -0.7185154557228088, -0.6918310523033142, -0.6651466488838196, -0.6384621858596802, -0.6117777824401855, -0.5850933194160461, -0.5584089159965515, -0.5317244529724121, -0.5050400495529175, -0.47835561633110046, -0.45167118310928345, -0.42498674988746643, -0.3983023166656494, -0.3716179132461548, -0.34493348002433777, -0.31824904680252075, -0.2915646433830261, -0.2648801803588867, -0.2381957471370697, -0.21151132881641388, -0.18482689559459686, -0.15814247727394104, -0.13145804405212402, -0.104773610830307, -0.07808919250965118, -0.05140477418899536, -0.024720346555113792, 0.0019640810787677765, 0.028648510575294495, 0.055332936346530914, 0.08201736211776733, 0.10870179533958435, 0.13538621366024017, 0.1620706468820572, 0.1887550801038742, 0.21543949842453003, 0.24212393164634705, 0.26880836486816406, 0.2954927682876587, 0.3221772313117981, 0.3488616347312927, 0.37554606795310974, 0.40223050117492676, 0.4289149343967438, 0.4555993676185608, 0.4822837710380554, 0.5089682340621948, 0.5356526374816895, 0.5623370409011841, 0.5890215039253235, 0.6157059073448181, 0.6423903703689575, 0.6690747737884521, 0.6957592368125916, 0.7224436402320862, 0.7491281032562256, 0.7758125066757202, 0.8024969100952148]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 20.0, 39.0, 108.0, 376.0, 2220.0, 41542.0, 947498.0, 53720.0, 2408.0, 387.0, 118.0, 38.0, 26.0, 12.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.706573486328125, -2.60455322265625, -2.502532958984375, -2.4005126953125, -2.298492431640625, -2.19647216796875, -2.094451904296875, -1.992431640625, -1.890411376953125, -1.78839111328125, -1.686370849609375, -1.5843505859375, -1.482330322265625, -1.38031005859375, -1.278289794921875, -1.17626953125, -1.074249267578125, -0.97222900390625, -0.870208740234375, -0.7681884765625, -0.666168212890625, -0.56414794921875, -0.462127685546875, -0.360107421875, -0.258087158203125, -0.15606689453125, -0.054046630859375, 0.0479736328125, 0.149993896484375, 0.25201416015625, 0.354034423828125, 0.4560546875, 0.558074951171875, 0.66009521484375, 0.762115478515625, 0.8641357421875, 0.966156005859375, 1.06817626953125, 1.170196533203125, 1.272216796875, 1.374237060546875, 1.47625732421875, 1.578277587890625, 1.6802978515625, 1.782318115234375, 1.88433837890625, 1.986358642578125, 2.08837890625, 2.190399169921875, 2.29241943359375, 2.394439697265625, 2.4964599609375, 2.598480224609375, 2.70050048828125, 2.802520751953125, 2.904541015625, 3.006561279296875, 3.10858154296875, 3.210601806640625, 3.3126220703125, 3.414642333984375, 3.51666259765625, 3.618682861328125, 3.720703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 4.0, 11.0, 8.0, 12.0, 12.0, 18.0, 14.0, 23.0, 23.0, 27.0, 37.0, 49.0, 55.0, 33.0, 44.0, 62.0, 56.0, 46.0, 49.0, 41.0, 39.0, 44.0, 47.0, 44.0, 25.0, 35.0, 35.0, 16.0, 10.0, 18.0, 15.0, 8.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6222076416015625, -1.573516845703125, -1.5248260498046875, -1.47613525390625, -1.4274444580078125, -1.378753662109375, -1.3300628662109375, -1.2813720703125, -1.2326812744140625, -1.183990478515625, -1.1352996826171875, -1.08660888671875, -1.0379180908203125, -0.989227294921875, -0.9405364990234375, -0.891845703125, -0.8431549072265625, -0.794464111328125, -0.7457733154296875, -0.69708251953125, -0.6483917236328125, -0.599700927734375, -0.5510101318359375, -0.5023193359375, -0.4536285400390625, -0.404937744140625, -0.3562469482421875, -0.30755615234375, -0.2588653564453125, -0.210174560546875, -0.1614837646484375, -0.11279296875, -0.0641021728515625, -0.015411376953125, 0.0332794189453125, 0.08197021484375, 0.1306610107421875, 0.179351806640625, 0.2280426025390625, 0.2767333984375, 0.3254241943359375, 0.374114990234375, 0.4228057861328125, 0.47149658203125, 0.5201873779296875, 0.568878173828125, 0.6175689697265625, 0.666259765625, 0.7149505615234375, 0.763641357421875, 0.8123321533203125, 0.86102294921875, 0.9097137451171875, 0.958404541015625, 1.0070953369140625, 1.0557861328125, 1.1044769287109375, 1.153167724609375, 1.2018585205078125, 1.25054931640625, 1.2992401123046875, 1.347930908203125, 1.3966217041015625, 1.4453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 6.0, 10.0, 12.0, 16.0, 17.0, 22.0, 22.0, 43.0, 45.0, 70.0, 77.0, 111.0, 138.0, 162.0, 211.0, 336.0, 983.0, 4718.0, 66645.0, 847932.0, 118155.0, 6286.0, 1142.0, 406.0, 213.0, 165.0, 106.0, 99.0, 71.0, 78.0, 67.0, 46.0, 29.0, 19.0, 22.0, 15.0, 14.0, 12.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-2.37109375, -2.30963134765625, -2.2481689453125, -2.18670654296875, -2.125244140625, -2.06378173828125, -2.0023193359375, -1.94085693359375, -1.87939453125, -1.81793212890625, -1.7564697265625, -1.69500732421875, -1.633544921875, -1.57208251953125, -1.5106201171875, -1.44915771484375, -1.3876953125, -1.32623291015625, -1.2647705078125, -1.20330810546875, -1.141845703125, -1.08038330078125, -1.0189208984375, -0.95745849609375, -0.89599609375, -0.83453369140625, -0.7730712890625, -0.71160888671875, -0.650146484375, -0.58868408203125, -0.5272216796875, -0.46575927734375, -0.404296875, -0.34283447265625, -0.2813720703125, -0.21990966796875, -0.158447265625, -0.09698486328125, -0.0355224609375, 0.02593994140625, 0.08740234375, 0.14886474609375, 0.2103271484375, 0.27178955078125, 0.333251953125, 0.39471435546875, 0.4561767578125, 0.51763916015625, 0.5791015625, 0.64056396484375, 0.7020263671875, 0.76348876953125, 0.824951171875, 0.88641357421875, 0.9478759765625, 1.00933837890625, 1.07080078125, 1.13226318359375, 1.1937255859375, 1.25518798828125, 1.316650390625, 1.37811279296875, 1.4395751953125, 1.50103759765625, 1.5625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 6.0, 4.0, 12.0, 8.0, 7.0, 13.0, 6.0, 9.0, 23.0, 15.0, 20.0, 30.0, 34.0, 25.0, 25.0, 29.0, 36.0, 32.0, 43.0, 48.0, 45.0, 51.0, 40.0, 44.0, 41.0, 38.0, 47.0, 37.0, 22.0, 34.0, 33.0, 20.0, 20.0, 22.0, 10.0, 7.0, 14.0, 13.0, 5.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 6.0], "bins": [-1.6904296875, -1.647552490234375, -1.60467529296875, -1.561798095703125, -1.5189208984375, -1.476043701171875, -1.43316650390625, -1.390289306640625, -1.347412109375, -1.304534912109375, -1.26165771484375, -1.218780517578125, -1.1759033203125, -1.133026123046875, -1.09014892578125, -1.047271728515625, -1.00439453125, -0.961517333984375, -0.91864013671875, -0.875762939453125, -0.8328857421875, -0.790008544921875, -0.74713134765625, -0.704254150390625, -0.661376953125, -0.618499755859375, -0.57562255859375, -0.532745361328125, -0.4898681640625, -0.446990966796875, -0.40411376953125, -0.361236572265625, -0.318359375, -0.275482177734375, -0.23260498046875, -0.189727783203125, -0.1468505859375, -0.103973388671875, -0.06109619140625, -0.018218994140625, 0.024658203125, 0.067535400390625, 0.11041259765625, 0.153289794921875, 0.1961669921875, 0.239044189453125, 0.28192138671875, 0.324798583984375, 0.36767578125, 0.410552978515625, 0.45343017578125, 0.496307373046875, 0.5391845703125, 0.582061767578125, 0.62493896484375, 0.667816162109375, 0.710693359375, 0.753570556640625, 0.79644775390625, 0.839324951171875, 0.8822021484375, 0.925079345703125, 0.96795654296875, 1.010833740234375, 1.0537109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 12.0, 23.0, 41.0, 52.0, 88.0, 143.0, 350.0, 1201.0, 7102.0, 106543.0, 811757.0, 111725.0, 7522.0, 1189.0, 363.0, 164.0, 82.0, 47.0, 38.0, 29.0, 12.0, 19.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.502105712890625, -0.48712158203125, -0.472137451171875, -0.4571533203125, -0.442169189453125, -0.42718505859375, -0.412200927734375, -0.397216796875, -0.382232666015625, -0.36724853515625, -0.352264404296875, -0.3372802734375, -0.322296142578125, -0.30731201171875, -0.292327880859375, -0.27734375, -0.262359619140625, -0.24737548828125, -0.232391357421875, -0.2174072265625, -0.202423095703125, -0.18743896484375, -0.172454833984375, -0.157470703125, -0.142486572265625, -0.12750244140625, -0.112518310546875, -0.0975341796875, -0.082550048828125, -0.06756591796875, -0.052581787109375, -0.03759765625, -0.022613525390625, -0.00762939453125, 0.007354736328125, 0.0223388671875, 0.037322998046875, 0.05230712890625, 0.067291259765625, 0.082275390625, 0.097259521484375, 0.11224365234375, 0.127227783203125, 0.1422119140625, 0.157196044921875, 0.17218017578125, 0.187164306640625, 0.2021484375, 0.217132568359375, 0.23211669921875, 0.247100830078125, 0.2620849609375, 0.277069091796875, 0.29205322265625, 0.307037353515625, 0.322021484375, 0.337005615234375, 0.35198974609375, 0.366973876953125, 0.3819580078125, 0.396942138671875, 0.41192626953125, 0.426910400390625, 0.44189453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 8.0, 11.0, 23.0, 28.0, 39.0, 58.0, 63.0, 97.0, 94.0, 119.0, 104.0, 83.0, 69.0, 54.0, 36.0, 32.0, 31.0, 12.0, 11.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.29425048828125e-05, -6.136111915111542e-05, -5.9779733419418335e-05, -5.819834768772125e-05, -5.661696195602417e-05, -5.503557622432709e-05, -5.3454190492630005e-05, -5.187280476093292e-05, -5.029141902923584e-05, -4.871003329753876e-05, -4.7128647565841675e-05, -4.554726183414459e-05, -4.396587610244751e-05, -4.238449037075043e-05, -4.0803104639053345e-05, -3.922171890735626e-05, -3.764033317565918e-05, -3.60589474439621e-05, -3.4477561712265015e-05, -3.289617598056793e-05, -3.131479024887085e-05, -2.9733404517173767e-05, -2.8152018785476685e-05, -2.6570633053779602e-05, -2.498924732208252e-05, -2.3407861590385437e-05, -2.1826475858688354e-05, -2.0245090126991272e-05, -1.866370439529419e-05, -1.7082318663597107e-05, -1.5500932931900024e-05, -1.3919547200202942e-05, -1.233816146850586e-05, -1.0756775736808777e-05, -9.175390005111694e-06, -7.594004273414612e-06, -6.012618541717529e-06, -4.431232810020447e-06, -2.8498470783233643e-06, -1.2684613466262817e-06, 3.129243850708008e-07, 1.8943101167678833e-06, 3.475695848464966e-06, 5.057081580162048e-06, 6.638467311859131e-06, 8.219853043556213e-06, 9.801238775253296e-06, 1.1382624506950378e-05, 1.2964010238647461e-05, 1.4545395970344543e-05, 1.6126781702041626e-05, 1.770816743373871e-05, 1.928955316543579e-05, 2.0870938897132874e-05, 2.2452324628829956e-05, 2.403371036052704e-05, 2.561509609222412e-05, 2.7196481823921204e-05, 2.8777867555618286e-05, 3.035925328731537e-05, 3.194063901901245e-05, 3.3522024750709534e-05, 3.5103410482406616e-05, 3.66847962141037e-05, 3.826618194580078e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 6.0, 12.0, 9.0, 28.0, 54.0, 57.0, 138.0, 278.0, 719.0, 2180.0, 9119.0, 73882.0, 729767.0, 209198.0, 17479.0, 3642.0, 1183.0, 375.0, 180.0, 88.0, 41.0, 25.0, 27.0, 16.0, 10.0, 6.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57373046875, -0.55889892578125, -0.5440673828125, -0.52923583984375, -0.514404296875, -0.49957275390625, -0.4847412109375, -0.46990966796875, -0.455078125, -0.44024658203125, -0.4254150390625, -0.41058349609375, -0.395751953125, -0.38092041015625, -0.3660888671875, -0.35125732421875, -0.33642578125, -0.32159423828125, -0.3067626953125, -0.29193115234375, -0.277099609375, -0.26226806640625, -0.2474365234375, -0.23260498046875, -0.2177734375, -0.20294189453125, -0.1881103515625, -0.17327880859375, -0.158447265625, -0.14361572265625, -0.1287841796875, -0.11395263671875, -0.09912109375, -0.08428955078125, -0.0694580078125, -0.05462646484375, -0.039794921875, -0.02496337890625, -0.0101318359375, 0.00469970703125, 0.01953125, 0.03436279296875, 0.0491943359375, 0.06402587890625, 0.078857421875, 0.09368896484375, 0.1085205078125, 0.12335205078125, 0.13818359375, 0.15301513671875, 0.1678466796875, 0.18267822265625, 0.197509765625, 0.21234130859375, 0.2271728515625, 0.24200439453125, 0.2568359375, 0.27166748046875, 0.2864990234375, 0.30133056640625, 0.316162109375, 0.33099365234375, 0.3458251953125, 0.36065673828125, 0.37548828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 13.0, 5.0, 10.0, 15.0, 19.0, 25.0, 32.0, 53.0, 58.0, 61.0, 72.0, 76.0, 70.0, 88.0, 70.0, 64.0, 63.0, 46.0, 37.0, 25.0, 17.0, 17.0, 13.0, 9.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09131717681884766, -0.08772468566894531, -0.08413219451904297, -0.08053970336914062, -0.07694721221923828, -0.07335472106933594, -0.0697622299194336, -0.06616973876953125, -0.0625772476196289, -0.05898475646972656, -0.05539226531982422, -0.051799774169921875, -0.04820728302001953, -0.04461479187011719, -0.041022300720214844, -0.0374298095703125, -0.033837318420410156, -0.030244827270507812, -0.02665233612060547, -0.023059844970703125, -0.01946735382080078, -0.015874862670898438, -0.012282371520996094, -0.00868988037109375, -0.005097389221191406, -0.0015048980712890625, 0.0020875930786132812, 0.005680084228515625, 0.009272575378417969, 0.012865066528320312, 0.016457557678222656, 0.020050048828125, 0.023642539978027344, 0.027235031127929688, 0.03082752227783203, 0.034420013427734375, 0.03801250457763672, 0.04160499572753906, 0.045197486877441406, 0.04878997802734375, 0.052382469177246094, 0.05597496032714844, 0.05956745147705078, 0.06315994262695312, 0.06675243377685547, 0.07034492492675781, 0.07393741607666016, 0.0775299072265625, 0.08112239837646484, 0.08471488952636719, 0.08830738067626953, 0.09189987182617188, 0.09549236297607422, 0.09908485412597656, 0.1026773452758789, 0.10626983642578125, 0.1098623275756836, 0.11345481872558594, 0.11704730987548828, 0.12063980102539062, 0.12423229217529297, 0.1278247833251953, 0.13141727447509766, 0.135009765625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 11.0, 10.0, 23.0, 57.0, 92.0, 117.0, 159.0, 162.0, 140.0, 108.0, 52.0, 29.0, 19.0, 12.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6468746662139893, -3.52596378326416, -3.405052900314331, -3.284142017364502, -3.163231372833252, -3.0423202514648438, -2.9214096069335938, -2.8004987239837646, -2.6795878410339355, -2.5586769580841064, -2.4377660751342773, -2.3168551921844482, -2.195944309234619, -2.075033664703369, -1.95412278175354, -1.833211898803711, -1.7123010158538818, -1.5913901329040527, -1.4704792499542236, -1.349568486213684, -1.228657603263855, -1.1077467203140259, -0.9868358969688416, -0.8659250736236572, -0.7450141906738281, -0.624103307723999, -0.5031924843788147, -0.382281631231308, -0.26137077808380127, -0.14045989513397217, -0.019549071788787842, 0.10136175155639648, 0.22227239608764648, 0.3431832492351532, 0.4640941023826599, 0.5850049257278442, 0.7059158086776733, 0.8268266916275024, 0.9477375149726868, 1.068648338317871, 1.1895592212677002, 1.3104701042175293, 1.4313809871673584, 1.552291750907898, 1.673202633857727, 1.7941135168075562, 1.9150242805480957, 2.035935163497925, 2.156846046447754, 2.277756929397583, 2.398667812347412, 2.519578695297241, 2.6404895782470703, 2.7614002227783203, 2.8823111057281494, 3.0032219886779785, 3.1241328716278076, 3.2450437545776367, 3.365954637527466, 3.486865520477295, 3.607776165008545, 3.728687286376953, 3.849597930908203, 3.9705088138580322, 4.091419696807861]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 10.0, 11.0, 20.0, 16.0, 18.0, 28.0, 26.0, 21.0, 42.0, 35.0, 47.0, 41.0, 54.0, 51.0, 43.0, 48.0, 50.0, 50.0, 49.0, 39.0, 35.0, 42.0, 37.0, 33.0, 30.0, 21.0, 27.0, 15.0, 14.0, 4.0, 6.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.958940267562866, -2.8722190856933594, -2.7854981422424316, -2.698776960372925, -2.612055778503418, -2.525334596633911, -2.4386136531829834, -2.3518924713134766, -2.2651712894439697, -2.178450107574463, -2.091729164123535, -2.0050079822540283, -1.9182868003845215, -1.8315657377243042, -1.744844675064087, -1.65812349319458, -1.5714024305343628, -1.4846813678741455, -1.3979601860046387, -1.3112391233444214, -1.2245179414749146, -1.1377968788146973, -1.0510756969451904, -0.9643546342849731, -0.8776335120201111, -0.790912389755249, -0.704191267490387, -0.6174701452255249, -0.5307490825653076, -0.44402793049812317, -0.3573068380355835, -0.27058571577072144, -0.18386459350585938, -0.09714347869157791, -0.010422363877296448, 0.07629874348640442, 0.16301986575126648, 0.24974098801612854, 0.3364620804786682, 0.4231832027435303, 0.5099043250083923, 0.5966254472732544, 0.6833465695381165, 0.7700676918029785, 0.8567887544631958, 0.9435099363327026, 1.03023099899292, 1.1169521808624268, 1.203673243522644, 1.2903943061828613, 1.3771154880523682, 1.4638365507125854, 1.5505577325820923, 1.6372787952423096, 1.7239999771118164, 1.8107210397720337, 1.897442102432251, 1.9841631650924683, 2.0708842277526855, 2.1576054096221924, 2.244326591491699, 2.331047773361206, 2.417768716812134, 2.5044898986816406, 2.5912110805511475]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 7.0, 10.0, 4.0, 16.0, 39.0, 62.0, 124.0, 232.0, 437.0, 1066.0, 2845.0, 9558.0, 48531.0, 542729.0, 2760691.0, 743170.0, 67155.0, 12117.0, 3366.0, 1170.0, 461.0, 215.0, 120.0, 54.0, 42.0, 23.0, 11.0, 7.0, 9.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.211517333984375, -1.14959716796875, -1.087677001953125, -1.0257568359375, -0.963836669921875, -0.90191650390625, -0.839996337890625, -0.778076171875, -0.716156005859375, -0.65423583984375, -0.592315673828125, -0.5303955078125, -0.468475341796875, -0.40655517578125, -0.344635009765625, -0.28271484375, -0.220794677734375, -0.15887451171875, -0.096954345703125, -0.0350341796875, 0.026885986328125, 0.08880615234375, 0.150726318359375, 0.212646484375, 0.274566650390625, 0.33648681640625, 0.398406982421875, 0.4603271484375, 0.522247314453125, 0.58416748046875, 0.646087646484375, 0.7080078125, 0.769927978515625, 0.83184814453125, 0.893768310546875, 0.9556884765625, 1.017608642578125, 1.07952880859375, 1.141448974609375, 1.203369140625, 1.265289306640625, 1.32720947265625, 1.389129638671875, 1.4510498046875, 1.512969970703125, 1.57489013671875, 1.636810302734375, 1.69873046875, 1.760650634765625, 1.82257080078125, 1.884490966796875, 1.9464111328125, 2.008331298828125, 2.07025146484375, 2.132171630859375, 2.194091796875, 2.256011962890625, 2.31793212890625, 2.379852294921875, 2.4417724609375, 2.503692626953125, 2.56561279296875, 2.627532958984375, 2.689453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 11.0, 5.0, 6.0, 9.0, 27.0, 25.0, 36.0, 31.0, 30.0, 44.0, 42.0, 53.0, 70.0, 40.0, 55.0, 57.0, 56.0, 54.0, 60.0, 50.0, 39.0, 41.0, 29.0, 29.0, 20.0, 20.0, 17.0, 11.0, 9.0, 11.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.349761962890625, -1.30987548828125, -1.269989013671875, -1.2301025390625, -1.190216064453125, -1.15032958984375, -1.110443115234375, -1.070556640625, -1.030670166015625, -0.99078369140625, -0.950897216796875, -0.9110107421875, -0.871124267578125, -0.83123779296875, -0.791351318359375, -0.75146484375, -0.711578369140625, -0.67169189453125, -0.631805419921875, -0.5919189453125, -0.552032470703125, -0.51214599609375, -0.472259521484375, -0.432373046875, -0.392486572265625, -0.35260009765625, -0.312713623046875, -0.2728271484375, -0.232940673828125, -0.19305419921875, -0.153167724609375, -0.11328125, -0.073394775390625, -0.03350830078125, 0.006378173828125, 0.0462646484375, 0.086151123046875, 0.12603759765625, 0.165924072265625, 0.205810546875, 0.245697021484375, 0.28558349609375, 0.325469970703125, 0.3653564453125, 0.405242919921875, 0.44512939453125, 0.485015869140625, 0.52490234375, 0.564788818359375, 0.60467529296875, 0.644561767578125, 0.6844482421875, 0.724334716796875, 0.76422119140625, 0.804107666015625, 0.843994140625, 0.883880615234375, 0.92376708984375, 0.963653564453125, 1.0035400390625, 1.043426513671875, 1.08331298828125, 1.123199462890625, 1.1630859375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 14.0, 18.0, 18.0, 31.0, 37.0, 68.0, 85.0, 128.0, 224.0, 444.0, 1066.0, 4785.0, 77723.0, 3908492.0, 191223.0, 7308.0, 1349.0, 496.0, 283.0, 142.0, 111.0, 78.0, 37.0, 36.0, 18.0, 21.0, 10.0, 10.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.52734375, -3.415740966796875, -3.30413818359375, -3.192535400390625, -3.0809326171875, -2.969329833984375, -2.85772705078125, -2.746124267578125, -2.634521484375, -2.522918701171875, -2.41131591796875, -2.299713134765625, -2.1881103515625, -2.076507568359375, -1.96490478515625, -1.853302001953125, -1.74169921875, -1.630096435546875, -1.51849365234375, -1.406890869140625, -1.2952880859375, -1.183685302734375, -1.07208251953125, -0.960479736328125, -0.848876953125, -0.737274169921875, -0.62567138671875, -0.514068603515625, -0.4024658203125, -0.290863037109375, -0.17926025390625, -0.067657470703125, 0.0439453125, 0.155548095703125, 0.26715087890625, 0.378753662109375, 0.4903564453125, 0.601959228515625, 0.71356201171875, 0.825164794921875, 0.936767578125, 1.048370361328125, 1.15997314453125, 1.271575927734375, 1.3831787109375, 1.494781494140625, 1.60638427734375, 1.717987060546875, 1.82958984375, 1.941192626953125, 2.05279541015625, 2.164398193359375, 2.2760009765625, 2.387603759765625, 2.49920654296875, 2.610809326171875, 2.722412109375, 2.834014892578125, 2.94561767578125, 3.057220458984375, 3.1688232421875, 3.280426025390625, 3.39202880859375, 3.503631591796875, 3.615234375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 15.0, 19.0, 20.0, 22.0, 26.0, 40.0, 64.0, 76.0, 110.0, 155.0, 224.0, 349.0, 462.0, 554.0, 491.0, 381.0, 331.0, 208.0, 148.0, 87.0, 60.0, 56.0, 42.0, 26.0, 24.0, 12.0, 17.0, 13.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.425872802734375, -0.41204833984375, -0.398223876953125, -0.3843994140625, -0.370574951171875, -0.35675048828125, -0.342926025390625, -0.3291015625, -0.315277099609375, -0.30145263671875, -0.287628173828125, -0.2738037109375, -0.259979248046875, -0.24615478515625, -0.232330322265625, -0.218505859375, -0.204681396484375, -0.19085693359375, -0.177032470703125, -0.1632080078125, -0.149383544921875, -0.13555908203125, -0.121734619140625, -0.10791015625, -0.094085693359375, -0.08026123046875, -0.066436767578125, -0.0526123046875, -0.038787841796875, -0.02496337890625, -0.011138916015625, 0.002685546875, 0.016510009765625, 0.03033447265625, 0.044158935546875, 0.0579833984375, 0.071807861328125, 0.08563232421875, 0.099456787109375, 0.11328125, 0.127105712890625, 0.14093017578125, 0.154754638671875, 0.1685791015625, 0.182403564453125, 0.19622802734375, 0.210052490234375, 0.223876953125, 0.237701416015625, 0.25152587890625, 0.265350341796875, 0.2791748046875, 0.292999267578125, 0.30682373046875, 0.320648193359375, 0.33447265625, 0.348297119140625, 0.36212158203125, 0.375946044921875, 0.3897705078125, 0.403594970703125, 0.41741943359375, 0.431243896484375, 0.445068359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 9.0, 22.0, 35.0, 43.0, 83.0, 111.0, 132.0, 136.0, 118.0, 114.0, 67.0, 41.0, 30.0, 20.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1864378452301025, -2.106645107269287, -2.026852607727051, -1.947059988975525, -1.867267370223999, -1.7874747514724731, -1.7076821327209473, -1.6278893947601318, -1.5480968952178955, -1.4683042764663696, -1.3885116577148438, -1.3087190389633179, -1.228926420211792, -1.1491338014602661, -1.0693411827087402, -0.9895485043525696, -0.9097558259963989, -0.829963207244873, -0.7501705884933472, -0.6703779697418213, -0.5905853509902954, -0.5107927322387695, -0.4310000538825989, -0.351207435131073, -0.2714148163795471, -0.19162219762802124, -0.11182956397533417, -0.032036930322647095, 0.047755688428878784, 0.12754830718040466, 0.20734095573425293, 0.2871335744857788, 0.3669261932373047, 0.44671881198883057, 0.5265114307403564, 0.6063040494918823, 0.6860966682434082, 0.7658892869949341, 0.8456819653511047, 0.9254745841026306, 1.0052671432495117, 1.0850597620010376, 1.1648523807525635, 1.2446449995040894, 1.3244376182556152, 1.4042302370071411, 1.484022855758667, 1.5638155937194824, 1.6436082124710083, 1.7234008312225342, 1.80319344997406, 1.882986068725586, 1.9627786874771118, 2.0425713062286377, 2.122364044189453, 2.2021565437316895, 2.281949281692505, 2.3617420196533203, 2.4415345191955566, 2.521327257156372, 2.6011197566986084, 2.680912494659424, 2.76070499420166, 2.8404977321624756, 2.920290231704712]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 9.0, 8.0, 3.0, 8.0, 14.0, 12.0, 19.0, 20.0, 20.0, 31.0, 30.0, 22.0, 35.0, 37.0, 32.0, 58.0, 62.0, 44.0, 53.0, 42.0, 58.0, 46.0, 50.0, 40.0, 43.0, 39.0, 36.0, 21.0, 18.0, 16.0, 22.0, 16.0, 8.0, 12.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4327870607376099, -1.394202709197998, -1.3556182384490967, -1.3170338869094849, -1.2784494161605835, -1.2398650646209717, -1.2012805938720703, -1.1626962423324585, -1.1241118907928467, -1.0855275392532349, -1.0469430685043335, -1.0083587169647217, -0.9697742462158203, -0.9311898946762085, -0.8926054835319519, -0.8540210723876953, -0.815436601638794, -0.7768521904945374, -0.7382677793502808, -0.6996833682060242, -0.6610989570617676, -0.6225146055221558, -0.5839301943778992, -0.5453457832336426, -0.506761372089386, -0.4681769609451294, -0.4295925498008728, -0.3910081684589386, -0.352423757314682, -0.3138393461704254, -0.2752549648284912, -0.23667055368423462, -0.19808626174926758, -0.159501850605011, -0.12091745436191559, -0.0823330506682396, -0.0437486469745636, -0.005164235830307007, 0.03342016041278839, 0.07200455665588379, 0.11058896780014038, 0.14917337894439697, 0.18775777518749237, 0.22634217143058777, 0.26492658257484436, 0.30351099371910095, 0.34209537506103516, 0.38067978620529175, 0.41926419734954834, 0.45784860849380493, 0.4964330196380615, 0.5350174307823181, 0.5736018419265747, 0.6121861934661865, 0.6507706046104431, 0.6893550157546997, 0.7279394268989563, 0.7665238380432129, 0.8051082491874695, 0.8436926603317261, 0.8822770118713379, 0.9208614826202393, 0.9594458341598511, 0.9980302453041077, 1.0366146564483643]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 14.0, 6.0, 10.0, 16.0, 32.0, 29.0, 77.0, 130.0, 243.0, 500.0, 1058.0, 2598.0, 6339.0, 17061.0, 55407.0, 241902.0, 502786.0, 159215.0, 39537.0, 13039.0, 4803.0, 2045.0, 866.0, 373.0, 188.0, 100.0, 51.0, 35.0, 18.0, 16.0, 10.0, 11.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.4091796875, -0.3969154357910156, -0.38465118408203125, -0.3723869323730469, -0.3601226806640625, -0.3478584289550781, -0.33559417724609375, -0.3233299255371094, -0.311065673828125, -0.2988014221191406, -0.28653717041015625, -0.2742729187011719, -0.2620086669921875, -0.24974441528320312, -0.23748016357421875, -0.22521591186523438, -0.21295166015625, -0.20068740844726562, -0.18842315673828125, -0.17615890502929688, -0.1638946533203125, -0.15163040161132812, -0.13936614990234375, -0.12710189819335938, -0.114837646484375, -0.10257339477539062, -0.09030914306640625, -0.07804489135742188, -0.0657806396484375, -0.053516387939453125, -0.04125213623046875, -0.028987884521484375, -0.0167236328125, -0.004459381103515625, 0.00780487060546875, 0.020069122314453125, 0.0323333740234375, 0.044597625732421875, 0.05686187744140625, 0.06912612915039062, 0.081390380859375, 0.09365463256835938, 0.10591888427734375, 0.11818313598632812, 0.1304473876953125, 0.14271163940429688, 0.15497589111328125, 0.16724014282226562, 0.17950439453125, 0.19176864624023438, 0.20403289794921875, 0.21629714965820312, 0.2285614013671875, 0.24082565307617188, 0.25308990478515625, 0.2653541564941406, 0.277618408203125, 0.2898826599121094, 0.30214691162109375, 0.3144111633300781, 0.3266754150390625, 0.3389396667480469, 0.35120391845703125, 0.3634681701660156, 0.375732421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 18.0, 14.0, 20.0, 30.0, 30.0, 32.0, 32.0, 43.0, 57.0, 49.0, 76.0, 55.0, 56.0, 61.0, 65.0, 64.0, 51.0, 42.0, 39.0, 25.0, 28.0, 16.0, 25.0, 13.0, 9.0, 13.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.0322723388671875, -1.002044677734375, -0.9718170166015625, -0.94158935546875, -0.9113616943359375, -0.881134033203125, -0.8509063720703125, -0.8206787109375, -0.7904510498046875, -0.760223388671875, -0.7299957275390625, -0.69976806640625, -0.6695404052734375, -0.639312744140625, -0.6090850830078125, -0.578857421875, -0.5486297607421875, -0.518402099609375, -0.4881744384765625, -0.45794677734375, -0.4277191162109375, -0.397491455078125, -0.3672637939453125, -0.3370361328125, -0.3068084716796875, -0.276580810546875, -0.2463531494140625, -0.21612548828125, -0.1858978271484375, -0.155670166015625, -0.1254425048828125, -0.09521484375, -0.0649871826171875, -0.034759521484375, -0.0045318603515625, 0.02569580078125, 0.0559234619140625, 0.086151123046875, 0.1163787841796875, 0.1466064453125, 0.1768341064453125, 0.207061767578125, 0.2372894287109375, 0.26751708984375, 0.2977447509765625, 0.327972412109375, 0.3582000732421875, 0.388427734375, 0.4186553955078125, 0.448883056640625, 0.4791107177734375, 0.50933837890625, 0.5395660400390625, 0.569793701171875, 0.6000213623046875, 0.6302490234375, 0.6604766845703125, 0.690704345703125, 0.7209320068359375, 0.75115966796875, 0.7813873291015625, 0.811614990234375, 0.8418426513671875, 0.8720703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 2.0, 3.0, 6.0, 7.0, 5.0, 7.0, 14.0, 17.0, 28.0, 28.0, 32.0, 62.0, 76.0, 125.0, 212.0, 327.0, 562.0, 1009.0, 1770.0, 3501.0, 7011.0, 14911.0, 35531.0, 98649.0, 277169.0, 358771.0, 155038.0, 53257.0, 20935.0, 9323.0, 4645.0, 2342.0, 1269.0, 746.0, 408.0, 238.0, 141.0, 117.0, 83.0, 47.0, 34.0, 28.0, 17.0, 10.0, 11.0, 6.0, 5.0, 5.0, 7.0, 3.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2303466796875, -0.2221813201904297, -0.21401596069335938, -0.20585060119628906, -0.19768524169921875, -0.18951988220214844, -0.18135452270507812, -0.1731891632080078, -0.1650238037109375, -0.1568584442138672, -0.14869308471679688, -0.14052772521972656, -0.13236236572265625, -0.12419700622558594, -0.11603164672851562, -0.10786628723144531, -0.099700927734375, -0.09153556823730469, -0.08337020874023438, -0.07520484924316406, -0.06703948974609375, -0.05887413024902344, -0.050708770751953125, -0.04254341125488281, -0.0343780517578125, -0.026212692260742188, -0.018047332763671875, -0.009881973266601562, -0.00171661376953125, 0.0064487457275390625, 0.014614105224609375, 0.022779464721679688, 0.03094482421875, 0.03911018371582031, 0.047275543212890625, 0.05544090270996094, 0.06360626220703125, 0.07177162170410156, 0.07993698120117188, 0.08810234069824219, 0.0962677001953125, 0.10443305969238281, 0.11259841918945312, 0.12076377868652344, 0.12892913818359375, 0.13709449768066406, 0.14525985717773438, 0.1534252166748047, 0.161590576171875, 0.1697559356689453, 0.17792129516601562, 0.18608665466308594, 0.19425201416015625, 0.20241737365722656, 0.21058273315429688, 0.2187480926513672, 0.2269134521484375, 0.2350788116455078, 0.24324417114257812, 0.25140953063964844, 0.25957489013671875, 0.26774024963378906, 0.2759056091308594, 0.2840709686279297, 0.292236328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 6.0, 6.0, 12.0, 15.0, 17.0, 21.0, 23.0, 27.0, 31.0, 40.0, 38.0, 43.0, 50.0, 56.0, 52.0, 64.0, 39.0, 60.0, 50.0, 46.0, 48.0, 44.0, 44.0, 27.0, 27.0, 19.0, 20.0, 20.0, 16.0, 10.0, 5.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8232421875, -1.7696533203125, -1.716064453125, -1.6624755859375, -1.60888671875, -1.5552978515625, -1.501708984375, -1.4481201171875, -1.39453125, -1.3409423828125, -1.287353515625, -1.2337646484375, -1.18017578125, -1.1265869140625, -1.072998046875, -1.0194091796875, -0.9658203125, -0.9122314453125, -0.858642578125, -0.8050537109375, -0.75146484375, -0.6978759765625, -0.644287109375, -0.5906982421875, -0.537109375, -0.4835205078125, -0.429931640625, -0.3763427734375, -0.32275390625, -0.2691650390625, -0.215576171875, -0.1619873046875, -0.1083984375, -0.0548095703125, -0.001220703125, 0.0523681640625, 0.10595703125, 0.1595458984375, 0.213134765625, 0.2667236328125, 0.3203125, 0.3739013671875, 0.427490234375, 0.4810791015625, 0.53466796875, 0.5882568359375, 0.641845703125, 0.6954345703125, 0.7490234375, 0.8026123046875, 0.856201171875, 0.9097900390625, 0.96337890625, 1.0169677734375, 1.070556640625, 1.1241455078125, 1.177734375, 1.2313232421875, 1.284912109375, 1.3385009765625, 1.39208984375, 1.4456787109375, 1.499267578125, 1.5528564453125, 1.6064453125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 5.0, 6.0, 7.0, 15.0, 19.0, 39.0, 56.0, 62.0, 122.0, 182.0, 309.0, 542.0, 934.0, 1815.0, 3522.0, 7798.0, 19762.0, 67696.0, 295821.0, 467385.0, 128516.0, 32389.0, 11302.0, 4907.0, 2343.0, 1258.0, 662.0, 415.0, 237.0, 134.0, 84.0, 59.0, 42.0, 37.0, 21.0, 16.0, 4.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1187744140625, -0.11519908905029297, -0.11162376403808594, -0.1080484390258789, -0.10447311401367188, -0.10089778900146484, -0.09732246398925781, -0.09374713897705078, -0.09017181396484375, -0.08659648895263672, -0.08302116394042969, -0.07944583892822266, -0.07587051391601562, -0.0722951889038086, -0.06871986389160156, -0.06514453887939453, -0.0615692138671875, -0.05799388885498047, -0.05441856384277344, -0.050843238830566406, -0.047267913818359375, -0.043692588806152344, -0.04011726379394531, -0.03654193878173828, -0.03296661376953125, -0.02939128875732422, -0.025815963745117188, -0.022240638732910156, -0.018665313720703125, -0.015089988708496094, -0.011514663696289062, -0.007939338684082031, -0.004364013671875, -0.0007886886596679688, 0.0027866363525390625, 0.006361961364746094, 0.009937286376953125, 0.013512611389160156, 0.017087936401367188, 0.02066326141357422, 0.02423858642578125, 0.02781391143798828, 0.03138923645019531, 0.034964561462402344, 0.038539886474609375, 0.042115211486816406, 0.04569053649902344, 0.04926586151123047, 0.0528411865234375, 0.05641651153564453, 0.05999183654785156, 0.0635671615600586, 0.06714248657226562, 0.07071781158447266, 0.07429313659667969, 0.07786846160888672, 0.08144378662109375, 0.08501911163330078, 0.08859443664550781, 0.09216976165771484, 0.09574508666992188, 0.0993204116821289, 0.10289573669433594, 0.10647106170654297, 0.11004638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 8.0, 4.0, 7.0, 17.0, 15.0, 32.0, 33.0, 58.0, 75.0, 97.0, 85.0, 88.0, 99.0, 89.0, 63.0, 40.0, 50.0, 24.0, 25.0, 15.0, 14.0, 6.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.365776062011719e-05, -6.185658276081085e-05, -6.0055404901504517e-05, -5.825422704219818e-05, -5.6453049182891846e-05, -5.465187132358551e-05, -5.2850693464279175e-05, -5.104951560497284e-05, -4.9248337745666504e-05, -4.744715988636017e-05, -4.564598202705383e-05, -4.38448041677475e-05, -4.204362630844116e-05, -4.024244844913483e-05, -3.844127058982849e-05, -3.6640092730522156e-05, -3.483891487121582e-05, -3.3037737011909485e-05, -3.123655915260315e-05, -2.9435381293296814e-05, -2.763420343399048e-05, -2.5833025574684143e-05, -2.4031847715377808e-05, -2.2230669856071472e-05, -2.0429491996765137e-05, -1.86283141374588e-05, -1.6827136278152466e-05, -1.502595841884613e-05, -1.3224780559539795e-05, -1.142360270023346e-05, -9.622424840927124e-06, -7.821246981620789e-06, -6.020069122314453e-06, -4.218891263008118e-06, -2.4177134037017822e-06, -6.165355443954468e-07, 1.1846423149108887e-06, 2.985820174217224e-06, 4.7869980335235596e-06, 6.588175892829895e-06, 8.38935375213623e-06, 1.0190531611442566e-05, 1.1991709470748901e-05, 1.3792887330055237e-05, 1.5594065189361572e-05, 1.7395243048667908e-05, 1.9196420907974243e-05, 2.099759876728058e-05, 2.2798776626586914e-05, 2.459995448589325e-05, 2.6401132345199585e-05, 2.820231020450592e-05, 3.0003488063812256e-05, 3.180466592311859e-05, 3.360584378242493e-05, 3.540702164173126e-05, 3.72081995010376e-05, 3.900937736034393e-05, 4.081055521965027e-05, 4.2611733078956604e-05, 4.441291093826294e-05, 4.6214088797569275e-05, 4.801526665687561e-05, 4.9816444516181946e-05, 5.161762237548828e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 7.0, 4.0, 11.0, 24.0, 16.0, 20.0, 34.0, 38.0, 69.0, 103.0, 152.0, 249.0, 527.0, 1157.0, 2796.0, 7322.0, 23307.0, 96345.0, 451466.0, 360659.0, 74711.0, 18688.0, 6298.0, 2358.0, 996.0, 493.0, 248.0, 126.0, 95.0, 52.0, 45.0, 30.0, 19.0, 15.0, 27.0, 7.0, 4.0, 8.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1300048828125, -0.1260547637939453, -0.12210464477539062, -0.11815452575683594, -0.11420440673828125, -0.11025428771972656, -0.10630416870117188, -0.10235404968261719, -0.0984039306640625, -0.09445381164550781, -0.09050369262695312, -0.08655357360839844, -0.08260345458984375, -0.07865333557128906, -0.07470321655273438, -0.07075309753417969, -0.066802978515625, -0.06285285949707031, -0.058902740478515625, -0.05495262145996094, -0.05100250244140625, -0.04705238342285156, -0.043102264404296875, -0.03915214538574219, -0.0352020263671875, -0.03125190734863281, -0.027301788330078125, -0.023351669311523438, -0.01940155029296875, -0.015451431274414062, -0.011501312255859375, -0.0075511932373046875, -0.00360107421875, 0.0003490447998046875, 0.004299163818359375, 0.008249282836914062, 0.01219940185546875, 0.016149520874023438, 0.020099639892578125, 0.024049758911132812, 0.0279998779296875, 0.03194999694824219, 0.035900115966796875, 0.03985023498535156, 0.04380035400390625, 0.04775047302246094, 0.051700592041015625, 0.05565071105957031, 0.059600830078125, 0.06355094909667969, 0.06750106811523438, 0.07145118713378906, 0.07540130615234375, 0.07935142517089844, 0.08330154418945312, 0.08725166320800781, 0.0912017822265625, 0.09515190124511719, 0.09910202026367188, 0.10305213928222656, 0.10700225830078125, 0.11095237731933594, 0.11490249633789062, 0.11885261535644531, 0.122802734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 4.0, 5.0, 7.0, 10.0, 12.0, 15.0, 23.0, 22.0, 21.0, 30.0, 38.0, 29.0, 60.0, 68.0, 70.0, 73.0, 85.0, 74.0, 59.0, 55.0, 46.0, 24.0, 31.0, 20.0, 14.0, 14.0, 16.0, 12.0, 7.0, 6.0, 8.0, 5.0, 2.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.023651123046875, -0.022872447967529297, -0.022093772888183594, -0.02131509780883789, -0.020536422729492188, -0.019757747650146484, -0.01897907257080078, -0.018200397491455078, -0.017421722412109375, -0.016643047332763672, -0.01586437225341797, -0.015085697174072266, -0.014307022094726562, -0.01352834701538086, -0.012749671936035156, -0.011970996856689453, -0.01119232177734375, -0.010413646697998047, -0.009634971618652344, -0.00885629653930664, -0.008077621459960938, -0.007298946380615234, -0.006520271301269531, -0.005741596221923828, -0.004962921142578125, -0.004184246063232422, -0.0034055709838867188, -0.0026268959045410156, -0.0018482208251953125, -0.0010695457458496094, -0.00029087066650390625, 0.0004878044128417969, 0.0012664794921875, 0.002045154571533203, 0.0028238296508789062, 0.0036025047302246094, 0.0043811798095703125, 0.005159854888916016, 0.005938529968261719, 0.006717205047607422, 0.007495880126953125, 0.008274555206298828, 0.009053230285644531, 0.009831905364990234, 0.010610580444335938, 0.01138925552368164, 0.012167930603027344, 0.012946605682373047, 0.01372528076171875, 0.014503955841064453, 0.015282630920410156, 0.01606130599975586, 0.016839981079101562, 0.017618656158447266, 0.01839733123779297, 0.019176006317138672, 0.019954681396484375, 0.020733356475830078, 0.02151203155517578, 0.022290706634521484, 0.023069381713867188, 0.02384805679321289, 0.024626731872558594, 0.025405406951904297, 0.02618408203125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 10.0, 11.0, 27.0, 48.0, 118.0, 155.0, 203.0, 189.0, 119.0, 50.0, 37.0, 17.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.835117220878601, -1.7660796642303467, -1.6970419883728027, -1.6280044317245483, -1.558966875076294, -1.4899293184280396, -1.4208917617797852, -1.3518540859222412, -1.2828165292739868, -1.2137789726257324, -1.1447412967681885, -1.075703740119934, -1.0066661834716797, -0.9376286268234253, -0.8685910105705261, -0.799553394317627, -0.7305158376693726, -0.6614782810211182, -0.592440664768219, -0.5234030485153198, -0.45436549186706543, -0.38532790541648865, -0.31629031896591187, -0.24725273251533508, -0.1782151460647583, -0.10917755961418152, -0.040139973163604736, 0.028897613286972046, 0.09793519973754883, 0.1669727861881256, 0.2360103726387024, 0.3050479590892792, 0.3740856647491455, 0.4431232511997223, 0.5121608376502991, 0.5811984539031982, 0.6502360105514526, 0.719273567199707, 0.7883111834526062, 0.8573487997055054, 0.9263863563537598, 0.9954239130020142, 1.0644614696502686, 1.1334991455078125, 1.202536702156067, 1.2715742588043213, 1.3406119346618652, 1.4096494913101196, 1.478687047958374, 1.5477246046066284, 1.6167621612548828, 1.6857998371124268, 1.7548373937606812, 1.8238749504089355, 1.8929126262664795, 1.9619501829147339, 2.0309877395629883, 2.1000254154205322, 2.169062852859497, 2.238100528717041, 2.307137966156006, 2.37617564201355, 2.4452133178710938, 2.5142507553100586, 2.5832884311676025]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 13.0, 6.0, 5.0, 10.0, 22.0, 16.0, 25.0, 31.0, 34.0, 24.0, 40.0, 33.0, 50.0, 76.0, 50.0, 60.0, 63.0, 55.0, 64.0, 58.0, 46.0, 39.0, 33.0, 31.0, 23.0, 26.0, 18.0, 13.0, 13.0, 7.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.037756085395813, -1.0096657276153564, -0.9815753102302551, -0.9534849524497986, -0.9253945350646973, -0.8973041772842407, -0.8692138195037842, -0.8411234021186829, -0.8130329847335815, -0.784942626953125, -0.7568522095680237, -0.7287618517875671, -0.7006714344024658, -0.6725810766220093, -0.6444907188415527, -0.6164003014564514, -0.5883099436759949, -0.5602195858955383, -0.532129168510437, -0.5040388107299805, -0.47594839334487915, -0.4478580355644226, -0.4197676479816437, -0.39167726039886475, -0.3635868728160858, -0.3354964852333069, -0.30740609765052795, -0.279315710067749, -0.2512253522872925, -0.22313494980335236, -0.19504457712173462, -0.1669541895389557, -0.13886386156082153, -0.1107734739780426, -0.08268309384584427, -0.054592713713645935, -0.026502326130867004, 0.0015880614519119263, 0.029678434133529663, 0.057768821716308594, 0.08585920929908752, 0.11394959688186646, 0.14203998446464539, 0.17013035714626312, 0.19822074472904205, 0.22631113231182098, 0.2544015049934387, 0.28249189257621765, 0.3105822801589966, 0.3386726677417755, 0.36676305532455444, 0.394853413105011, 0.4229438304901123, 0.45103418827056885, 0.4791245758533478, 0.5072149634361267, 0.535305380821228, 0.5633957386016846, 0.5914861559867859, 0.6195765137672424, 0.6476669311523438, 0.6757572889328003, 0.7038476467132568, 0.7319380640983582, 0.7600284218788147]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 10.0, 14.0, 28.0, 42.0, 83.0, 211.0, 790.0, 3624.0, 35315.0, 850553.0, 148132.0, 7789.0, 1315.0, 351.0, 128.0, 46.0, 22.0, 19.0, 14.0, 7.0, 4.0, 6.0, 5.0, 3.0, 5.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.095703125, -2.020050048828125, -1.94439697265625, -1.868743896484375, -1.7930908203125, -1.717437744140625, -1.64178466796875, -1.566131591796875, -1.490478515625, -1.414825439453125, -1.33917236328125, -1.263519287109375, -1.1878662109375, -1.112213134765625, -1.03656005859375, -0.960906982421875, -0.88525390625, -0.809600830078125, -0.73394775390625, -0.658294677734375, -0.5826416015625, -0.506988525390625, -0.43133544921875, -0.355682373046875, -0.280029296875, -0.204376220703125, -0.12872314453125, -0.053070068359375, 0.0225830078125, 0.098236083984375, 0.17388916015625, 0.249542236328125, 0.3251953125, 0.400848388671875, 0.47650146484375, 0.552154541015625, 0.6278076171875, 0.703460693359375, 0.77911376953125, 0.854766845703125, 0.930419921875, 1.006072998046875, 1.08172607421875, 1.157379150390625, 1.2330322265625, 1.308685302734375, 1.38433837890625, 1.459991455078125, 1.53564453125, 1.611297607421875, 1.68695068359375, 1.762603759765625, 1.8382568359375, 1.913909912109375, 1.98956298828125, 2.065216064453125, 2.140869140625, 2.216522216796875, 2.29217529296875, 2.367828369140625, 2.4434814453125, 2.519134521484375, 2.59478759765625, 2.670440673828125, 2.74609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 8.0, 6.0, 9.0, 12.0, 15.0, 18.0, 22.0, 29.0, 34.0, 22.0, 23.0, 24.0, 32.0, 36.0, 45.0, 45.0, 60.0, 55.0, 48.0, 53.0, 39.0, 50.0, 33.0, 39.0, 37.0, 30.0, 32.0, 21.0, 22.0, 17.0, 16.0, 16.0, 11.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.5673828125, -1.521240234375, -1.47509765625, -1.428955078125, -1.3828125, -1.336669921875, -1.29052734375, -1.244384765625, -1.1982421875, -1.152099609375, -1.10595703125, -1.059814453125, -1.013671875, -0.967529296875, -0.92138671875, -0.875244140625, -0.8291015625, -0.782958984375, -0.73681640625, -0.690673828125, -0.64453125, -0.598388671875, -0.55224609375, -0.506103515625, -0.4599609375, -0.413818359375, -0.36767578125, -0.321533203125, -0.275390625, -0.229248046875, -0.18310546875, -0.136962890625, -0.0908203125, -0.044677734375, 0.00146484375, 0.047607421875, 0.09375, 0.139892578125, 0.18603515625, 0.232177734375, 0.2783203125, 0.324462890625, 0.37060546875, 0.416748046875, 0.462890625, 0.509033203125, 0.55517578125, 0.601318359375, 0.6474609375, 0.693603515625, 0.73974609375, 0.785888671875, 0.83203125, 0.878173828125, 0.92431640625, 0.970458984375, 1.0166015625, 1.062744140625, 1.10888671875, 1.155029296875, 1.201171875, 1.247314453125, 1.29345703125, 1.339599609375, 1.3857421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 16.0, 11.0, 14.0, 20.0, 26.0, 28.0, 46.0, 60.0, 85.0, 87.0, 132.0, 211.0, 508.0, 1835.0, 13731.0, 411623.0, 598001.0, 18616.0, 2147.0, 553.0, 262.0, 133.0, 108.0, 64.0, 58.0, 36.0, 27.0, 19.0, 24.0, 9.0, 12.0, 8.0, 9.0, 8.0, 9.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.814453125, -1.75408935546875, -1.6937255859375, -1.63336181640625, -1.572998046875, -1.51263427734375, -1.4522705078125, -1.39190673828125, -1.33154296875, -1.27117919921875, -1.2108154296875, -1.15045166015625, -1.090087890625, -1.02972412109375, -0.9693603515625, -0.90899658203125, -0.8486328125, -0.78826904296875, -0.7279052734375, -0.66754150390625, -0.607177734375, -0.54681396484375, -0.4864501953125, -0.42608642578125, -0.36572265625, -0.30535888671875, -0.2449951171875, -0.18463134765625, -0.124267578125, -0.06390380859375, -0.0035400390625, 0.05682373046875, 0.1171875, 0.17755126953125, 0.2379150390625, 0.29827880859375, 0.358642578125, 0.41900634765625, 0.4793701171875, 0.53973388671875, 0.60009765625, 0.66046142578125, 0.7208251953125, 0.78118896484375, 0.841552734375, 0.90191650390625, 0.9622802734375, 1.02264404296875, 1.0830078125, 1.14337158203125, 1.2037353515625, 1.26409912109375, 1.324462890625, 1.38482666015625, 1.4451904296875, 1.50555419921875, 1.56591796875, 1.62628173828125, 1.6866455078125, 1.74700927734375, 1.807373046875, 1.86773681640625, 1.9281005859375, 1.98846435546875, 2.048828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 4.0, 4.0, 5.0, 12.0, 18.0, 12.0, 20.0, 23.0, 21.0, 16.0, 32.0, 31.0, 34.0, 29.0, 28.0, 35.0, 31.0, 41.0, 51.0, 47.0, 51.0, 43.0, 40.0, 39.0, 28.0, 32.0, 37.0, 37.0, 27.0, 20.0, 33.0, 22.0, 10.0, 21.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.6669921875, -1.61627197265625, -1.5655517578125, -1.51483154296875, -1.464111328125, -1.41339111328125, -1.3626708984375, -1.31195068359375, -1.26123046875, -1.21051025390625, -1.1597900390625, -1.10906982421875, -1.058349609375, -1.00762939453125, -0.9569091796875, -0.90618896484375, -0.85546875, -0.80474853515625, -0.7540283203125, -0.70330810546875, -0.652587890625, -0.60186767578125, -0.5511474609375, -0.50042724609375, -0.44970703125, -0.39898681640625, -0.3482666015625, -0.29754638671875, -0.246826171875, -0.19610595703125, -0.1453857421875, -0.09466552734375, -0.0439453125, 0.00677490234375, 0.0574951171875, 0.10821533203125, 0.158935546875, 0.20965576171875, 0.2603759765625, 0.31109619140625, 0.36181640625, 0.41253662109375, 0.4632568359375, 0.51397705078125, 0.564697265625, 0.61541748046875, 0.6661376953125, 0.71685791015625, 0.767578125, 0.81829833984375, 0.8690185546875, 0.91973876953125, 0.970458984375, 1.02117919921875, 1.0718994140625, 1.12261962890625, 1.17333984375, 1.22406005859375, 1.2747802734375, 1.32550048828125, 1.376220703125, 1.42694091796875, 1.4776611328125, 1.52838134765625, 1.5791015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 13.0, 24.0, 28.0, 39.0, 51.0, 80.0, 199.0, 631.0, 2965.0, 34522.0, 824552.0, 174687.0, 8607.0, 1417.0, 364.0, 146.0, 77.0, 38.0, 40.0, 18.0, 13.0, 13.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.890625, -0.8670272827148438, -0.8434295654296875, -0.8198318481445312, -0.796234130859375, -0.7726364135742188, -0.7490386962890625, -0.7254409790039062, -0.70184326171875, -0.6782455444335938, -0.6546478271484375, -0.6310501098632812, -0.607452392578125, -0.5838546752929688, -0.5602569580078125, -0.5366592407226562, -0.5130615234375, -0.48946380615234375, -0.4658660888671875, -0.44226837158203125, -0.418670654296875, -0.39507293701171875, -0.3714752197265625, -0.34787750244140625, -0.32427978515625, -0.30068206787109375, -0.2770843505859375, -0.25348663330078125, -0.229888916015625, -0.20629119873046875, -0.1826934814453125, -0.15909576416015625, -0.135498046875, -0.11190032958984375, -0.0883026123046875, -0.06470489501953125, -0.041107177734375, -0.01750946044921875, 0.0060882568359375, 0.02968597412109375, 0.05328369140625, 0.07688140869140625, 0.1004791259765625, 0.12407684326171875, 0.147674560546875, 0.17127227783203125, 0.1948699951171875, 0.21846771240234375, 0.2420654296875, 0.26566314697265625, 0.2892608642578125, 0.31285858154296875, 0.336456298828125, 0.36005401611328125, 0.3836517333984375, 0.40724945068359375, 0.43084716796875, 0.45444488525390625, 0.4780426025390625, 0.5016403198242188, 0.525238037109375, 0.5488357543945312, 0.5724334716796875, 0.5960311889648438, 0.61962890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 6.0, 6.0, 10.0, 6.0, 20.0, 25.0, 21.0, 34.0, 40.0, 59.0, 94.0, 145.0, 136.0, 113.0, 77.0, 60.0, 52.0, 34.0, 17.0, 15.0, 12.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.641315460205078e-05, -7.456168532371521e-05, -7.271021604537964e-05, -7.085874676704407e-05, -6.90072774887085e-05, -6.715580821037292e-05, -6.530433893203735e-05, -6.345286965370178e-05, -6.160140037536621e-05, -5.974993109703064e-05, -5.789846181869507e-05, -5.60469925403595e-05, -5.4195523262023926e-05, -5.2344053983688354e-05, -5.049258470535278e-05, -4.864111542701721e-05, -4.678964614868164e-05, -4.493817687034607e-05, -4.30867075920105e-05, -4.123523831367493e-05, -3.9383769035339355e-05, -3.7532299757003784e-05, -3.568083047866821e-05, -3.382936120033264e-05, -3.197789192199707e-05, -3.01264226436615e-05, -2.8274953365325928e-05, -2.6423484086990356e-05, -2.4572014808654785e-05, -2.2720545530319214e-05, -2.0869076251983643e-05, -1.901760697364807e-05, -1.71661376953125e-05, -1.531466841697693e-05, -1.3463199138641357e-05, -1.1611729860305786e-05, -9.760260581970215e-06, -7.908791303634644e-06, -6.057322025299072e-06, -4.205852746963501e-06, -2.3543834686279297e-06, -5.029141902923584e-07, 1.3485550880432129e-06, 3.200024366378784e-06, 5.0514936447143555e-06, 6.902962923049927e-06, 8.754432201385498e-06, 1.060590147972107e-05, 1.245737075805664e-05, 1.4308840036392212e-05, 1.6160309314727783e-05, 1.8011778593063354e-05, 1.9863247871398926e-05, 2.1714717149734497e-05, 2.356618642807007e-05, 2.541765570640564e-05, 2.726912498474121e-05, 2.9120594263076782e-05, 3.0972063541412354e-05, 3.2823532819747925e-05, 3.4675002098083496e-05, 3.652647137641907e-05, 3.837794065475464e-05, 4.022940993309021e-05, 4.208087921142578e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 16.0, 18.0, 38.0, 68.0, 148.0, 519.0, 2393.0, 29650.0, 956959.0, 54623.0, 3137.0, 616.0, 174.0, 76.0, 41.0, 24.0, 11.0, 6.0, 7.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.248046875, -1.21087646484375, -1.1737060546875, -1.13653564453125, -1.099365234375, -1.06219482421875, -1.0250244140625, -0.98785400390625, -0.95068359375, -0.91351318359375, -0.8763427734375, -0.83917236328125, -0.802001953125, -0.76483154296875, -0.7276611328125, -0.69049072265625, -0.6533203125, -0.61614990234375, -0.5789794921875, -0.54180908203125, -0.504638671875, -0.46746826171875, -0.4302978515625, -0.39312744140625, -0.35595703125, -0.31878662109375, -0.2816162109375, -0.24444580078125, -0.207275390625, -0.17010498046875, -0.1329345703125, -0.09576416015625, -0.05859375, -0.02142333984375, 0.0157470703125, 0.05291748046875, 0.090087890625, 0.12725830078125, 0.1644287109375, 0.20159912109375, 0.23876953125, 0.27593994140625, 0.3131103515625, 0.35028076171875, 0.387451171875, 0.42462158203125, 0.4617919921875, 0.49896240234375, 0.5361328125, 0.57330322265625, 0.6104736328125, 0.64764404296875, 0.684814453125, 0.72198486328125, 0.7591552734375, 0.79632568359375, 0.83349609375, 0.87066650390625, 0.9078369140625, 0.94500732421875, 0.982177734375, 1.01934814453125, 1.0565185546875, 1.09368896484375, 1.130859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 13.0, 14.0, 25.0, 32.0, 56.0, 83.0, 108.0, 155.0, 147.0, 105.0, 72.0, 60.0, 34.0, 28.0, 16.0, 10.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2933216094970703, -0.2848854064941406, -0.27644920349121094, -0.26801300048828125, -0.25957679748535156, -0.2511405944824219, -0.2427043914794922, -0.2342681884765625, -0.2258319854736328, -0.21739578247070312, -0.20895957946777344, -0.20052337646484375, -0.19208717346191406, -0.18365097045898438, -0.1752147674560547, -0.166778564453125, -0.1583423614501953, -0.14990615844726562, -0.14146995544433594, -0.13303375244140625, -0.12459754943847656, -0.11616134643554688, -0.10772514343261719, -0.0992889404296875, -0.09085273742675781, -0.08241653442382812, -0.07398033142089844, -0.06554412841796875, -0.05710792541503906, -0.048671722412109375, -0.04023551940917969, -0.03179931640625, -0.023363113403320312, -0.014926910400390625, -0.0064907073974609375, 0.00194549560546875, 0.010381698608398438, 0.018817901611328125, 0.027254104614257812, 0.0356903076171875, 0.04412651062011719, 0.052562713623046875, 0.06099891662597656, 0.06943511962890625, 0.07787132263183594, 0.08630752563476562, 0.09474372863769531, 0.103179931640625, 0.11161613464355469, 0.12005233764648438, 0.12848854064941406, 0.13692474365234375, 0.14536094665527344, 0.15379714965820312, 0.1622333526611328, 0.1706695556640625, 0.1791057586669922, 0.18754196166992188, 0.19597816467285156, 0.20441436767578125, 0.21285057067871094, 0.22128677368164062, 0.2297229766845703, 0.2381591796875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 18.0, 54.0, 137.0, 258.0, 291.0, 156.0, 51.0, 18.0, 11.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.365645408630371, -8.156628608703613, -7.947612285614014, -7.738595485687256, -7.529579162597656, -7.320562362670898, -7.111545562744141, -6.902528762817383, -6.693512439727783, -6.484495639801025, -6.275479316711426, -6.066462516784668, -5.85744571685791, -5.6484293937683105, -5.439412593841553, -5.230396270751953, -5.021379470825195, -4.8123626708984375, -4.603346347808838, -4.39432954788208, -4.1853132247924805, -3.9762964248657227, -3.767279624938965, -3.558263063430786, -3.3492465019226074, -3.1402299404144287, -2.93121337890625, -2.722196578979492, -2.5131800174713135, -2.3041634559631348, -2.095146656036377, -1.8861300945281982, -1.6771130561828613, -1.4680964946746826, -1.2590798139572144, -1.050063133239746, -0.8410465717315674, -0.6320300102233887, -0.4230133295059204, -0.21399664878845215, -0.0049800872802734375, 0.20403653383255005, 0.41305315494537354, 0.622069776058197, 0.8310863971710205, 1.0401029586791992, 1.2491196393966675, 1.4581363201141357, 1.6671528816223145, 1.8761694431304932, 2.085186004638672, 2.2942028045654297, 2.5032193660736084, 2.712235927581787, 2.921252727508545, 3.1302692890167236, 3.3392858505249023, 3.548302412033081, 3.7573189735412598, 3.9663357734680176, 4.175352096557617, 4.384368896484375, 4.593385696411133, 4.802402496337891, 5.01141881942749]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 13.0, 8.0, 11.0, 23.0, 19.0, 26.0, 20.0, 29.0, 29.0, 35.0, 32.0, 36.0, 42.0, 43.0, 45.0, 43.0, 43.0, 47.0, 45.0, 53.0, 31.0, 33.0, 36.0, 39.0, 23.0, 32.0, 36.0, 18.0, 17.0, 18.0, 11.0, 15.0, 6.0, 12.0, 5.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1289632320404053, -3.033628225326538, -2.938293218612671, -2.8429582118988037, -2.7476232051849365, -2.6522881984710693, -2.556953191757202, -2.461618185043335, -2.3662831783294678, -2.2709481716156006, -2.1756131649017334, -2.080278158187866, -1.984943151473999, -1.8896081447601318, -1.7942731380462646, -1.6989381313323975, -1.6036030054092407, -1.5082679986953735, -1.4129329919815063, -1.3175979852676392, -1.222262978553772, -1.1269279718399048, -1.031592845916748, -0.9362578988075256, -0.8409228920936584, -0.7455878853797913, -0.6502528786659241, -0.5549178123474121, -0.4595828354358673, -0.3642478287220001, -0.26891279220581055, -0.17357778549194336, -0.07824277877807617, 0.017092235386371613, 0.1124272495508194, 0.20776227116584778, 0.30309727787971497, 0.39843228459358215, 0.49376732110977173, 0.5891023278236389, 0.6844373345375061, 0.7797723412513733, 0.8751073479652405, 0.9704424142837524, 1.0657774209976196, 1.1611124277114868, 1.256447434425354, 1.3517824411392212, 1.4471174478530884, 1.5424524545669556, 1.6377874612808228, 1.73312246799469, 1.8284574747085571, 1.9237924814224243, 2.019127607345581, 2.1144626140594482, 2.2097976207733154, 2.3051326274871826, 2.40046763420105, 2.495802640914917, 2.591137647628784, 2.6864726543426514, 2.7818076610565186, 2.8771426677703857, 2.972477674484253]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 10.0, 15.0, 42.0, 48.0, 81.0, 146.0, 275.0, 521.0, 1048.0, 2413.0, 7534.0, 42085.0, 603344.0, 3032732.0, 459641.0, 34150.0, 6372.0, 2027.0, 869.0, 404.0, 217.0, 94.0, 73.0, 46.0, 23.0, 21.0, 11.0, 13.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.716796875, -1.651885986328125, -1.58697509765625, -1.522064208984375, -1.4571533203125, -1.392242431640625, -1.32733154296875, -1.262420654296875, -1.197509765625, -1.132598876953125, -1.06768798828125, -1.002777099609375, -0.9378662109375, -0.872955322265625, -0.80804443359375, -0.743133544921875, -0.67822265625, -0.613311767578125, -0.54840087890625, -0.483489990234375, -0.4185791015625, -0.353668212890625, -0.28875732421875, -0.223846435546875, -0.158935546875, -0.094024658203125, -0.02911376953125, 0.035797119140625, 0.1007080078125, 0.165618896484375, 0.23052978515625, 0.295440673828125, 0.3603515625, 0.425262451171875, 0.49017333984375, 0.555084228515625, 0.6199951171875, 0.684906005859375, 0.74981689453125, 0.814727783203125, 0.879638671875, 0.944549560546875, 1.00946044921875, 1.074371337890625, 1.1392822265625, 1.204193115234375, 1.26910400390625, 1.334014892578125, 1.39892578125, 1.463836669921875, 1.52874755859375, 1.593658447265625, 1.6585693359375, 1.723480224609375, 1.78839111328125, 1.853302001953125, 1.918212890625, 1.983123779296875, 2.04803466796875, 2.112945556640625, 2.1778564453125, 2.242767333984375, 2.30767822265625, 2.372589111328125, 2.4375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 14.0, 23.0, 13.0, 18.0, 19.0, 31.0, 31.0, 34.0, 43.0, 47.0, 60.0, 52.0, 50.0, 68.0, 66.0, 53.0, 68.0, 51.0, 45.0, 47.0, 30.0, 31.0, 20.0, 23.0, 13.0, 9.0, 10.0, 12.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3408203125, -1.301055908203125, -1.26129150390625, -1.221527099609375, -1.1817626953125, -1.141998291015625, -1.10223388671875, -1.062469482421875, -1.022705078125, -0.982940673828125, -0.94317626953125, -0.903411865234375, -0.8636474609375, -0.823883056640625, -0.78411865234375, -0.744354248046875, -0.70458984375, -0.664825439453125, -0.62506103515625, -0.585296630859375, -0.5455322265625, -0.505767822265625, -0.46600341796875, -0.426239013671875, -0.386474609375, -0.346710205078125, -0.30694580078125, -0.267181396484375, -0.2274169921875, -0.187652587890625, -0.14788818359375, -0.108123779296875, -0.068359375, -0.028594970703125, 0.01116943359375, 0.050933837890625, 0.0906982421875, 0.130462646484375, 0.17022705078125, 0.209991455078125, 0.249755859375, 0.289520263671875, 0.32928466796875, 0.369049072265625, 0.4088134765625, 0.448577880859375, 0.48834228515625, 0.528106689453125, 0.56787109375, 0.607635498046875, 0.64739990234375, 0.687164306640625, 0.7269287109375, 0.766693115234375, 0.80645751953125, 0.846221923828125, 0.885986328125, 0.925750732421875, 0.96551513671875, 1.005279541015625, 1.0450439453125, 1.084808349609375, 1.12457275390625, 1.164337158203125, 1.2041015625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 16.0, 24.0, 42.0, 81.0, 208.0, 409.0, 1195.0, 6969.0, 346850.0, 3809063.0, 26044.0, 2306.0, 556.0, 243.0, 104.0, 61.0, 30.0, 24.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.05755615234375, -3.9354248046875, -3.81329345703125, -3.691162109375, -3.56903076171875, -3.4468994140625, -3.32476806640625, -3.20263671875, -3.08050537109375, -2.9583740234375, -2.83624267578125, -2.714111328125, -2.59197998046875, -2.4698486328125, -2.34771728515625, -2.2255859375, -2.10345458984375, -1.9813232421875, -1.85919189453125, -1.737060546875, -1.61492919921875, -1.4927978515625, -1.37066650390625, -1.24853515625, -1.12640380859375, -1.0042724609375, -0.88214111328125, -0.760009765625, -0.63787841796875, -0.5157470703125, -0.39361572265625, -0.271484375, -0.14935302734375, -0.0272216796875, 0.09490966796875, 0.217041015625, 0.33917236328125, 0.4613037109375, 0.58343505859375, 0.70556640625, 0.82769775390625, 0.9498291015625, 1.07196044921875, 1.194091796875, 1.31622314453125, 1.4383544921875, 1.56048583984375, 1.6826171875, 1.80474853515625, 1.9268798828125, 2.04901123046875, 2.171142578125, 2.29327392578125, 2.4154052734375, 2.53753662109375, 2.65966796875, 2.78179931640625, 2.9039306640625, 3.02606201171875, 3.148193359375, 3.27032470703125, 3.3924560546875, 3.51458740234375, 3.63671875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 15.0, 25.0, 24.0, 51.0, 71.0, 126.0, 217.0, 381.0, 680.0, 826.0, 656.0, 404.0, 220.0, 132.0, 86.0, 57.0, 32.0, 17.0, 9.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5451278686523438, -0.5253143310546875, -0.5055007934570312, -0.485687255859375, -0.46587371826171875, -0.4460601806640625, -0.42624664306640625, -0.40643310546875, -0.38661956787109375, -0.3668060302734375, -0.34699249267578125, -0.327178955078125, -0.30736541748046875, -0.2875518798828125, -0.26773834228515625, -0.2479248046875, -0.22811126708984375, -0.2082977294921875, -0.18848419189453125, -0.168670654296875, -0.14885711669921875, -0.1290435791015625, -0.10923004150390625, -0.08941650390625, -0.06960296630859375, -0.0497894287109375, -0.02997589111328125, -0.010162353515625, 0.00965118408203125, 0.0294647216796875, 0.04927825927734375, 0.069091796875, 0.08890533447265625, 0.1087188720703125, 0.12853240966796875, 0.148345947265625, 0.16815948486328125, 0.1879730224609375, 0.20778656005859375, 0.22760009765625, 0.24741363525390625, 0.2672271728515625, 0.28704071044921875, 0.306854248046875, 0.32666778564453125, 0.3464813232421875, 0.36629486083984375, 0.3861083984375, 0.40592193603515625, 0.4257354736328125, 0.44554901123046875, 0.465362548828125, 0.48517608642578125, 0.5049896240234375, 0.5248031616210938, 0.54461669921875, 0.5644302368164062, 0.5842437744140625, 0.6040573120117188, 0.623870849609375, 0.6436843872070312, 0.6634979248046875, 0.6833114624023438, 0.703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 4.0, 10.0, 11.0, 27.0, 38.0, 75.0, 73.0, 138.0, 144.0, 126.0, 101.0, 86.0, 52.0, 42.0, 34.0, 18.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.574204444885254, -1.499069094657898, -1.423933744430542, -1.348798394203186, -1.27366304397583, -1.1985276937484741, -1.1233923435211182, -1.0482571125030518, -0.973121702671051, -0.8979863524436951, -0.8228510022163391, -0.7477157115936279, -0.672580361366272, -0.597445011138916, -0.5223096609115601, -0.4471743106842041, -0.37203896045684814, -0.2969036102294922, -0.22176827490329742, -0.14663293957710266, -0.0714975893497467, 0.003637760877609253, 0.07877308130264282, 0.15390843152999878, 0.22904378175735474, 0.3041791319847107, 0.37931448221206665, 0.4544498026371002, 0.5295851230621338, 0.6047204732894897, 0.6798558235168457, 0.7549911737442017, 0.8301265239715576, 0.9052618741989136, 0.9803972244262695, 1.0555325746536255, 1.1306679248809814, 1.2058032751083374, 1.2809386253356934, 1.3560738563537598, 1.4312093257904053, 1.5063446760177612, 1.5814800262451172, 1.6566153764724731, 1.731750726699829, 1.806886076927185, 1.882021427154541, 1.9571566581726074, 2.032291889190674, 2.1074271202087402, 2.1825625896453857, 2.257697820663452, 2.3328332901000977, 2.407968521118164, 2.4831039905548096, 2.558239221572876, 2.6333746910095215, 2.708509922027588, 2.7836453914642334, 2.8587806224823, 2.9339160919189453, 3.0090513229370117, 3.0841867923736572, 3.1593220233917236, 3.234457492828369]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 2.0, 13.0, 12.0, 15.0, 25.0, 23.0, 30.0, 33.0, 27.0, 33.0, 42.0, 36.0, 42.0, 58.0, 47.0, 60.0, 54.0, 43.0, 41.0, 51.0, 40.0, 31.0, 43.0, 29.0, 27.0, 27.0, 17.0, 22.0, 10.0, 11.0, 11.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2736073732376099, -1.2385990619659424, -1.203590750694275, -1.1685824394226074, -1.1335740089416504, -1.098565697669983, -1.0635573863983154, -1.028549075126648, -0.9935407638549805, -0.958532452583313, -0.9235241413116455, -0.8885157704353333, -0.8535074591636658, -0.8184991478919983, -0.783490777015686, -0.7484824657440186, -0.7134741544723511, -0.6784658432006836, -0.6434575319290161, -0.6084491610527039, -0.5734408497810364, -0.5384325385093689, -0.5034241676330566, -0.46841585636138916, -0.4334075450897217, -0.3983992338180542, -0.36339089274406433, -0.32838255167007446, -0.293374240398407, -0.2583659291267395, -0.22335758805274963, -0.18834926187992096, -0.15334093570709229, -0.11833260953426361, -0.08332428336143494, -0.04831595718860626, -0.013307631015777588, 0.021700695157051086, 0.05670902132987976, 0.09171734750270844, 0.1267256736755371, 0.16173399984836578, 0.19674232602119446, 0.23175065219402313, 0.2667589783668518, 0.3017672896385193, 0.33677563071250916, 0.371783971786499, 0.4067922830581665, 0.441800594329834, 0.47680893540382385, 0.5118172764778137, 0.5468255877494812, 0.5818338990211487, 0.6168422698974609, 0.6518505811691284, 0.6868588924407959, 0.7218672037124634, 0.7568755149841309, 0.7918838858604431, 0.8268921971321106, 0.8619005084037781, 0.8969088792800903, 0.9319171905517578, 0.9669255018234253]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 9.0, 7.0, 10.0, 21.0, 18.0, 36.0, 74.0, 119.0, 212.0, 374.0, 795.0, 1699.0, 3885.0, 10781.0, 30640.0, 90802.0, 245411.0, 358604.0, 197549.0, 69636.0, 23447.0, 8360.0, 3301.0, 1352.0, 663.0, 294.0, 164.0, 116.0, 61.0, 39.0, 22.0, 18.0, 15.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.26708984375, -0.2601299285888672, -0.2531700134277344, -0.24621009826660156, -0.23925018310546875, -0.23229026794433594, -0.22533035278320312, -0.2183704376220703, -0.2114105224609375, -0.2044506072998047, -0.19749069213867188, -0.19053077697753906, -0.18357086181640625, -0.17661094665527344, -0.16965103149414062, -0.1626911163330078, -0.155731201171875, -0.1487712860107422, -0.14181137084960938, -0.13485145568847656, -0.12789154052734375, -0.12093162536621094, -0.11397171020507812, -0.10701179504394531, -0.1000518798828125, -0.09309196472167969, -0.08613204956054688, -0.07917213439941406, -0.07221221923828125, -0.06525230407714844, -0.058292388916015625, -0.05133247375488281, -0.04437255859375, -0.03741264343261719, -0.030452728271484375, -0.023492813110351562, -0.01653289794921875, -0.009572982788085938, -0.002613067626953125, 0.0043468475341796875, 0.0113067626953125, 0.018266677856445312, 0.025226593017578125, 0.03218650817871094, 0.03914642333984375, 0.04610633850097656, 0.053066253662109375, 0.06002616882324219, 0.066986083984375, 0.07394599914550781, 0.08090591430664062, 0.08786582946777344, 0.09482574462890625, 0.10178565979003906, 0.10874557495117188, 0.11570549011230469, 0.1226654052734375, 0.1296253204345703, 0.13658523559570312, 0.14354515075683594, 0.15050506591796875, 0.15746498107910156, 0.16442489624023438, 0.1713848114013672, 0.1783447265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 10.0, 7.0, 13.0, 10.0, 25.0, 28.0, 32.0, 36.0, 33.0, 38.0, 43.0, 46.0, 55.0, 60.0, 74.0, 64.0, 39.0, 54.0, 43.0, 51.0, 36.0, 42.0, 35.0, 30.0, 18.0, 25.0, 10.0, 6.0, 8.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93310546875, -0.9078521728515625, -0.882598876953125, -0.8573455810546875, -0.83209228515625, -0.8068389892578125, -0.781585693359375, -0.7563323974609375, -0.7310791015625, -0.7058258056640625, -0.680572509765625, -0.6553192138671875, -0.63006591796875, -0.6048126220703125, -0.579559326171875, -0.5543060302734375, -0.529052734375, -0.5037994384765625, -0.478546142578125, -0.4532928466796875, -0.42803955078125, -0.4027862548828125, -0.377532958984375, -0.3522796630859375, -0.3270263671875, -0.3017730712890625, -0.276519775390625, -0.2512664794921875, -0.22601318359375, -0.2007598876953125, -0.175506591796875, -0.1502532958984375, -0.125, -0.0997467041015625, -0.074493408203125, -0.0492401123046875, -0.02398681640625, 0.0012664794921875, 0.026519775390625, 0.0517730712890625, 0.0770263671875, 0.1022796630859375, 0.127532958984375, 0.1527862548828125, 0.17803955078125, 0.2032928466796875, 0.228546142578125, 0.2537994384765625, 0.279052734375, 0.3043060302734375, 0.329559326171875, 0.3548126220703125, 0.38006591796875, 0.4053192138671875, 0.430572509765625, 0.4558258056640625, 0.4810791015625, 0.5063323974609375, 0.531585693359375, 0.5568389892578125, 0.58209228515625, 0.6073455810546875, 0.632598876953125, 0.6578521728515625, 0.68310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 10.0, 9.0, 21.0, 27.0, 35.0, 59.0, 99.0, 209.0, 337.0, 701.0, 1724.0, 4308.0, 12131.0, 37749.0, 121506.0, 311234.0, 340939.0, 147548.0, 46318.0, 14671.0, 5238.0, 1973.0, 803.0, 398.0, 179.0, 117.0, 66.0, 39.0, 35.0, 19.0, 12.0, 12.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2587890625, -0.25141334533691406, -0.24403762817382812, -0.2366619110107422, -0.22928619384765625, -0.2219104766845703, -0.21453475952148438, -0.20715904235839844, -0.1997833251953125, -0.19240760803222656, -0.18503189086914062, -0.1776561737060547, -0.17028045654296875, -0.1629047393798828, -0.15552902221679688, -0.14815330505371094, -0.140777587890625, -0.13340187072753906, -0.12602615356445312, -0.11865043640136719, -0.11127471923828125, -0.10389900207519531, -0.09652328491210938, -0.08914756774902344, -0.0817718505859375, -0.07439613342285156, -0.06702041625976562, -0.05964469909667969, -0.05226898193359375, -0.04489326477050781, -0.037517547607421875, -0.030141830444335938, -0.02276611328125, -0.015390396118164062, -0.008014678955078125, -0.0006389617919921875, 0.00673675537109375, 0.014112472534179688, 0.021488189697265625, 0.028863906860351562, 0.0362396240234375, 0.04361534118652344, 0.050991058349609375, 0.05836677551269531, 0.06574249267578125, 0.07311820983886719, 0.08049392700195312, 0.08786964416503906, 0.095245361328125, 0.10262107849121094, 0.10999679565429688, 0.11737251281738281, 0.12474822998046875, 0.1321239471435547, 0.13949966430664062, 0.14687538146972656, 0.1542510986328125, 0.16162681579589844, 0.16900253295898438, 0.1763782501220703, 0.18375396728515625, 0.1911296844482422, 0.19850540161132812, 0.20588111877441406, 0.2132568359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 9.0, 4.0, 8.0, 6.0, 8.0, 14.0, 18.0, 19.0, 22.0, 27.0, 39.0, 39.0, 49.0, 45.0, 54.0, 45.0, 56.0, 71.0, 65.0, 57.0, 59.0, 40.0, 38.0, 41.0, 27.0, 25.0, 24.0, 22.0, 19.0, 11.0, 7.0, 13.0, 5.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46875, -1.4204864501953125, -1.372222900390625, -1.3239593505859375, -1.27569580078125, -1.2274322509765625, -1.179168701171875, -1.1309051513671875, -1.0826416015625, -1.0343780517578125, -0.986114501953125, -0.9378509521484375, -0.88958740234375, -0.8413238525390625, -0.793060302734375, -0.7447967529296875, -0.696533203125, -0.6482696533203125, -0.600006103515625, -0.5517425537109375, -0.50347900390625, -0.4552154541015625, -0.406951904296875, -0.3586883544921875, -0.3104248046875, -0.2621612548828125, -0.213897705078125, -0.1656341552734375, -0.11737060546875, -0.0691070556640625, -0.020843505859375, 0.0274200439453125, 0.07568359375, 0.1239471435546875, 0.172210693359375, 0.2204742431640625, 0.26873779296875, 0.3170013427734375, 0.365264892578125, 0.4135284423828125, 0.4617919921875, 0.5100555419921875, 0.558319091796875, 0.6065826416015625, 0.65484619140625, 0.7031097412109375, 0.751373291015625, 0.7996368408203125, 0.847900390625, 0.8961639404296875, 0.944427490234375, 0.9926910400390625, 1.04095458984375, 1.0892181396484375, 1.137481689453125, 1.1857452392578125, 1.2340087890625, 1.2822723388671875, 1.330535888671875, 1.3787994384765625, 1.42706298828125, 1.4753265380859375, 1.523590087890625, 1.5718536376953125, 1.6201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 20.0, 25.0, 39.0, 53.0, 106.0, 154.0, 261.0, 451.0, 748.0, 1588.0, 3637.0, 9953.0, 37178.0, 184400.0, 555542.0, 197927.0, 38968.0, 10310.0, 3676.0, 1588.0, 825.0, 432.0, 259.0, 149.0, 73.0, 60.0, 35.0, 18.0, 7.0, 6.0, 8.0, 8.0, 8.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12310791015625, -0.11943531036376953, -0.11576271057128906, -0.1120901107788086, -0.10841751098632812, -0.10474491119384766, -0.10107231140136719, -0.09739971160888672, -0.09372711181640625, -0.09005451202392578, -0.08638191223144531, -0.08270931243896484, -0.07903671264648438, -0.0753641128540039, -0.07169151306152344, -0.06801891326904297, -0.0643463134765625, -0.06067371368408203, -0.05700111389160156, -0.053328514099121094, -0.049655914306640625, -0.045983314514160156, -0.04231071472167969, -0.03863811492919922, -0.03496551513671875, -0.03129291534423828, -0.027620315551757812, -0.023947715759277344, -0.020275115966796875, -0.016602516174316406, -0.012929916381835938, -0.009257316589355469, -0.005584716796875, -0.0019121170043945312, 0.0017604827880859375, 0.005433082580566406, 0.009105682373046875, 0.012778282165527344, 0.016450881958007812, 0.02012348175048828, 0.02379608154296875, 0.02746868133544922, 0.031141281127929688, 0.034813880920410156, 0.038486480712890625, 0.042159080505371094, 0.04583168029785156, 0.04950428009033203, 0.0531768798828125, 0.05684947967529297, 0.06052207946777344, 0.0641946792602539, 0.06786727905273438, 0.07153987884521484, 0.07521247863769531, 0.07888507843017578, 0.08255767822265625, 0.08623027801513672, 0.08990287780761719, 0.09357547760009766, 0.09724807739257812, 0.1009206771850586, 0.10459327697753906, 0.10826587677001953, 0.1119384765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 2.0, 8.0, 15.0, 9.0, 22.0, 25.0, 35.0, 42.0, 58.0, 65.0, 98.0, 91.0, 106.0, 93.0, 79.0, 71.0, 46.0, 28.0, 33.0, 21.0, 13.0, 16.0, 5.0, 3.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4465065002441406e-05, -4.293769598007202e-05, -4.141032695770264e-05, -3.988295793533325e-05, -3.835558891296387e-05, -3.682821989059448e-05, -3.53008508682251e-05, -3.377348184585571e-05, -3.224611282348633e-05, -3.071874380111694e-05, -2.919137477874756e-05, -2.7664005756378174e-05, -2.613663673400879e-05, -2.4609267711639404e-05, -2.308189868927002e-05, -2.1554529666900635e-05, -2.002716064453125e-05, -1.8499791622161865e-05, -1.697242259979248e-05, -1.5445053577423096e-05, -1.3917684555053711e-05, -1.2390315532684326e-05, -1.0862946510314941e-05, -9.335577487945557e-06, -7.808208465576172e-06, -6.280839443206787e-06, -4.753470420837402e-06, -3.2261013984680176e-06, -1.6987323760986328e-06, -1.7136335372924805e-07, 1.3560056686401367e-06, 2.8833746910095215e-06, 4.410743713378906e-06, 5.938112735748291e-06, 7.465481758117676e-06, 8.99285078048706e-06, 1.0520219802856445e-05, 1.204758882522583e-05, 1.3574957847595215e-05, 1.51023268699646e-05, 1.6629695892333984e-05, 1.815706491470337e-05, 1.9684433937072754e-05, 2.121180295944214e-05, 2.2739171981811523e-05, 2.4266541004180908e-05, 2.5793910026550293e-05, 2.7321279048919678e-05, 2.8848648071289062e-05, 3.0376017093658447e-05, 3.190338611602783e-05, 3.343075513839722e-05, 3.49581241607666e-05, 3.6485493183135986e-05, 3.801286220550537e-05, 3.9540231227874756e-05, 4.106760025024414e-05, 4.2594969272613525e-05, 4.412233829498291e-05, 4.5649707317352295e-05, 4.717707633972168e-05, 4.8704445362091064e-05, 5.023181438446045e-05, 5.1759183406829834e-05, 5.328655242919922e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 11.0, 15.0, 24.0, 23.0, 42.0, 69.0, 112.0, 216.0, 532.0, 1243.0, 3903.0, 18000.0, 132391.0, 666785.0, 193021.0, 24324.0, 5017.0, 1494.0, 616.0, 276.0, 147.0, 86.0, 61.0, 35.0, 24.0, 13.0, 10.0, 10.0, 1.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.18140029907226562, -0.17615509033203125, -0.17090988159179688, -0.1656646728515625, -0.16041946411132812, -0.15517425537109375, -0.14992904663085938, -0.144683837890625, -0.13943862915039062, -0.13419342041015625, -0.12894821166992188, -0.1237030029296875, -0.11845779418945312, -0.11321258544921875, -0.10796737670898438, -0.10272216796875, -0.09747695922851562, -0.09223175048828125, -0.08698654174804688, -0.0817413330078125, -0.07649612426757812, -0.07125091552734375, -0.06600570678710938, -0.060760498046875, -0.055515289306640625, -0.05027008056640625, -0.045024871826171875, -0.0397796630859375, -0.034534454345703125, -0.02928924560546875, -0.024044036865234375, -0.018798828125, -0.013553619384765625, -0.00830841064453125, -0.003063201904296875, 0.0021820068359375, 0.007427215576171875, 0.01267242431640625, 0.017917633056640625, 0.023162841796875, 0.028408050537109375, 0.03365325927734375, 0.038898468017578125, 0.0441436767578125, 0.049388885498046875, 0.05463409423828125, 0.059879302978515625, 0.06512451171875, 0.07036972045898438, 0.07561492919921875, 0.08086013793945312, 0.0861053466796875, 0.09135055541992188, 0.09659576416015625, 0.10184097290039062, 0.107086181640625, 0.11233139038085938, 0.11757659912109375, 0.12282180786132812, 0.1280670166015625, 0.13331222534179688, 0.13855743408203125, 0.14380264282226562, 0.1490478515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 12.0, 21.0, 27.0, 30.0, 45.0, 45.0, 41.0, 69.0, 95.0, 89.0, 92.0, 87.0, 75.0, 66.0, 52.0, 38.0, 29.0, 21.0, 13.0, 9.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0287322998046875, -0.027670621871948242, -0.026608943939208984, -0.025547266006469727, -0.02448558807373047, -0.02342391014099121, -0.022362232208251953, -0.021300554275512695, -0.020238876342773438, -0.01917719841003418, -0.018115520477294922, -0.017053842544555664, -0.015992164611816406, -0.014930486679077148, -0.01386880874633789, -0.012807130813598633, -0.011745452880859375, -0.010683774948120117, -0.00962209701538086, -0.008560419082641602, -0.007498741149902344, -0.006437063217163086, -0.005375385284423828, -0.00431370735168457, -0.0032520294189453125, -0.0021903514862060547, -0.0011286735534667969, -6.699562072753906e-05, 0.0009946823120117188, 0.0020563602447509766, 0.0031180381774902344, 0.004179716110229492, 0.00524139404296875, 0.006303071975708008, 0.007364749908447266, 0.008426427841186523, 0.009488105773925781, 0.010549783706665039, 0.011611461639404297, 0.012673139572143555, 0.013734817504882812, 0.01479649543762207, 0.015858173370361328, 0.016919851303100586, 0.017981529235839844, 0.0190432071685791, 0.02010488510131836, 0.021166563034057617, 0.022228240966796875, 0.023289918899536133, 0.02435159683227539, 0.02541327476501465, 0.026474952697753906, 0.027536630630493164, 0.028598308563232422, 0.02965998649597168, 0.030721664428710938, 0.031783342361450195, 0.03284502029418945, 0.03390669822692871, 0.03496837615966797, 0.03603005409240723, 0.037091732025146484, 0.03815340995788574, 0.039215087890625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 3.0, 8.0, 16.0, 37.0, 101.0, 175.0, 219.0, 192.0, 117.0, 65.0, 40.0, 13.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3516031503677368, -1.2831087112426758, -1.2146141529083252, -1.1461195945739746, -1.0776251554489136, -1.0091307163238525, -0.940636157989502, -0.8721416592597961, -0.8036471605300903, -0.7351526618003845, -0.6666581630706787, -0.5981636643409729, -0.5296691656112671, -0.4611746668815613, -0.39268016815185547, -0.32418566942214966, -0.25569117069244385, -0.18719667196273804, -0.11870217323303223, -0.050207674503326416, 0.018286824226379395, 0.0867813229560852, 0.15527582168579102, 0.22377032041549683, 0.29226481914520264, 0.36075931787490845, 0.42925381660461426, 0.49774831533432007, 0.5662428140640259, 0.6347373127937317, 0.7032318115234375, 0.7717263102531433, 0.8402206897735596, 0.9087151885032654, 0.9772096872329712, 1.0457041263580322, 1.1141986846923828, 1.1826932430267334, 1.2511876821517944, 1.3196821212768555, 1.388176679611206, 1.4566712379455566, 1.5251656770706177, 1.5936601161956787, 1.6621546745300293, 1.7306492328643799, 1.799143671989441, 1.867638111114502, 1.9361326694488525, 2.004627227783203, 2.0731215476989746, 2.141616106033325, 2.210110664367676, 2.2786052227020264, 2.347099781036377, 2.4155941009521484, 2.484088659286499, 2.5525832176208496, 2.621077537536621, 2.6895720958709717, 2.7580666542053223, 2.826561212539673, 2.8950557708740234, 2.963550090789795, 3.0320446491241455]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 8.0, 10.0, 20.0, 27.0, 33.0, 31.0, 39.0, 38.0, 44.0, 39.0, 69.0, 54.0, 65.0, 63.0, 52.0, 69.0, 53.0, 45.0, 40.0, 34.0, 31.0, 28.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9385626316070557, -0.9130412936210632, -0.8875199556350708, -0.8619986176490784, -0.8364772796630859, -0.8109559416770935, -0.7854346036911011, -0.7599132657051086, -0.7343919277191162, -0.7088705897331238, -0.6833492517471313, -0.6578279137611389, -0.6323065757751465, -0.606785237789154, -0.5812638998031616, -0.5557425618171692, -0.5302212238311768, -0.5046998858451843, -0.4791785478591919, -0.45365720987319946, -0.42813587188720703, -0.4026145339012146, -0.37709319591522217, -0.35157185792922974, -0.32605046033859253, -0.3005291223526001, -0.27500778436660767, -0.24948644638061523, -0.2239651083946228, -0.19844375550746918, -0.17292241752147675, -0.14740107953548431, -0.12187975645065308, -0.09635841846466064, -0.07083708047866821, -0.045315735042095184, -0.019794397056102753, 0.005726948380470276, 0.031248286366462708, 0.05676962435245514, 0.08229096233844757, 0.10781230032444, 0.13333363831043243, 0.15885499119758606, 0.1843763291835785, 0.20989766716957092, 0.23541900515556335, 0.2609403431415558, 0.2864616811275482, 0.31198301911354065, 0.3375043570995331, 0.3630256950855255, 0.38854703307151794, 0.41406840085983276, 0.4395897388458252, 0.4651110768318176, 0.49063241481781006, 0.5161537528038025, 0.5416750907897949, 0.5671964287757874, 0.5927177667617798, 0.6182391047477722, 0.6437604427337646, 0.6692817807197571, 0.6948031187057495]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 11.0, 6.0, 9.0, 21.0, 26.0, 46.0, 57.0, 106.0, 117.0, 221.0, 390.0, 611.0, 1133.0, 2224.0, 4486.0, 10048.0, 24317.0, 67418.0, 255531.0, 477177.0, 133454.0, 40797.0, 16211.0, 7103.0, 3295.0, 1665.0, 842.0, 465.0, 258.0, 185.0, 96.0, 76.0, 54.0, 29.0, 14.0, 16.0, 15.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.60595703125, -0.5877456665039062, -0.5695343017578125, -0.5513229370117188, -0.533111572265625, -0.5149002075195312, -0.4966888427734375, -0.47847747802734375, -0.46026611328125, -0.44205474853515625, -0.4238433837890625, -0.40563201904296875, -0.387420654296875, -0.36920928955078125, -0.3509979248046875, -0.33278656005859375, -0.3145751953125, -0.29636383056640625, -0.2781524658203125, -0.25994110107421875, -0.241729736328125, -0.22351837158203125, -0.2053070068359375, -0.18709564208984375, -0.16888427734375, -0.15067291259765625, -0.1324615478515625, -0.11425018310546875, -0.096038818359375, -0.07782745361328125, -0.0596160888671875, -0.04140472412109375, -0.023193359375, -0.00498199462890625, 0.0132293701171875, 0.03144073486328125, 0.049652099609375, 0.06786346435546875, 0.0860748291015625, 0.10428619384765625, 0.12249755859375, 0.14070892333984375, 0.1589202880859375, 0.17713165283203125, 0.195343017578125, 0.21355438232421875, 0.2317657470703125, 0.24997711181640625, 0.2681884765625, 0.28639984130859375, 0.3046112060546875, 0.32282257080078125, 0.341033935546875, 0.35924530029296875, 0.3774566650390625, 0.39566802978515625, 0.41387939453125, 0.43209075927734375, 0.4503021240234375, 0.46851348876953125, 0.486724853515625, 0.5049362182617188, 0.5231475830078125, 0.5413589477539062, 0.5595703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 9.0, 3.0, 7.0, 7.0, 12.0, 14.0, 15.0, 27.0, 20.0, 31.0, 23.0, 34.0, 31.0, 37.0, 40.0, 40.0, 45.0, 59.0, 55.0, 59.0, 39.0, 49.0, 40.0, 50.0, 35.0, 30.0, 35.0, 21.0, 21.0, 20.0, 19.0, 18.0, 11.0, 9.0, 5.0, 5.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.5322265625, -1.486724853515625, -1.44122314453125, -1.395721435546875, -1.3502197265625, -1.304718017578125, -1.25921630859375, -1.213714599609375, -1.168212890625, -1.122711181640625, -1.07720947265625, -1.031707763671875, -0.9862060546875, -0.940704345703125, -0.89520263671875, -0.849700927734375, -0.80419921875, -0.758697509765625, -0.71319580078125, -0.667694091796875, -0.6221923828125, -0.576690673828125, -0.53118896484375, -0.485687255859375, -0.440185546875, -0.394683837890625, -0.34918212890625, -0.303680419921875, -0.2581787109375, -0.212677001953125, -0.16717529296875, -0.121673583984375, -0.076171875, -0.030670166015625, 0.01483154296875, 0.060333251953125, 0.1058349609375, 0.151336669921875, 0.19683837890625, 0.242340087890625, 0.287841796875, 0.333343505859375, 0.37884521484375, 0.424346923828125, 0.4698486328125, 0.515350341796875, 0.56085205078125, 0.606353759765625, 0.65185546875, 0.697357177734375, 0.74285888671875, 0.788360595703125, 0.8338623046875, 0.879364013671875, 0.92486572265625, 0.970367431640625, 1.015869140625, 1.061370849609375, 1.10687255859375, 1.152374267578125, 1.1978759765625, 1.243377685546875, 1.28887939453125, 1.334381103515625, 1.3798828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 7.0, 9.0, 6.0, 17.0, 12.0, 26.0, 26.0, 46.0, 64.0, 119.0, 135.0, 260.0, 464.0, 1607.0, 12451.0, 364382.0, 646971.0, 18571.0, 2064.0, 563.0, 256.0, 149.0, 106.0, 71.0, 42.0, 30.0, 22.0, 15.0, 14.0, 11.0, 6.0, 2.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.62109375, -1.56121826171875, -1.5013427734375, -1.44146728515625, -1.381591796875, -1.32171630859375, -1.2618408203125, -1.20196533203125, -1.14208984375, -1.08221435546875, -1.0223388671875, -0.96246337890625, -0.902587890625, -0.84271240234375, -0.7828369140625, -0.72296142578125, -0.6630859375, -0.60321044921875, -0.5433349609375, -0.48345947265625, -0.423583984375, -0.36370849609375, -0.3038330078125, -0.24395751953125, -0.18408203125, -0.12420654296875, -0.0643310546875, -0.00445556640625, 0.055419921875, 0.11529541015625, 0.1751708984375, 0.23504638671875, 0.294921875, 0.35479736328125, 0.4146728515625, 0.47454833984375, 0.534423828125, 0.59429931640625, 0.6541748046875, 0.71405029296875, 0.77392578125, 0.83380126953125, 0.8936767578125, 0.95355224609375, 1.013427734375, 1.07330322265625, 1.1331787109375, 1.19305419921875, 1.2529296875, 1.31280517578125, 1.3726806640625, 1.43255615234375, 1.492431640625, 1.55230712890625, 1.6121826171875, 1.67205810546875, 1.73193359375, 1.79180908203125, 1.8516845703125, 1.91156005859375, 1.971435546875, 2.03131103515625, 2.0911865234375, 2.15106201171875, 2.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 6.0, 12.0, 10.0, 13.0, 12.0, 15.0, 18.0, 23.0, 22.0, 31.0, 22.0, 29.0, 43.0, 40.0, 42.0, 59.0, 55.0, 46.0, 39.0, 44.0, 51.0, 34.0, 33.0, 36.0, 43.0, 32.0, 24.0, 23.0, 19.0, 19.0, 21.0, 19.0, 11.0, 11.0, 10.0, 2.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.615234375, -1.561126708984375, -1.50701904296875, -1.452911376953125, -1.3988037109375, -1.344696044921875, -1.29058837890625, -1.236480712890625, -1.182373046875, -1.128265380859375, -1.07415771484375, -1.020050048828125, -0.9659423828125, -0.911834716796875, -0.85772705078125, -0.803619384765625, -0.74951171875, -0.695404052734375, -0.64129638671875, -0.587188720703125, -0.5330810546875, -0.478973388671875, -0.42486572265625, -0.370758056640625, -0.316650390625, -0.262542724609375, -0.20843505859375, -0.154327392578125, -0.1002197265625, -0.046112060546875, 0.00799560546875, 0.062103271484375, 0.1162109375, 0.170318603515625, 0.22442626953125, 0.278533935546875, 0.3326416015625, 0.386749267578125, 0.44085693359375, 0.494964599609375, 0.549072265625, 0.603179931640625, 0.65728759765625, 0.711395263671875, 0.7655029296875, 0.819610595703125, 0.87371826171875, 0.927825927734375, 0.98193359375, 1.036041259765625, 1.09014892578125, 1.144256591796875, 1.1983642578125, 1.252471923828125, 1.30657958984375, 1.360687255859375, 1.414794921875, 1.468902587890625, 1.52301025390625, 1.577117919921875, 1.6312255859375, 1.685333251953125, 1.73944091796875, 1.793548583984375, 1.84765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 3.0, 3.0, 7.0, 18.0, 16.0, 18.0, 26.0, 27.0, 54.0, 108.0, 176.0, 462.0, 1812.0, 15365.0, 677427.0, 341157.0, 9635.0, 1377.0, 397.0, 156.0, 82.0, 57.0, 44.0, 25.0, 24.0, 22.0, 9.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.59033203125, -0.5738945007324219, -0.5574569702148438, -0.5410194396972656, -0.5245819091796875, -0.5081443786621094, -0.49170684814453125, -0.4752693176269531, -0.458831787109375, -0.4423942565917969, -0.42595672607421875, -0.4095191955566406, -0.3930816650390625, -0.3766441345214844, -0.36020660400390625, -0.3437690734863281, -0.32733154296875, -0.3108940124511719, -0.29445648193359375, -0.2780189514160156, -0.2615814208984375, -0.24514389038085938, -0.22870635986328125, -0.21226882934570312, -0.195831298828125, -0.17939376831054688, -0.16295623779296875, -0.14651870727539062, -0.1300811767578125, -0.11364364624023438, -0.09720611572265625, -0.08076858520507812, -0.0643310546875, -0.047893524169921875, -0.03145599365234375, -0.015018463134765625, 0.0014190673828125, 0.017856597900390625, 0.03429412841796875, 0.050731658935546875, 0.067169189453125, 0.08360671997070312, 0.10004425048828125, 0.11648178100585938, 0.1329193115234375, 0.14935684204101562, 0.16579437255859375, 0.18223190307617188, 0.19866943359375, 0.21510696411132812, 0.23154449462890625, 0.24798202514648438, 0.2644195556640625, 0.2808570861816406, 0.29729461669921875, 0.3137321472167969, 0.330169677734375, 0.3466072082519531, 0.36304473876953125, 0.3794822692871094, 0.3959197998046875, 0.4123573303222656, 0.42879486083984375, 0.4452323913574219, 0.461669921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 10.0, 9.0, 11.0, 21.0, 45.0, 47.0, 59.0, 86.0, 112.0, 109.0, 127.0, 98.0, 65.0, 43.0, 44.0, 29.0, 26.0, 20.0, 9.0, 7.0, 4.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8683414459228516e-05, -3.753788769245148e-05, -3.639236092567444e-05, -3.52468341588974e-05, -3.410130739212036e-05, -3.295578062534332e-05, -3.1810253858566284e-05, -3.0664727091789246e-05, -2.9519200325012207e-05, -2.837367355823517e-05, -2.722814679145813e-05, -2.608262002468109e-05, -2.4937093257904053e-05, -2.3791566491127014e-05, -2.2646039724349976e-05, -2.1500512957572937e-05, -2.03549861907959e-05, -1.920945942401886e-05, -1.806393265724182e-05, -1.6918405890464783e-05, -1.5772879123687744e-05, -1.4627352356910706e-05, -1.3481825590133667e-05, -1.2336298823356628e-05, -1.119077205657959e-05, -1.0045245289802551e-05, -8.899718523025513e-06, -7.754191756248474e-06, -6.6086649894714355e-06, -5.463138222694397e-06, -4.317611455917358e-06, -3.17208468914032e-06, -2.0265579223632812e-06, -8.810311555862427e-07, 2.644956111907959e-07, 1.4100223779678345e-06, 2.555549144744873e-06, 3.7010759115219116e-06, 4.84660267829895e-06, 5.992129445075989e-06, 7.137656211853027e-06, 8.283182978630066e-06, 9.428709745407104e-06, 1.0574236512184143e-05, 1.1719763278961182e-05, 1.286529004573822e-05, 1.4010816812515259e-05, 1.5156343579292297e-05, 1.6301870346069336e-05, 1.7447397112846375e-05, 1.8592923879623413e-05, 1.973845064640045e-05, 2.088397741317749e-05, 2.202950417995453e-05, 2.3175030946731567e-05, 2.4320557713508606e-05, 2.5466084480285645e-05, 2.6611611247062683e-05, 2.775713801383972e-05, 2.890266478061676e-05, 3.00481915473938e-05, 3.119371831417084e-05, 3.2339245080947876e-05, 3.3484771847724915e-05, 3.463029861450195e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 17.0, 17.0, 15.0, 32.0, 63.0, 158.0, 415.0, 1381.0, 8902.0, 829098.0, 202228.0, 4595.0, 1029.0, 320.0, 126.0, 56.0, 24.0, 25.0, 17.0, 7.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8427734375, -0.8171310424804688, -0.7914886474609375, -0.7658462524414062, -0.740203857421875, -0.7145614624023438, -0.6889190673828125, -0.6632766723632812, -0.63763427734375, -0.6119918823242188, -0.5863494873046875, -0.5607070922851562, -0.535064697265625, -0.5094223022460938, -0.4837799072265625, -0.45813751220703125, -0.4324951171875, -0.40685272216796875, -0.3812103271484375, -0.35556793212890625, -0.329925537109375, -0.30428314208984375, -0.2786407470703125, -0.25299835205078125, -0.22735595703125, -0.20171356201171875, -0.1760711669921875, -0.15042877197265625, -0.124786376953125, -0.09914398193359375, -0.0735015869140625, -0.04785919189453125, -0.022216796875, 0.00342559814453125, 0.0290679931640625, 0.05471038818359375, 0.080352783203125, 0.10599517822265625, 0.1316375732421875, 0.15727996826171875, 0.18292236328125, 0.20856475830078125, 0.2342071533203125, 0.25984954833984375, 0.285491943359375, 0.31113433837890625, 0.3367767333984375, 0.36241912841796875, 0.3880615234375, 0.41370391845703125, 0.4393463134765625, 0.46498870849609375, 0.490631103515625, 0.5162734985351562, 0.5419158935546875, 0.5675582885742188, 0.59320068359375, 0.6188430786132812, 0.6444854736328125, 0.6701278686523438, 0.695770263671875, 0.7214126586914062, 0.7470550537109375, 0.7726974487304688, 0.79833984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 12.0, 16.0, 24.0, 38.0, 64.0, 90.0, 142.0, 194.0, 157.0, 97.0, 58.0, 33.0, 21.0, 16.0, 9.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.203125, -0.19647598266601562, -0.18982696533203125, -0.18317794799804688, -0.1765289306640625, -0.16987991333007812, -0.16323089599609375, -0.15658187866210938, -0.149932861328125, -0.14328384399414062, -0.13663482666015625, -0.12998580932617188, -0.1233367919921875, -0.11668777465820312, -0.11003875732421875, -0.10338973999023438, -0.09674072265625, -0.09009170532226562, -0.08344268798828125, -0.07679367065429688, -0.0701446533203125, -0.06349563598632812, -0.05684661865234375, -0.050197601318359375, -0.043548583984375, -0.036899566650390625, -0.03025054931640625, -0.023601531982421875, -0.0169525146484375, -0.010303497314453125, -0.00365447998046875, 0.002994537353515625, 0.0096435546875, 0.016292572021484375, 0.02294158935546875, 0.029590606689453125, 0.0362396240234375, 0.042888641357421875, 0.04953765869140625, 0.056186676025390625, 0.062835693359375, 0.06948471069335938, 0.07613372802734375, 0.08278274536132812, 0.0894317626953125, 0.09608078002929688, 0.10272979736328125, 0.10937881469726562, 0.11602783203125, 0.12267684936523438, 0.12932586669921875, 0.13597488403320312, 0.1426239013671875, 0.14927291870117188, 0.15592193603515625, 0.16257095336914062, 0.169219970703125, 0.17586898803710938, 0.18251800537109375, 0.18916702270507812, 0.1958160400390625, 0.20246505737304688, 0.20911407470703125, 0.21576309204101562, 0.222412109375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 10.0, 34.0, 81.0, 151.0, 222.0, 221.0, 124.0, 79.0, 42.0, 21.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.671441078186035, -2.530933380126953, -2.39042592048645, -2.249918222427368, -2.1094107627868652, -1.9689030647277832, -1.8283953666687012, -1.6878877878189087, -1.5473802089691162, -1.4068726301193237, -1.2663650512695312, -1.1258573532104492, -0.9853497743606567, -0.8448421955108643, -0.704334557056427, -0.5638269186019897, -0.42331933975219727, -0.2828117311000824, -0.14230412244796753, -0.0017965137958526611, 0.1387110948562622, 0.2792186737060547, 0.41972631216049194, 0.5602339506149292, 0.7007415294647217, 0.8412491083145142, 0.9817567467689514, 1.1222643852233887, 1.2627719640731812, 1.4032795429229736, 1.5437872409820557, 1.6842948198318481, 1.8248019218444824, 1.965309500694275, 2.1058170795440674, 2.2463247776031494, 2.3868322372436523, 2.5273399353027344, 2.6678476333618164, 2.8083553314208984, 2.9488627910614014, 3.0893704891204834, 3.2298779487609863, 3.3703856468200684, 3.5108933448791504, 3.6514008045196533, 3.7919085025787354, 3.9324159622192383, 4.07292366027832, 4.213431358337402, 4.353939056396484, 4.494446277618408, 4.63495397567749, 4.775461673736572, 4.915969371795654, 5.056477069854736, 5.19698429107666, 5.337491989135742, 5.477999687194824, 5.618506908416748, 5.75901460647583, 5.899522304534912, 6.040030002593994, 6.180537700653076, 6.321045398712158]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 9.0, 3.0, 6.0, 7.0, 9.0, 18.0, 13.0, 18.0, 28.0, 23.0, 32.0, 25.0, 26.0, 36.0, 32.0, 33.0, 43.0, 40.0, 41.0, 46.0, 53.0, 47.0, 38.0, 44.0, 39.0, 43.0, 34.0, 24.0, 26.0, 22.0, 22.0, 15.0, 21.0, 13.0, 12.0, 9.0, 8.0, 8.0, 3.0, 9.0, 3.0, 6.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8508780002593994, -2.759235382080078, -2.667592763900757, -2.5759501457214355, -2.4843077659606934, -2.392665147781372, -2.301022529602051, -2.2093799114227295, -2.117737293243408, -2.026094675064087, -1.9344521760940552, -1.8428095579147339, -1.7511669397354126, -1.6595244407653809, -1.5678818225860596, -1.4762392044067383, -1.3845967054367065, -1.2929540872573853, -1.2013115882873535, -1.1096689701080322, -1.018026351928711, -0.9263837933540344, -0.8347412347793579, -0.7430986166000366, -0.6514560580253601, -0.5598134994506836, -0.4681708812713623, -0.3765283226966858, -0.2848857343196869, -0.193243145942688, -0.10160058736801147, -0.009957969188690186, 0.08168458938598633, 0.17332717776298523, 0.26496976613998413, 0.35661232471466064, 0.44825491309165955, 0.5398975014686584, 0.631540060043335, 0.7231826782226562, 0.8148252367973328, 0.9064677953720093, 0.9981104135513306, 1.0897529125213623, 1.1813955307006836, 1.2730381488800049, 1.3646807670593262, 1.4563233852386475, 1.5479658842086792, 1.6396085023880005, 1.7312510013580322, 1.8228936195373535, 1.9145362377166748, 2.006178855895996, 2.0978212356567383, 2.1894640922546387, 2.281106472015381, 2.372749090194702, 2.4643917083740234, 2.5560340881347656, 2.647676706314087, 2.739319324493408, 2.8309619426727295, 2.922604560852051, 3.014247179031372]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 5.0, 11.0, 16.0, 22.0, 41.0, 106.0, 151.0, 299.0, 639.0, 1510.0, 3647.0, 11801.0, 62110.0, 625145.0, 2742240.0, 662564.0, 63847.0, 13452.0, 3889.0, 1493.0, 620.0, 310.0, 167.0, 77.0, 53.0, 28.0, 14.0, 6.0, 4.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8642578125, -1.8145599365234375, -1.764862060546875, -1.7151641845703125, -1.66546630859375, -1.6157684326171875, -1.566070556640625, -1.5163726806640625, -1.4666748046875, -1.4169769287109375, -1.367279052734375, -1.3175811767578125, -1.26788330078125, -1.2181854248046875, -1.168487548828125, -1.1187896728515625, -1.069091796875, -1.0193939208984375, -0.969696044921875, -0.9199981689453125, -0.87030029296875, -0.8206024169921875, -0.770904541015625, -0.7212066650390625, -0.6715087890625, -0.6218109130859375, -0.572113037109375, -0.5224151611328125, -0.47271728515625, -0.4230194091796875, -0.373321533203125, -0.3236236572265625, -0.27392578125, -0.2242279052734375, -0.174530029296875, -0.1248321533203125, -0.07513427734375, -0.0254364013671875, 0.024261474609375, 0.0739593505859375, 0.1236572265625, 0.1733551025390625, 0.223052978515625, 0.2727508544921875, 0.32244873046875, 0.3721466064453125, 0.421844482421875, 0.4715423583984375, 0.521240234375, 0.5709381103515625, 0.620635986328125, 0.6703338623046875, 0.72003173828125, 0.7697296142578125, 0.819427490234375, 0.8691253662109375, 0.9188232421875, 0.9685211181640625, 1.018218994140625, 1.0679168701171875, 1.11761474609375, 1.1673126220703125, 1.217010498046875, 1.2667083740234375, 1.31640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 10.0, 32.0, 18.0, 29.0, 42.0, 39.0, 50.0, 63.0, 51.0, 59.0, 64.0, 65.0, 67.0, 50.0, 54.0, 43.0, 39.0, 42.0, 36.0, 32.0, 15.0, 18.0, 8.0, 12.0, 9.0, 1.0, 6.0, 5.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.286529541015625, -1.24981689453125, -1.213104248046875, -1.1763916015625, -1.139678955078125, -1.10296630859375, -1.066253662109375, -1.029541015625, -0.992828369140625, -0.95611572265625, -0.919403076171875, -0.8826904296875, -0.845977783203125, -0.80926513671875, -0.772552490234375, -0.73583984375, -0.699127197265625, -0.66241455078125, -0.625701904296875, -0.5889892578125, -0.552276611328125, -0.51556396484375, -0.478851318359375, -0.442138671875, -0.405426025390625, -0.36871337890625, -0.332000732421875, -0.2952880859375, -0.258575439453125, -0.22186279296875, -0.185150146484375, -0.1484375, -0.111724853515625, -0.07501220703125, -0.038299560546875, -0.0015869140625, 0.035125732421875, 0.07183837890625, 0.108551025390625, 0.145263671875, 0.181976318359375, 0.21868896484375, 0.255401611328125, 0.2921142578125, 0.328826904296875, 0.36553955078125, 0.402252197265625, 0.43896484375, 0.475677490234375, 0.51239013671875, 0.549102783203125, 0.5858154296875, 0.622528076171875, 0.65924072265625, 0.695953369140625, 0.732666015625, 0.769378662109375, 0.80609130859375, 0.842803955078125, 0.8795166015625, 0.916229248046875, 0.95294189453125, 0.989654541015625, 1.0263671875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 15.0, 23.0, 19.0, 29.0, 81.0, 135.0, 346.0, 1089.0, 5740.0, 197996.0, 3950880.0, 34201.0, 2573.0, 680.0, 244.0, 97.0, 59.0, 30.0, 11.0, 4.0, 1.0, 12.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.972320556640625, -4.85479736328125, -4.737274169921875, -4.6197509765625, -4.502227783203125, -4.38470458984375, -4.267181396484375, -4.149658203125, -4.032135009765625, -3.91461181640625, -3.797088623046875, -3.6795654296875, -3.562042236328125, -3.44451904296875, -3.326995849609375, -3.20947265625, -3.091949462890625, -2.97442626953125, -2.856903076171875, -2.7393798828125, -2.621856689453125, -2.50433349609375, -2.386810302734375, -2.269287109375, -2.151763916015625, -2.03424072265625, -1.916717529296875, -1.7991943359375, -1.681671142578125, -1.56414794921875, -1.446624755859375, -1.3291015625, -1.211578369140625, -1.09405517578125, -0.976531982421875, -0.8590087890625, -0.741485595703125, -0.62396240234375, -0.506439208984375, -0.388916015625, -0.271392822265625, -0.15386962890625, -0.036346435546875, 0.0811767578125, 0.198699951171875, 0.31622314453125, 0.433746337890625, 0.55126953125, 0.668792724609375, 0.78631591796875, 0.903839111328125, 1.0213623046875, 1.138885498046875, 1.25640869140625, 1.373931884765625, 1.491455078125, 1.608978271484375, 1.72650146484375, 1.844024658203125, 1.9615478515625, 2.079071044921875, 2.19659423828125, 2.314117431640625, 2.431640625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 7.0, 10.0, 11.0, 14.0, 33.0, 49.0, 85.0, 164.0, 348.0, 628.0, 924.0, 848.0, 436.0, 216.0, 124.0, 62.0, 43.0, 29.0, 14.0, 9.0, 9.0, 3.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421875, -0.4005584716796875, -0.379241943359375, -0.3579254150390625, -0.33660888671875, -0.3152923583984375, -0.293975830078125, -0.2726593017578125, -0.2513427734375, -0.2300262451171875, -0.208709716796875, -0.1873931884765625, -0.16607666015625, -0.1447601318359375, -0.123443603515625, -0.1021270751953125, -0.080810546875, -0.0594940185546875, -0.038177490234375, -0.0168609619140625, 0.00445556640625, 0.0257720947265625, 0.047088623046875, 0.0684051513671875, 0.0897216796875, 0.1110382080078125, 0.132354736328125, 0.1536712646484375, 0.17498779296875, 0.1963043212890625, 0.217620849609375, 0.2389373779296875, 0.26025390625, 0.2815704345703125, 0.302886962890625, 0.3242034912109375, 0.34552001953125, 0.3668365478515625, 0.388153076171875, 0.4094696044921875, 0.4307861328125, 0.4521026611328125, 0.473419189453125, 0.4947357177734375, 0.51605224609375, 0.5373687744140625, 0.558685302734375, 0.5800018310546875, 0.601318359375, 0.6226348876953125, 0.643951416015625, 0.6652679443359375, 0.68658447265625, 0.7079010009765625, 0.729217529296875, 0.7505340576171875, 0.7718505859375, 0.7931671142578125, 0.814483642578125, 0.8358001708984375, 0.85711669921875, 0.8784332275390625, 0.899749755859375, 0.9210662841796875, 0.9423828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 10.0, 12.0, 21.0, 26.0, 34.0, 32.0, 65.0, 66.0, 83.0, 92.0, 91.0, 78.0, 87.0, 71.0, 66.0, 48.0, 34.0, 22.0, 21.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3673738241195679, -1.3176974058151245, -1.2680209875106812, -1.2183445692062378, -1.1686680316925049, -1.1189916133880615, -1.0693151950836182, -1.0196387767791748, -0.9699623584747314, -0.9202859401702881, -0.8706095218658447, -0.8209330439567566, -0.7712566256523132, -0.7215802073478699, -0.6719037294387817, -0.6222273111343384, -0.572550892829895, -0.5228744745254517, -0.4731980264186859, -0.42352157831192017, -0.3738451600074768, -0.32416874170303345, -0.2744922935962677, -0.22481584548950195, -0.1751394271850586, -0.12546299397945404, -0.07578656077384949, -0.026110127568244934, 0.02356630563735962, 0.07324273884296417, 0.12291917204856873, 0.17259562015533447, 0.22227215766906738, 0.27194857597351074, 0.3216250240802765, 0.37130147218704224, 0.4209778904914856, 0.47065430879592896, 0.5203307867050171, 0.5700072050094604, 0.6196836233139038, 0.6693600416183472, 0.7190364599227905, 0.7687129378318787, 0.818389356136322, 0.8680657744407654, 0.9177422523498535, 0.9674186706542969, 1.0170950889587402, 1.0667715072631836, 1.116447925567627, 1.1661243438720703, 1.2158007621765137, 1.2654772996902466, 1.31515371799469, 1.3648301362991333, 1.4145065546035767, 1.46418297290802, 1.5138593912124634, 1.5635358095169067, 1.6132123470306396, 1.662888765335083, 1.7125651836395264, 1.7622416019439697, 1.811918020248413]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 9.0, 13.0, 11.0, 23.0, 22.0, 23.0, 33.0, 28.0, 34.0, 35.0, 42.0, 52.0, 62.0, 57.0, 58.0, 56.0, 47.0, 67.0, 42.0, 45.0, 36.0, 40.0, 25.0, 27.0, 24.0, 15.0, 19.0, 10.0, 6.0, 11.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2569037675857544, -1.2227094173431396, -1.1885151863098145, -1.1543208360671997, -1.1201266050338745, -1.0859322547912598, -1.0517380237579346, -1.0175436735153198, -0.9833493232727051, -0.9491550326347351, -0.9149607419967651, -0.8807663917541504, -0.8465721011161804, -0.8123778104782104, -0.7781835198402405, -0.7439892292022705, -0.7097949385643005, -0.6756006479263306, -0.6414063572883606, -0.6072120666503906, -0.5730177164077759, -0.5388234257698059, -0.5046291351318359, -0.47043484449386597, -0.4362405240535736, -0.40204623341560364, -0.3678519129753113, -0.3336576223373413, -0.29946333169937134, -0.265269011259079, -0.231074720621109, -0.19688041508197784, -0.16268610954284668, -0.12849180400371552, -0.09429750591516495, -0.06010320782661438, -0.025908902287483215, 0.00828540325164795, 0.04247969388961792, 0.07667399942874908, 0.11086830496788025, 0.1450626105070114, 0.17925691604614258, 0.21345120668411255, 0.2476455122232437, 0.2818398177623749, 0.31603410840034485, 0.3502284288406372, 0.3844227194786072, 0.41861701011657715, 0.4528113305568695, 0.4870056211948395, 0.5211999416351318, 0.5553942322731018, 0.5895885229110718, 0.6237828135490417, 0.6579771041870117, 0.6921713948249817, 0.7263656854629517, 0.7605600357055664, 0.7947543263435364, 0.8289486169815063, 0.8631429076194763, 0.8973371982574463, 0.931531548500061]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 14.0, 10.0, 6.0, 16.0, 23.0, 54.0, 80.0, 160.0, 251.0, 519.0, 1041.0, 2281.0, 5502.0, 15474.0, 49513.0, 170781.0, 394545.0, 279423.0, 87826.0, 25785.0, 9030.0, 3281.0, 1387.0, 695.0, 366.0, 188.0, 113.0, 64.0, 36.0, 36.0, 15.0, 10.0, 12.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.236328125, -0.2286376953125, -0.220947265625, -0.2132568359375, -0.20556640625, -0.1978759765625, -0.190185546875, -0.1824951171875, -0.1748046875, -0.1671142578125, -0.159423828125, -0.1517333984375, -0.14404296875, -0.1363525390625, -0.128662109375, -0.1209716796875, -0.11328125, -0.1055908203125, -0.097900390625, -0.0902099609375, -0.08251953125, -0.0748291015625, -0.067138671875, -0.0594482421875, -0.0517578125, -0.0440673828125, -0.036376953125, -0.0286865234375, -0.02099609375, -0.0133056640625, -0.005615234375, 0.0020751953125, 0.009765625, 0.0174560546875, 0.025146484375, 0.0328369140625, 0.04052734375, 0.0482177734375, 0.055908203125, 0.0635986328125, 0.0712890625, 0.0789794921875, 0.086669921875, 0.0943603515625, 0.10205078125, 0.1097412109375, 0.117431640625, 0.1251220703125, 0.1328125, 0.1405029296875, 0.148193359375, 0.1558837890625, 0.16357421875, 0.1712646484375, 0.178955078125, 0.1866455078125, 0.1943359375, 0.2020263671875, 0.209716796875, 0.2174072265625, 0.22509765625, 0.2327880859375, 0.240478515625, 0.2481689453125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 5.0, 11.0, 13.0, 18.0, 14.0, 21.0, 34.0, 37.0, 34.0, 32.0, 34.0, 52.0, 60.0, 77.0, 50.0, 55.0, 64.0, 59.0, 49.0, 38.0, 44.0, 38.0, 24.0, 33.0, 17.0, 13.0, 11.0, 11.0, 16.0, 10.0, 6.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76806640625, -0.7440185546875, -0.719970703125, -0.6959228515625, -0.671875, -0.6478271484375, -0.623779296875, -0.5997314453125, -0.57568359375, -0.5516357421875, -0.527587890625, -0.5035400390625, -0.4794921875, -0.4554443359375, -0.431396484375, -0.4073486328125, -0.38330078125, -0.3592529296875, -0.335205078125, -0.3111572265625, -0.287109375, -0.2630615234375, -0.239013671875, -0.2149658203125, -0.19091796875, -0.1668701171875, -0.142822265625, -0.1187744140625, -0.0947265625, -0.0706787109375, -0.046630859375, -0.0225830078125, 0.00146484375, 0.0255126953125, 0.049560546875, 0.0736083984375, 0.09765625, 0.1217041015625, 0.145751953125, 0.1697998046875, 0.19384765625, 0.2178955078125, 0.241943359375, 0.2659912109375, 0.2900390625, 0.3140869140625, 0.338134765625, 0.3621826171875, 0.38623046875, 0.4102783203125, 0.434326171875, 0.4583740234375, 0.482421875, 0.5064697265625, 0.530517578125, 0.5545654296875, 0.57861328125, 0.6026611328125, 0.626708984375, 0.6507568359375, 0.6748046875, 0.6988525390625, 0.722900390625, 0.7469482421875, 0.77099609375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 11.0, 14.0, 9.0, 13.0, 20.0, 21.0, 36.0, 52.0, 81.0, 118.0, 190.0, 323.0, 636.0, 1266.0, 2840.0, 6256.0, 15529.0, 42218.0, 126699.0, 313615.0, 325125.0, 138070.0, 46111.0, 16692.0, 6731.0, 2896.0, 1373.0, 694.0, 405.0, 183.0, 105.0, 65.0, 49.0, 29.0, 24.0, 22.0, 10.0, 11.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.20778274536132812, -0.20108795166015625, -0.19439315795898438, -0.1876983642578125, -0.18100357055664062, -0.17430877685546875, -0.16761398315429688, -0.160919189453125, -0.15422439575195312, -0.14752960205078125, -0.14083480834960938, -0.1341400146484375, -0.12744522094726562, -0.12075042724609375, -0.11405563354492188, -0.10736083984375, -0.10066604614257812, -0.09397125244140625, -0.08727645874023438, -0.0805816650390625, -0.07388687133789062, -0.06719207763671875, -0.060497283935546875, -0.053802490234375, -0.047107696533203125, -0.04041290283203125, -0.033718109130859375, -0.0270233154296875, -0.020328521728515625, -0.01363372802734375, -0.006938934326171875, -0.000244140625, 0.006450653076171875, 0.01314544677734375, 0.019840240478515625, 0.0265350341796875, 0.033229827880859375, 0.03992462158203125, 0.046619415283203125, 0.053314208984375, 0.060009002685546875, 0.06670379638671875, 0.07339859008789062, 0.0800933837890625, 0.08678817749023438, 0.09348297119140625, 0.10017776489257812, 0.10687255859375, 0.11356735229492188, 0.12026214599609375, 0.12695693969726562, 0.1336517333984375, 0.14034652709960938, 0.14704132080078125, 0.15373611450195312, 0.160430908203125, 0.16712570190429688, 0.17382049560546875, 0.18051528930664062, 0.1872100830078125, 0.19390487670898438, 0.20059967041015625, 0.20729446411132812, 0.2139892578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 9.0, 16.0, 21.0, 19.0, 22.0, 19.0, 41.0, 32.0, 37.0, 42.0, 48.0, 43.0, 57.0, 44.0, 48.0, 45.0, 46.0, 49.0, 43.0, 25.0, 29.0, 41.0, 33.0, 34.0, 27.0, 18.0, 14.0, 14.0, 10.0, 5.0, 9.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.302734375, -1.2593841552734375, -1.216033935546875, -1.1726837158203125, -1.12933349609375, -1.0859832763671875, -1.042633056640625, -0.9992828369140625, -0.9559326171875, -0.9125823974609375, -0.869232177734375, -0.8258819580078125, -0.78253173828125, -0.7391815185546875, -0.695831298828125, -0.6524810791015625, -0.609130859375, -0.5657806396484375, -0.522430419921875, -0.4790802001953125, -0.43572998046875, -0.3923797607421875, -0.349029541015625, -0.3056793212890625, -0.2623291015625, -0.2189788818359375, -0.175628662109375, -0.1322784423828125, -0.08892822265625, -0.0455780029296875, -0.002227783203125, 0.0411224365234375, 0.08447265625, 0.1278228759765625, 0.171173095703125, 0.2145233154296875, 0.25787353515625, 0.3012237548828125, 0.344573974609375, 0.3879241943359375, 0.4312744140625, 0.4746246337890625, 0.517974853515625, 0.5613250732421875, 0.60467529296875, 0.6480255126953125, 0.691375732421875, 0.7347259521484375, 0.778076171875, 0.8214263916015625, 0.864776611328125, 0.9081268310546875, 0.95147705078125, 0.9948272705078125, 1.038177490234375, 1.0815277099609375, 1.1248779296875, 1.1682281494140625, 1.211578369140625, 1.2549285888671875, 1.29827880859375, 1.3416290283203125, 1.384979248046875, 1.4283294677734375, 1.4716796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 20.0, 33.0, 39.0, 54.0, 94.0, 182.0, 298.0, 541.0, 1135.0, 2550.0, 7247.0, 24535.0, 104917.0, 420557.0, 368117.0, 86422.0, 21016.0, 6370.0, 2289.0, 963.0, 498.0, 257.0, 134.0, 96.0, 59.0, 34.0, 27.0, 20.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10300827026367188, -0.10005950927734375, -0.09711074829101562, -0.0941619873046875, -0.09121322631835938, -0.08826446533203125, -0.08531570434570312, -0.082366943359375, -0.07941818237304688, -0.07646942138671875, -0.07352066040039062, -0.0705718994140625, -0.06762313842773438, -0.06467437744140625, -0.061725616455078125, -0.05877685546875, -0.055828094482421875, -0.05287933349609375, -0.049930572509765625, -0.0469818115234375, -0.044033050537109375, -0.04108428955078125, -0.038135528564453125, -0.035186767578125, -0.032238006591796875, -0.02928924560546875, -0.026340484619140625, -0.0233917236328125, -0.020442962646484375, -0.01749420166015625, -0.014545440673828125, -0.0115966796875, -0.008647918701171875, -0.00569915771484375, -0.002750396728515625, 0.0001983642578125, 0.003147125244140625, 0.00609588623046875, 0.009044647216796875, 0.011993408203125, 0.014942169189453125, 0.01789093017578125, 0.020839691162109375, 0.0237884521484375, 0.026737213134765625, 0.02968597412109375, 0.032634735107421875, 0.03558349609375, 0.038532257080078125, 0.04148101806640625, 0.044429779052734375, 0.0473785400390625, 0.050327301025390625, 0.05327606201171875, 0.056224822998046875, 0.059173583984375, 0.062122344970703125, 0.06507110595703125, 0.06801986694335938, 0.0709686279296875, 0.07391738891601562, 0.07686614990234375, 0.07981491088867188, 0.082763671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 7.0, 12.0, 10.0, 10.0, 24.0, 36.0, 39.0, 52.0, 73.0, 79.0, 97.0, 108.0, 86.0, 71.0, 65.0, 42.0, 51.0, 37.0, 32.0, 15.0, 20.0, 9.0, 7.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.546476364135742e-05, -3.407523036003113e-05, -3.2685697078704834e-05, -3.129616379737854e-05, -2.9906630516052246e-05, -2.8517097234725952e-05, -2.7127563953399658e-05, -2.5738030672073364e-05, -2.434849739074707e-05, -2.2958964109420776e-05, -2.1569430828094482e-05, -2.017989754676819e-05, -1.8790364265441895e-05, -1.74008309841156e-05, -1.6011297702789307e-05, -1.4621764421463013e-05, -1.3232231140136719e-05, -1.1842697858810425e-05, -1.0453164577484131e-05, -9.063631296157837e-06, -7.674098014831543e-06, -6.284564733505249e-06, -4.895031452178955e-06, -3.505498170852661e-06, -2.115964889526367e-06, -7.264316082000732e-07, 6.631016731262207e-07, 2.0526349544525146e-06, 3.4421682357788086e-06, 4.8317015171051025e-06, 6.2212347984313965e-06, 7.6107680797576904e-06, 9.000301361083984e-06, 1.0389834642410278e-05, 1.1779367923736572e-05, 1.3168901205062866e-05, 1.455843448638916e-05, 1.5947967767715454e-05, 1.7337501049041748e-05, 1.8727034330368042e-05, 2.0116567611694336e-05, 2.150610089302063e-05, 2.2895634174346924e-05, 2.4285167455673218e-05, 2.5674700736999512e-05, 2.7064234018325806e-05, 2.84537672996521e-05, 2.9843300580978394e-05, 3.123283386230469e-05, 3.262236714363098e-05, 3.4011900424957275e-05, 3.540143370628357e-05, 3.679096698760986e-05, 3.818050026893616e-05, 3.957003355026245e-05, 4.0959566831588745e-05, 4.234910011291504e-05, 4.373863339424133e-05, 4.512816667556763e-05, 4.651769995689392e-05, 4.7907233238220215e-05, 4.929676651954651e-05, 5.06862998008728e-05, 5.20758330821991e-05, 5.346536636352539e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 11.0, 19.0, 26.0, 24.0, 45.0, 75.0, 128.0, 156.0, 239.0, 460.0, 903.0, 2044.0, 5875.0, 19380.0, 82176.0, 391380.0, 422554.0, 91531.0, 20985.0, 6017.0, 2177.0, 1001.0, 505.0, 292.0, 179.0, 103.0, 66.0, 53.0, 42.0, 27.0, 21.0, 6.0, 13.0, 3.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1243896484375, -0.12103080749511719, -0.11767196655273438, -0.11431312561035156, -0.11095428466796875, -0.10759544372558594, -0.10423660278320312, -0.10087776184082031, -0.0975189208984375, -0.09416007995605469, -0.09080123901367188, -0.08744239807128906, -0.08408355712890625, -0.08072471618652344, -0.07736587524414062, -0.07400703430175781, -0.070648193359375, -0.06728935241699219, -0.06393051147460938, -0.06057167053222656, -0.05721282958984375, -0.05385398864746094, -0.050495147705078125, -0.04713630676269531, -0.0437774658203125, -0.04041862487792969, -0.037059783935546875, -0.03370094299316406, -0.03034210205078125, -0.026983261108398438, -0.023624420166015625, -0.020265579223632812, -0.01690673828125, -0.013547897338867188, -0.010189056396484375, -0.0068302154541015625, -0.00347137451171875, -0.0001125335693359375, 0.003246307373046875, 0.0066051483154296875, 0.0099639892578125, 0.013322830200195312, 0.016681671142578125, 0.020040512084960938, 0.02339935302734375, 0.026758193969726562, 0.030117034912109375, 0.03347587585449219, 0.036834716796875, 0.04019355773925781, 0.043552398681640625, 0.04691123962402344, 0.05027008056640625, 0.05362892150878906, 0.056987762451171875, 0.06034660339355469, 0.0637054443359375, 0.06706428527832031, 0.07042312622070312, 0.07378196716308594, 0.07714080810546875, 0.08049964904785156, 0.08385848999023438, 0.08721733093261719, 0.090576171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 10.0, 4.0, 5.0, 6.0, 10.0, 15.0, 12.0, 12.0, 22.0, 32.0, 28.0, 44.0, 38.0, 53.0, 67.0, 67.0, 72.0, 77.0, 66.0, 64.0, 50.0, 40.0, 56.0, 27.0, 30.0, 27.0, 19.0, 16.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018829345703125, -0.01801776885986328, -0.017206192016601562, -0.016394615173339844, -0.015583038330078125, -0.014771461486816406, -0.013959884643554688, -0.013148307800292969, -0.01233673095703125, -0.011525154113769531, -0.010713577270507812, -0.009902000427246094, -0.009090423583984375, -0.008278846740722656, -0.0074672698974609375, -0.006655693054199219, -0.0058441162109375, -0.005032539367675781, -0.0042209625244140625, -0.0034093856811523438, -0.002597808837890625, -0.0017862319946289062, -0.0009746551513671875, -0.00016307830810546875, 0.00064849853515625, 0.0014600753784179688, 0.0022716522216796875, 0.0030832290649414062, 0.003894805908203125, 0.004706382751464844, 0.0055179595947265625, 0.006329536437988281, 0.00714111328125, 0.007952690124511719, 0.008764266967773438, 0.009575843811035156, 0.010387420654296875, 0.011198997497558594, 0.012010574340820312, 0.012822151184082031, 0.01363372802734375, 0.014445304870605469, 0.015256881713867188, 0.016068458557128906, 0.016880035400390625, 0.017691612243652344, 0.018503189086914062, 0.01931476593017578, 0.0201263427734375, 0.02093791961669922, 0.021749496459960938, 0.022561073303222656, 0.023372650146484375, 0.024184226989746094, 0.024995803833007812, 0.02580738067626953, 0.02661895751953125, 0.02743053436279297, 0.028242111206054688, 0.029053688049316406, 0.029865264892578125, 0.030676841735839844, 0.03148841857910156, 0.03229999542236328, 0.033111572265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 14.0, 23.0, 35.0, 67.0, 105.0, 141.0, 155.0, 143.0, 114.0, 76.0, 50.0, 36.0, 16.0, 5.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1169722080230713, -1.0674782991409302, -1.017984390258789, -0.9684904217720032, -0.9189965128898621, -0.8695025444030762, -0.8200086355209351, -0.770514726638794, -0.7210208177566528, -0.6715269088745117, -0.6220329403877258, -0.5725390315055847, -0.5230451226234436, -0.4735511839389801, -0.4240572452545166, -0.3745633363723755, -0.3250693678855896, -0.2755754292011261, -0.22608152031898499, -0.17658758163452148, -0.12709365785121918, -0.07759973406791687, -0.02810579538345337, 0.021388113498687744, 0.07088205218315125, 0.12037597596645355, 0.16986989974975586, 0.21936383843421936, 0.26885777711868286, 0.318351686000824, 0.3678456246852875, 0.4173395335674286, 0.4668334722518921, 0.5163273811340332, 0.5658213496208191, 0.6153152585029602, 0.6648091673851013, 0.7143031358718872, 0.7637970447540283, 0.8132909536361694, 0.8627848625183105, 0.9122787714004517, 0.9617727398872375, 1.0112667083740234, 1.0607606172561646, 1.1102545261383057, 1.1597484350204468, 1.209242343902588, 1.2587363719940186, 1.3082302808761597, 1.3577241897583008, 1.4072182178497314, 1.4567121267318726, 1.5062060356140137, 1.5556999444961548, 1.605193853378296, 1.654687762260437, 1.7041816711425781, 1.7536755800247192, 1.8031694889068604, 1.852663516998291, 1.9021574258804321, 1.9516513347625732, 2.001145362854004, 2.0506391525268555]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 7.0, 15.0, 22.0, 23.0, 30.0, 32.0, 38.0, 30.0, 34.0, 65.0, 72.0, 58.0, 65.0, 68.0, 61.0, 70.0, 44.0, 47.0, 44.0, 31.0, 29.0, 22.0, 18.0, 20.0, 10.0, 8.0, 11.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8638395071029663, -0.8384256958961487, -0.813011884689331, -0.7875980734825134, -0.7621842622756958, -0.7367704510688782, -0.7113566398620605, -0.6859428286552429, -0.6605290174484253, -0.6351152062416077, -0.60970139503479, -0.5842875838279724, -0.5588737726211548, -0.5334599614143372, -0.5080461502075195, -0.4826323390007019, -0.4572184979915619, -0.43180468678474426, -0.40639087557792664, -0.380977064371109, -0.3555632531642914, -0.33014941215515137, -0.30473560094833374, -0.2793217897415161, -0.2539079785346985, -0.22849416732788086, -0.20308035612106323, -0.1776665449142456, -0.15225273370742798, -0.12683890759944916, -0.10142509639263153, -0.0760112851858139, -0.05059748888015747, -0.025183675810694695, 0.00023013725876808167, 0.025643952190876007, 0.051057763397693634, 0.07647158205509186, 0.10188539326190948, 0.1272992044687271, 0.15271301567554474, 0.17812682688236237, 0.20354063808918, 0.2289544641971588, 0.25436827540397644, 0.27978208661079407, 0.3051958978176117, 0.3306097090244293, 0.35602352023124695, 0.3814373314380646, 0.4068511426448822, 0.43226495385169983, 0.45767876505851746, 0.48309260606765747, 0.5085064172744751, 0.5339202284812927, 0.5593340396881104, 0.584747850894928, 0.6101616621017456, 0.6355754733085632, 0.6609892845153809, 0.6864030957221985, 0.7118169069290161, 0.7372307181358337, 0.7626445293426514]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 4.0, 5.0, 13.0, 17.0, 28.0, 46.0, 78.0, 128.0, 237.0, 383.0, 658.0, 1343.0, 2642.0, 5331.0, 12271.0, 30684.0, 94886.0, 380810.0, 373110.0, 92355.0, 30652.0, 12000.0, 5400.0, 2553.0, 1289.0, 683.0, 380.0, 211.0, 132.0, 92.0, 48.0, 31.0, 19.0, 11.0, 4.0, 10.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.5927734375, -0.5748062133789062, -0.5568389892578125, -0.5388717651367188, -0.520904541015625, -0.5029373168945312, -0.4849700927734375, -0.46700286865234375, -0.44903564453125, -0.43106842041015625, -0.4131011962890625, -0.39513397216796875, -0.377166748046875, -0.35919952392578125, -0.3412322998046875, -0.32326507568359375, -0.3052978515625, -0.28733062744140625, -0.2693634033203125, -0.25139617919921875, -0.233428955078125, -0.21546173095703125, -0.1974945068359375, -0.17952728271484375, -0.16156005859375, -0.14359283447265625, -0.1256256103515625, -0.10765838623046875, -0.089691162109375, -0.07172393798828125, -0.0537567138671875, -0.03578948974609375, -0.017822265625, 0.00014495849609375, 0.0181121826171875, 0.03607940673828125, 0.054046630859375, 0.07201385498046875, 0.0899810791015625, 0.10794830322265625, 0.12591552734375, 0.14388275146484375, 0.1618499755859375, 0.17981719970703125, 0.197784423828125, 0.21575164794921875, 0.2337188720703125, 0.25168609619140625, 0.2696533203125, 0.28762054443359375, 0.3055877685546875, 0.32355499267578125, 0.341522216796875, 0.35948944091796875, 0.3774566650390625, 0.39542388916015625, 0.41339111328125, 0.43135833740234375, 0.4493255615234375, 0.46729278564453125, 0.485260009765625, 0.5032272338867188, 0.5211944580078125, 0.5391616821289062, 0.55712890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 11.0, 12.0, 25.0, 25.0, 32.0, 35.0, 41.0, 41.0, 59.0, 63.0, 64.0, 81.0, 76.0, 62.0, 69.0, 37.0, 59.0, 40.0, 31.0, 26.0, 22.0, 18.0, 14.0, 10.0, 15.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8349609375, -1.7808380126953125, -1.726715087890625, -1.6725921630859375, -1.61846923828125, -1.5643463134765625, -1.510223388671875, -1.4561004638671875, -1.4019775390625, -1.3478546142578125, -1.293731689453125, -1.2396087646484375, -1.18548583984375, -1.1313629150390625, -1.077239990234375, -1.0231170654296875, -0.968994140625, -0.9148712158203125, -0.860748291015625, -0.8066253662109375, -0.75250244140625, -0.6983795166015625, -0.644256591796875, -0.5901336669921875, -0.5360107421875, -0.4818878173828125, -0.427764892578125, -0.3736419677734375, -0.31951904296875, -0.2653961181640625, -0.211273193359375, -0.1571502685546875, -0.10302734375, -0.0489044189453125, 0.005218505859375, 0.0593414306640625, 0.11346435546875, 0.1675872802734375, 0.221710205078125, 0.2758331298828125, 0.3299560546875, 0.3840789794921875, 0.438201904296875, 0.4923248291015625, 0.54644775390625, 0.6005706787109375, 0.654693603515625, 0.7088165283203125, 0.762939453125, 0.8170623779296875, 0.871185302734375, 0.9253082275390625, 0.97943115234375, 1.0335540771484375, 1.087677001953125, 1.1417999267578125, 1.1959228515625, 1.2500457763671875, 1.304168701171875, 1.3582916259765625, 1.41241455078125, 1.4665374755859375, 1.520660400390625, 1.5747833251953125, 1.62890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 11.0, 10.0, 13.0, 30.0, 49.0, 60.0, 107.0, 148.0, 335.0, 776.0, 3796.0, 51917.0, 889265.0, 94662.0, 5470.0, 969.0, 354.0, 195.0, 114.0, 68.0, 44.0, 34.0, 30.0, 21.0, 12.0, 16.0, 2.0, 7.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8388671875, -1.782440185546875, -1.72601318359375, -1.669586181640625, -1.6131591796875, -1.556732177734375, -1.50030517578125, -1.443878173828125, -1.387451171875, -1.331024169921875, -1.27459716796875, -1.218170166015625, -1.1617431640625, -1.105316162109375, -1.04888916015625, -0.992462158203125, -0.93603515625, -0.879608154296875, -0.82318115234375, -0.766754150390625, -0.7103271484375, -0.653900146484375, -0.59747314453125, -0.541046142578125, -0.484619140625, -0.428192138671875, -0.37176513671875, -0.315338134765625, -0.2589111328125, -0.202484130859375, -0.14605712890625, -0.089630126953125, -0.033203125, 0.023223876953125, 0.07965087890625, 0.136077880859375, 0.1925048828125, 0.248931884765625, 0.30535888671875, 0.361785888671875, 0.418212890625, 0.474639892578125, 0.53106689453125, 0.587493896484375, 0.6439208984375, 0.700347900390625, 0.75677490234375, 0.813201904296875, 0.86962890625, 0.926055908203125, 0.98248291015625, 1.038909912109375, 1.0953369140625, 1.151763916015625, 1.20819091796875, 1.264617919921875, 1.321044921875, 1.377471923828125, 1.43389892578125, 1.490325927734375, 1.5467529296875, 1.603179931640625, 1.65960693359375, 1.716033935546875, 1.7724609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 10.0, 9.0, 13.0, 16.0, 25.0, 25.0, 33.0, 37.0, 56.0, 59.0, 54.0, 71.0, 78.0, 80.0, 71.0, 84.0, 58.0, 48.0, 30.0, 32.0, 31.0, 22.0, 20.0, 11.0, 10.0, 9.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.218658447265625, -2.14239501953125, -2.066131591796875, -1.9898681640625, -1.913604736328125, -1.83734130859375, -1.761077880859375, -1.684814453125, -1.608551025390625, -1.53228759765625, -1.456024169921875, -1.3797607421875, -1.303497314453125, -1.22723388671875, -1.150970458984375, -1.07470703125, -0.998443603515625, -0.92218017578125, -0.845916748046875, -0.7696533203125, -0.693389892578125, -0.61712646484375, -0.540863037109375, -0.464599609375, -0.388336181640625, -0.31207275390625, -0.235809326171875, -0.1595458984375, -0.083282470703125, -0.00701904296875, 0.069244384765625, 0.1455078125, 0.221771240234375, 0.29803466796875, 0.374298095703125, 0.4505615234375, 0.526824951171875, 0.60308837890625, 0.679351806640625, 0.755615234375, 0.831878662109375, 0.90814208984375, 0.984405517578125, 1.0606689453125, 1.136932373046875, 1.21319580078125, 1.289459228515625, 1.36572265625, 1.441986083984375, 1.51824951171875, 1.594512939453125, 1.6707763671875, 1.747039794921875, 1.82330322265625, 1.899566650390625, 1.975830078125, 2.052093505859375, 2.12835693359375, 2.204620361328125, 2.2808837890625, 2.357147216796875, 2.43341064453125, 2.509674072265625, 2.5859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 5.0, 15.0, 22.0, 35.0, 52.0, 74.0, 139.0, 302.0, 845.0, 4093.0, 62433.0, 915355.0, 59648.0, 3937.0, 857.0, 307.0, 156.0, 84.0, 58.0, 39.0, 23.0, 13.0, 12.0, 10.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6729354858398438, -0.6539764404296875, -0.6350173950195312, -0.616058349609375, -0.5970993041992188, -0.5781402587890625, -0.5591812133789062, -0.54022216796875, -0.5212631225585938, -0.5023040771484375, -0.48334503173828125, -0.464385986328125, -0.44542694091796875, -0.4264678955078125, -0.40750885009765625, -0.3885498046875, -0.36959075927734375, -0.3506317138671875, -0.33167266845703125, -0.312713623046875, -0.29375457763671875, -0.2747955322265625, -0.25583648681640625, -0.23687744140625, -0.21791839599609375, -0.1989593505859375, -0.18000030517578125, -0.161041259765625, -0.14208221435546875, -0.1231231689453125, -0.10416412353515625, -0.085205078125, -0.06624603271484375, -0.0472869873046875, -0.02832794189453125, -0.009368896484375, 0.00959014892578125, 0.0285491943359375, 0.04750823974609375, 0.06646728515625, 0.08542633056640625, 0.1043853759765625, 0.12334442138671875, 0.142303466796875, 0.16126251220703125, 0.1802215576171875, 0.19918060302734375, 0.2181396484375, 0.23709869384765625, 0.2560577392578125, 0.27501678466796875, 0.293975830078125, 0.31293487548828125, 0.3318939208984375, 0.35085296630859375, 0.36981201171875, 0.38877105712890625, 0.4077301025390625, 0.42668914794921875, 0.445648193359375, 0.46460723876953125, 0.4835662841796875, 0.5025253295898438, 0.521484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 9.0, 9.0, 18.0, 52.0, 112.0, 204.0, 255.0, 181.0, 85.0, 47.0, 17.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001506805419921875, -0.00014729052782058716, -0.00014390051364898682, -0.00014051049947738647, -0.00013712048530578613, -0.0001337304711341858, -0.00013034045696258545, -0.0001269504427909851, -0.00012356042861938477, -0.00012017041444778442, -0.00011678040027618408, -0.00011339038610458374, -0.0001100003719329834, -0.00010661035776138306, -0.00010322034358978271, -9.983032941818237e-05, -9.644031524658203e-05, -9.305030107498169e-05, -8.966028690338135e-05, -8.6270272731781e-05, -8.288025856018066e-05, -7.949024438858032e-05, -7.610023021697998e-05, -7.271021604537964e-05, -6.93202018737793e-05, -6.593018770217896e-05, -6.254017353057861e-05, -5.915015935897827e-05, -5.576014518737793e-05, -5.237013101577759e-05, -4.8980116844177246e-05, -4.5590102672576904e-05, -4.220008850097656e-05, -3.881007432937622e-05, -3.542006015777588e-05, -3.203004598617554e-05, -2.8640031814575195e-05, -2.5250017642974854e-05, -2.1860003471374512e-05, -1.846998929977417e-05, -1.5079975128173828e-05, -1.1689960956573486e-05, -8.299946784973145e-06, -4.909932613372803e-06, -1.519918441772461e-06, 1.8700957298278809e-06, 5.260109901428223e-06, 8.650124073028564e-06, 1.2040138244628906e-05, 1.5430152416229248e-05, 1.882016658782959e-05, 2.221018075942993e-05, 2.5600194931030273e-05, 2.8990209102630615e-05, 3.238022327423096e-05, 3.57702374458313e-05, 3.916025161743164e-05, 4.255026578903198e-05, 4.5940279960632324e-05, 4.9330294132232666e-05, 5.272030830383301e-05, 5.611032247543335e-05, 5.950033664703369e-05, 6.289035081863403e-05, 6.628036499023438e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 11.0, 13.0, 23.0, 40.0, 57.0, 135.0, 323.0, 814.0, 2694.0, 24975.0, 912430.0, 99788.0, 5136.0, 1197.0, 441.0, 211.0, 96.0, 57.0, 36.0, 19.0, 10.0, 9.0, 6.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.78515625, -0.7611312866210938, -0.7371063232421875, -0.7130813598632812, -0.689056396484375, -0.6650314331054688, -0.6410064697265625, -0.6169815063476562, -0.59295654296875, -0.5689315795898438, -0.5449066162109375, -0.5208816528320312, -0.496856689453125, -0.47283172607421875, -0.4488067626953125, -0.42478179931640625, -0.4007568359375, -0.37673187255859375, -0.3527069091796875, -0.32868194580078125, -0.304656982421875, -0.28063201904296875, -0.2566070556640625, -0.23258209228515625, -0.20855712890625, -0.18453216552734375, -0.1605072021484375, -0.13648223876953125, -0.112457275390625, -0.08843231201171875, -0.0644073486328125, -0.04038238525390625, -0.016357421875, 0.00766754150390625, 0.0316925048828125, 0.05571746826171875, 0.079742431640625, 0.10376739501953125, 0.1277923583984375, 0.15181732177734375, 0.17584228515625, 0.19986724853515625, 0.2238922119140625, 0.24791717529296875, 0.271942138671875, 0.29596710205078125, 0.3199920654296875, 0.34401702880859375, 0.3680419921875, 0.39206695556640625, 0.4160919189453125, 0.44011688232421875, 0.464141845703125, 0.48816680908203125, 0.5121917724609375, 0.5362167358398438, 0.56024169921875, 0.5842666625976562, 0.6082916259765625, 0.6323165893554688, 0.656341552734375, 0.6803665161132812, 0.7043914794921875, 0.7284164428710938, 0.75244140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 7.0, 13.0, 18.0, 31.0, 31.0, 40.0, 69.0, 114.0, 140.0, 168.0, 117.0, 92.0, 62.0, 28.0, 17.0, 13.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2391357421875, -0.23250198364257812, -0.22586822509765625, -0.21923446655273438, -0.2126007080078125, -0.20596694946289062, -0.19933319091796875, -0.19269943237304688, -0.186065673828125, -0.17943191528320312, -0.17279815673828125, -0.16616439819335938, -0.1595306396484375, -0.15289688110351562, -0.14626312255859375, -0.13962936401367188, -0.13299560546875, -0.12636184692382812, -0.11972808837890625, -0.11309432983398438, -0.1064605712890625, -0.09982681274414062, -0.09319305419921875, -0.08655929565429688, -0.079925537109375, -0.07329177856445312, -0.06665802001953125, -0.060024261474609375, -0.0533905029296875, -0.046756744384765625, -0.04012298583984375, -0.033489227294921875, -0.02685546875, -0.020221710205078125, -0.01358795166015625, -0.006954193115234375, -0.0003204345703125, 0.006313323974609375, 0.01294708251953125, 0.019580841064453125, 0.026214599609375, 0.032848358154296875, 0.03948211669921875, 0.046115875244140625, 0.0527496337890625, 0.059383392333984375, 0.06601715087890625, 0.07265090942382812, 0.07928466796875, 0.08591842651367188, 0.09255218505859375, 0.09918594360351562, 0.1058197021484375, 0.11245346069335938, 0.11908721923828125, 0.12572097778320312, 0.132354736328125, 0.13898849487304688, 0.14562225341796875, 0.15225601196289062, 0.1588897705078125, 0.16552352905273438, 0.17215728759765625, 0.17879104614257812, 0.1854248046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 9.0, 15.0, 24.0, 24.0, 37.0, 66.0, 109.0, 106.0, 130.0, 119.0, 96.0, 84.0, 63.0, 44.0, 25.0, 21.0, 10.0, 9.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7931145429611206, -1.7143815755844116, -1.635648488998413, -1.556915521621704, -1.4781825542449951, -1.3994494676589966, -1.3207165002822876, -1.241983413696289, -1.16325044631958, -1.084517478942871, -1.0057843923568726, -0.9270514249801636, -0.8483183979988098, -0.769585371017456, -0.6908524036407471, -0.6121193766593933, -0.5333863496780396, -0.4546533226966858, -0.3759203255176544, -0.29718732833862305, -0.2184543013572693, -0.13972127437591553, -0.060988277196884155, 0.017744719982147217, 0.09647774696350098, 0.17521075904369354, 0.2539437711238861, 0.3326767683029175, 0.41140979528427124, 0.490142822265625, 0.568875789642334, 0.6476088166236877, 0.726341724395752, 0.8050747513771057, 0.8838077783584595, 0.9625407457351685, 1.041273832321167, 1.120006799697876, 1.198739767074585, 1.277472734451294, 1.3562058210372925, 1.4349387884140015, 1.513671875, 1.592404842376709, 1.671137809753418, 1.7498708963394165, 1.8286038637161255, 1.907336950302124, 1.986069917678833, 2.064802885055542, 2.143535852432251, 2.222269058227539, 2.301002025604248, 2.379734992980957, 2.458467960357666, 2.537200927734375, 2.615933895111084, 2.694666862487793, 2.773399829864502, 2.85213303565979, 2.930866003036499, 3.009598970413208, 3.088331937789917, 3.167064905166626, 3.245798110961914]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 6.0, 9.0, 7.0, 8.0, 10.0, 17.0, 28.0, 30.0, 29.0, 34.0, 40.0, 53.0, 50.0, 80.0, 66.0, 69.0, 68.0, 67.0, 54.0, 56.0, 42.0, 39.0, 45.0, 40.0, 15.0, 10.0, 9.0, 10.0, 6.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8595168590545654, -2.7413735389709473, -2.623230457305908, -2.50508713722229, -2.386943817138672, -2.268800735473633, -2.1506574153900146, -2.0325140953063965, -1.9143708944320679, -1.7962276935577393, -1.678084373474121, -1.5599411725997925, -1.4417979717254639, -1.3236546516418457, -1.205511450767517, -1.0873682498931885, -0.9692249298095703, -0.8510816693305969, -0.7329384088516235, -0.6147952079772949, -0.49665194749832153, -0.37850868701934814, -0.26036548614501953, -0.14222222566604614, -0.024078965187072754, 0.09406428039073944, 0.21220752596855164, 0.33035075664520264, 0.448494017124176, 0.5666372776031494, 0.684780478477478, 0.8029237389564514, 0.9210672378540039, 1.0392104387283325, 1.1573537588119507, 1.2754969596862793, 1.3936402797698975, 1.511783480644226, 1.6299266815185547, 1.7480700016021729, 1.8662132024765015, 1.98435640335083, 2.1024997234344482, 2.2206430435180664, 2.3387861251831055, 2.4569294452667236, 2.575072765350342, 2.693215847015381, 2.811359167098999, 2.929502487182617, 3.0476455688476562, 3.1657888889312744, 3.2839322090148926, 3.4020752906799316, 3.52021861076355, 3.638361930847168, 3.756505012512207, 3.874648332595825, 3.9927914142608643, 4.110934734344482, 4.2290778160095215, 4.347221374511719, 4.465364456176758, 4.583507537841797, 4.701651096343994]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 11.0, 17.0, 28.0, 42.0, 77.0, 129.0, 238.0, 553.0, 1314.0, 4137.0, 17615.0, 177129.0, 2741867.0, 1178388.0, 59216.0, 9188.0, 2568.0, 899.0, 432.0, 197.0, 84.0, 61.0, 25.0, 17.0, 22.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9189453125, -1.860443115234375, -1.80194091796875, -1.743438720703125, -1.6849365234375, -1.626434326171875, -1.56793212890625, -1.509429931640625, -1.450927734375, -1.392425537109375, -1.33392333984375, -1.275421142578125, -1.2169189453125, -1.158416748046875, -1.09991455078125, -1.041412353515625, -0.98291015625, -0.924407958984375, -0.86590576171875, -0.807403564453125, -0.7489013671875, -0.690399169921875, -0.63189697265625, -0.573394775390625, -0.514892578125, -0.456390380859375, -0.39788818359375, -0.339385986328125, -0.2808837890625, -0.222381591796875, -0.16387939453125, -0.105377197265625, -0.046875, 0.011627197265625, 0.07012939453125, 0.128631591796875, 0.1871337890625, 0.245635986328125, 0.30413818359375, 0.362640380859375, 0.421142578125, 0.479644775390625, 0.53814697265625, 0.596649169921875, 0.6551513671875, 0.713653564453125, 0.77215576171875, 0.830657958984375, 0.88916015625, 0.947662353515625, 1.00616455078125, 1.064666748046875, 1.1231689453125, 1.181671142578125, 1.24017333984375, 1.298675537109375, 1.357177734375, 1.415679931640625, 1.47418212890625, 1.532684326171875, 1.5911865234375, 1.649688720703125, 1.70819091796875, 1.766693115234375, 1.8251953125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 7.0, 13.0, 19.0, 18.0, 23.0, 24.0, 32.0, 28.0, 37.0, 43.0, 48.0, 48.0, 48.0, 59.0, 55.0, 48.0, 64.0, 56.0, 39.0, 50.0, 42.0, 39.0, 21.0, 21.0, 23.0, 16.0, 10.0, 9.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9580078125, -0.9302902221679688, -0.9025726318359375, -0.8748550415039062, -0.847137451171875, -0.8194198608398438, -0.7917022705078125, -0.7639846801757812, -0.73626708984375, -0.7085494995117188, -0.6808319091796875, -0.6531143188476562, -0.625396728515625, -0.5976791381835938, -0.5699615478515625, -0.5422439575195312, -0.5145263671875, -0.48680877685546875, -0.4590911865234375, -0.43137359619140625, -0.403656005859375, -0.37593841552734375, -0.3482208251953125, -0.32050323486328125, -0.29278564453125, -0.26506805419921875, -0.2373504638671875, -0.20963287353515625, -0.181915283203125, -0.15419769287109375, -0.1264801025390625, -0.09876251220703125, -0.071044921875, -0.04332733154296875, -0.0156097412109375, 0.01210784912109375, 0.039825439453125, 0.06754302978515625, 0.0952606201171875, 0.12297821044921875, 0.15069580078125, 0.17841339111328125, 0.2061309814453125, 0.23384857177734375, 0.261566162109375, 0.28928375244140625, 0.3170013427734375, 0.34471893310546875, 0.3724365234375, 0.40015411376953125, 0.4278717041015625, 0.45558929443359375, 0.483306884765625, 0.5110244750976562, 0.5387420654296875, 0.5664596557617188, 0.59417724609375, 0.6218948364257812, 0.6496124267578125, 0.6773300170898438, 0.705047607421875, 0.7327651977539062, 0.7604827880859375, 0.7882003784179688, 0.81591796875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 7.0, 6.0, 9.0, 15.0, 31.0, 49.0, 79.0, 136.0, 340.0, 1042.0, 5395.0, 129046.0, 3983887.0, 68702.0, 4130.0, 862.0, 275.0, 121.0, 57.0, 29.0, 23.0, 15.0, 5.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.333984375, -3.231170654296875, -3.12835693359375, -3.025543212890625, -2.9227294921875, -2.819915771484375, -2.71710205078125, -2.614288330078125, -2.511474609375, -2.408660888671875, -2.30584716796875, -2.203033447265625, -2.1002197265625, -1.997406005859375, -1.89459228515625, -1.791778564453125, -1.68896484375, -1.586151123046875, -1.48333740234375, -1.380523681640625, -1.2777099609375, -1.174896240234375, -1.07208251953125, -0.969268798828125, -0.866455078125, -0.763641357421875, -0.66082763671875, -0.558013916015625, -0.4552001953125, -0.352386474609375, -0.24957275390625, -0.146759033203125, -0.0439453125, 0.058868408203125, 0.16168212890625, 0.264495849609375, 0.3673095703125, 0.470123291015625, 0.57293701171875, 0.675750732421875, 0.778564453125, 0.881378173828125, 0.98419189453125, 1.087005615234375, 1.1898193359375, 1.292633056640625, 1.39544677734375, 1.498260498046875, 1.60107421875, 1.703887939453125, 1.80670166015625, 1.909515380859375, 2.0123291015625, 2.115142822265625, 2.21795654296875, 2.320770263671875, 2.423583984375, 2.526397705078125, 2.62921142578125, 2.732025146484375, 2.8348388671875, 2.937652587890625, 3.04046630859375, 3.143280029296875, 3.24609375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 17.0, 20.0, 20.0, 44.0, 58.0, 103.0, 149.0, 269.0, 411.0, 634.0, 696.0, 576.0, 398.0, 198.0, 146.0, 96.0, 62.0, 51.0, 30.0, 20.0, 19.0, 8.0, 7.0, 10.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5234375, -0.5086479187011719, -0.49385833740234375, -0.4790687561035156, -0.4642791748046875, -0.4494895935058594, -0.43470001220703125, -0.4199104309082031, -0.405120849609375, -0.3903312683105469, -0.37554168701171875, -0.3607521057128906, -0.3459625244140625, -0.3311729431152344, -0.31638336181640625, -0.3015937805175781, -0.28680419921875, -0.2720146179199219, -0.25722503662109375, -0.24243545532226562, -0.2276458740234375, -0.21285629272460938, -0.19806671142578125, -0.18327713012695312, -0.168487548828125, -0.15369796752929688, -0.13890838623046875, -0.12411880493164062, -0.1093292236328125, -0.09453964233398438, -0.07975006103515625, -0.06496047973632812, -0.0501708984375, -0.035381317138671875, -0.02059173583984375, -0.005802154541015625, 0.0089874267578125, 0.023777008056640625, 0.03856658935546875, 0.053356170654296875, 0.068145751953125, 0.08293533325195312, 0.09772491455078125, 0.11251449584960938, 0.1273040771484375, 0.14209365844726562, 0.15688323974609375, 0.17167282104492188, 0.18646240234375, 0.20125198364257812, 0.21604156494140625, 0.23083114624023438, 0.2456207275390625, 0.2604103088378906, 0.27519989013671875, 0.2899894714355469, 0.304779052734375, 0.3195686340332031, 0.33435821533203125, 0.3491477966308594, 0.3639373779296875, 0.3787269592285156, 0.39351654052734375, 0.4083061218261719, 0.423095703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 24.0, 30.0, 52.0, 81.0, 88.0, 122.0, 129.0, 127.0, 102.0, 86.0, 56.0, 35.0, 24.0, 15.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.386441230773926, -2.3192806243896484, -2.252120018005371, -2.184959650039673, -2.1177990436553955, -2.050638437271118, -1.9834779500961304, -1.9163174629211426, -1.8491568565368652, -1.781996250152588, -1.7148357629776, -1.6476752758026123, -1.580514669418335, -1.5133540630340576, -1.4461935758590698, -1.379033088684082, -1.3118724822998047, -1.2447118759155273, -1.1775513887405396, -1.1103909015655518, -1.0432302951812744, -0.9760697484016418, -0.9089092016220093, -0.8417486548423767, -0.7745881080627441, -0.7074275612831116, -0.640267014503479, -0.5731064677238464, -0.5059459209442139, -0.4387853741645813, -0.37162482738494873, -0.30446428060531616, -0.23730361461639404, -0.17014306783676147, -0.1029825210571289, -0.03582197427749634, 0.03133857250213623, 0.0984991192817688, 0.16565966606140137, 0.23282021284103394, 0.2999807596206665, 0.3671413064002991, 0.43430185317993164, 0.5014623999595642, 0.5686229467391968, 0.6357834935188293, 0.7029440402984619, 0.7701045870780945, 0.837265133857727, 0.9044256806373596, 0.9715862274169922, 1.0387468338012695, 1.1059073209762573, 1.1730678081512451, 1.2402284145355225, 1.3073890209197998, 1.3745495080947876, 1.4417099952697754, 1.5088706016540527, 1.57603120803833, 1.6431916952133179, 1.7103521823883057, 1.777512788772583, 1.8446733951568604, 1.9118338823318481]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 4.0, 8.0, 5.0, 6.0, 8.0, 14.0, 12.0, 27.0, 24.0, 20.0, 29.0, 28.0, 40.0, 35.0, 55.0, 52.0, 43.0, 44.0, 45.0, 44.0, 47.0, 39.0, 41.0, 45.0, 36.0, 35.0, 29.0, 31.0, 24.0, 19.0, 17.0, 14.0, 17.0, 12.0, 9.0, 9.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8895167112350464, -0.8610020875930786, -0.8324874043464661, -0.8039727807044983, -0.7754580974578857, -0.746943473815918, -0.7184287905693054, -0.6899141669273376, -0.6613994836807251, -0.6328848600387573, -0.6043701767921448, -0.575855553150177, -0.5473408699035645, -0.5188262462615967, -0.49031156301498413, -0.46179693937301636, -0.4332822859287262, -0.40476763248443604, -0.3762529790401459, -0.3477383255958557, -0.31922367215156555, -0.2907090187072754, -0.2621943950653076, -0.23367972671985626, -0.2051650732755661, -0.17665041983127594, -0.14813576638698578, -0.11962112039327621, -0.09110646694898605, -0.06259182095527649, -0.03407716751098633, -0.005562514066696167, 0.022952139377593994, 0.051466792821884155, 0.07998144626617432, 0.10849609225988388, 0.13701075315475464, 0.1655253916978836, 0.19404004514217377, 0.22255469858646393, 0.2510693669319153, 0.27958402037620544, 0.3080986738204956, 0.33661332726478577, 0.3651279807090759, 0.3936426043510437, 0.42215728759765625, 0.450671911239624, 0.4791865646839142, 0.5077012181282043, 0.5362158417701721, 0.5647305250167847, 0.5932451486587524, 0.621759831905365, 0.6502744555473328, 0.6787891387939453, 0.7073037624359131, 0.7358183860778809, 0.7643330693244934, 0.7928476929664612, 0.8213623762130737, 0.8498769998550415, 0.878391683101654, 0.9069063067436218, 0.9354209899902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 3.0, 9.0, 17.0, 21.0, 29.0, 52.0, 90.0, 131.0, 235.0, 455.0, 808.0, 1479.0, 3027.0, 6199.0, 14827.0, 40651.0, 138930.0, 385879.0, 310025.0, 94738.0, 29288.0, 11340.0, 5072.0, 2391.0, 1297.0, 650.0, 335.0, 214.0, 131.0, 83.0, 48.0, 33.0, 20.0, 13.0, 12.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25554656982421875, -0.2466888427734375, -0.23783111572265625, -0.228973388671875, -0.22011566162109375, -0.2112579345703125, -0.20240020751953125, -0.19354248046875, -0.18468475341796875, -0.1758270263671875, -0.16696929931640625, -0.158111572265625, -0.14925384521484375, -0.1403961181640625, -0.13153839111328125, -0.1226806640625, -0.11382293701171875, -0.1049652099609375, -0.09610748291015625, -0.087249755859375, -0.07839202880859375, -0.0695343017578125, -0.06067657470703125, -0.05181884765625, -0.04296112060546875, -0.0341033935546875, -0.02524566650390625, -0.016387939453125, -0.00753021240234375, 0.0013275146484375, 0.01018524169921875, 0.01904296875, 0.02790069580078125, 0.0367584228515625, 0.04561614990234375, 0.054473876953125, 0.06333160400390625, 0.0721893310546875, 0.08104705810546875, 0.08990478515625, 0.09876251220703125, 0.1076202392578125, 0.11647796630859375, 0.125335693359375, 0.13419342041015625, 0.1430511474609375, 0.15190887451171875, 0.1607666015625, 0.16962432861328125, 0.1784820556640625, 0.18733978271484375, 0.196197509765625, 0.20505523681640625, 0.2139129638671875, 0.22277069091796875, 0.23162841796875, 0.24048614501953125, 0.2493438720703125, 0.25820159912109375, 0.267059326171875, 0.27591705322265625, 0.2847747802734375, 0.29363250732421875, 0.302490234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 13.0, 13.0, 15.0, 24.0, 29.0, 24.0, 36.0, 32.0, 46.0, 62.0, 54.0, 48.0, 54.0, 52.0, 70.0, 49.0, 51.0, 53.0, 54.0, 31.0, 33.0, 26.0, 21.0, 22.0, 14.0, 11.0, 15.0, 7.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8076171875, -0.7854537963867188, -0.7632904052734375, -0.7411270141601562, -0.718963623046875, -0.6968002319335938, -0.6746368408203125, -0.6524734497070312, -0.63031005859375, -0.6081466674804688, -0.5859832763671875, -0.5638198852539062, -0.541656494140625, -0.5194931030273438, -0.4973297119140625, -0.47516632080078125, -0.4530029296875, -0.43083953857421875, -0.4086761474609375, -0.38651275634765625, -0.364349365234375, -0.34218597412109375, -0.3200225830078125, -0.29785919189453125, -0.27569580078125, -0.25353240966796875, -0.2313690185546875, -0.20920562744140625, -0.187042236328125, -0.16487884521484375, -0.1427154541015625, -0.12055206298828125, -0.098388671875, -0.07622528076171875, -0.0540618896484375, -0.03189849853515625, -0.009735107421875, 0.01242828369140625, 0.0345916748046875, 0.05675506591796875, 0.07891845703125, 0.10108184814453125, 0.1232452392578125, 0.14540863037109375, 0.167572021484375, 0.18973541259765625, 0.2118988037109375, 0.23406219482421875, 0.2562255859375, 0.27838897705078125, 0.3005523681640625, 0.32271575927734375, 0.344879150390625, 0.36704254150390625, 0.3892059326171875, 0.41136932373046875, 0.43353271484375, 0.45569610595703125, 0.4778594970703125, 0.5000228881835938, 0.522186279296875, 0.5443496704101562, 0.5665130615234375, 0.5886764526367188, 0.61083984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 10.0, 8.0, 12.0, 14.0, 20.0, 28.0, 47.0, 74.0, 90.0, 206.0, 387.0, 860.0, 2040.0, 5195.0, 14912.0, 57496.0, 258660.0, 477305.0, 174319.0, 38830.0, 11041.0, 3923.0, 1567.0, 694.0, 335.0, 186.0, 97.0, 68.0, 30.0, 31.0, 19.0, 17.0, 8.0, 5.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.337646484375, -0.3280982971191406, -0.31855010986328125, -0.3090019226074219, -0.2994537353515625, -0.2899055480957031, -0.28035736083984375, -0.2708091735839844, -0.261260986328125, -0.2517127990722656, -0.24216461181640625, -0.23261642456054688, -0.2230682373046875, -0.21352005004882812, -0.20397186279296875, -0.19442367553710938, -0.18487548828125, -0.17532730102539062, -0.16577911376953125, -0.15623092651367188, -0.1466827392578125, -0.13713455200195312, -0.12758636474609375, -0.11803817749023438, -0.108489990234375, -0.09894180297851562, -0.08939361572265625, -0.07984542846679688, -0.0702972412109375, -0.060749053955078125, -0.05120086669921875, -0.041652679443359375, -0.0321044921875, -0.022556304931640625, -0.01300811767578125, -0.003459930419921875, 0.0060882568359375, 0.015636444091796875, 0.02518463134765625, 0.034732818603515625, 0.044281005859375, 0.053829193115234375, 0.06337738037109375, 0.07292556762695312, 0.0824737548828125, 0.09202194213867188, 0.10157012939453125, 0.11111831665039062, 0.12066650390625, 0.13021469116210938, 0.13976287841796875, 0.14931106567382812, 0.1588592529296875, 0.16840744018554688, 0.17795562744140625, 0.18750381469726562, 0.197052001953125, 0.20660018920898438, 0.21614837646484375, 0.22569656372070312, 0.2352447509765625, 0.24479293823242188, 0.25434112548828125, 0.2638893127441406, 0.2734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 14.0, 10.0, 15.0, 18.0, 20.0, 32.0, 46.0, 41.0, 49.0, 63.0, 66.0, 66.0, 80.0, 75.0, 62.0, 65.0, 56.0, 48.0, 37.0, 32.0, 33.0, 30.0, 13.0, 8.0, 8.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.328125, -1.27239990234375, -1.2166748046875, -1.16094970703125, -1.105224609375, -1.04949951171875, -0.9937744140625, -0.93804931640625, -0.88232421875, -0.82659912109375, -0.7708740234375, -0.71514892578125, -0.659423828125, -0.60369873046875, -0.5479736328125, -0.49224853515625, -0.4365234375, -0.38079833984375, -0.3250732421875, -0.26934814453125, -0.213623046875, -0.15789794921875, -0.1021728515625, -0.04644775390625, 0.00927734375, 0.06500244140625, 0.1207275390625, 0.17645263671875, 0.232177734375, 0.28790283203125, 0.3436279296875, 0.39935302734375, 0.455078125, 0.51080322265625, 0.5665283203125, 0.62225341796875, 0.677978515625, 0.73370361328125, 0.7894287109375, 0.84515380859375, 0.90087890625, 0.95660400390625, 1.0123291015625, 1.06805419921875, 1.123779296875, 1.17950439453125, 1.2352294921875, 1.29095458984375, 1.3466796875, 1.40240478515625, 1.4581298828125, 1.51385498046875, 1.569580078125, 1.62530517578125, 1.6810302734375, 1.73675537109375, 1.79248046875, 1.84820556640625, 1.9039306640625, 1.95965576171875, 2.015380859375, 2.07110595703125, 2.1268310546875, 2.18255615234375, 2.23828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 10.0, 9.0, 19.0, 16.0, 31.0, 47.0, 94.0, 142.0, 309.0, 548.0, 1186.0, 2440.0, 6248.0, 19258.0, 76325.0, 407402.0, 422437.0, 80237.0, 20139.0, 6537.0, 2648.0, 1143.0, 575.0, 304.0, 159.0, 89.0, 72.0, 38.0, 26.0, 17.0, 14.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1337890625, -0.1296100616455078, -0.12543106079101562, -0.12125205993652344, -0.11707305908203125, -0.11289405822753906, -0.10871505737304688, -0.10453605651855469, -0.1003570556640625, -0.09617805480957031, -0.09199905395507812, -0.08782005310058594, -0.08364105224609375, -0.07946205139160156, -0.07528305053710938, -0.07110404968261719, -0.066925048828125, -0.06274604797363281, -0.058567047119140625, -0.05438804626464844, -0.05020904541015625, -0.04603004455566406, -0.041851043701171875, -0.03767204284667969, -0.0334930419921875, -0.029314041137695312, -0.025135040283203125, -0.020956039428710938, -0.01677703857421875, -0.012598037719726562, -0.008419036865234375, -0.0042400360107421875, -6.103515625e-05, 0.0041179656982421875, 0.008296966552734375, 0.012475967407226562, 0.01665496826171875, 0.020833969116210938, 0.025012969970703125, 0.029191970825195312, 0.0333709716796875, 0.03754997253417969, 0.041728973388671875, 0.04590797424316406, 0.05008697509765625, 0.05426597595214844, 0.058444976806640625, 0.06262397766113281, 0.066802978515625, 0.07098197937011719, 0.07516098022460938, 0.07933998107910156, 0.08351898193359375, 0.08769798278808594, 0.09187698364257812, 0.09605598449707031, 0.1002349853515625, 0.10441398620605469, 0.10859298706054688, 0.11277198791503906, 0.11695098876953125, 0.12112998962402344, 0.12530899047851562, 0.1294879913330078, 0.1336669921875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 12.0, 8.0, 11.0, 14.0, 18.0, 30.0, 30.0, 59.0, 70.0, 80.0, 81.0, 101.0, 111.0, 95.0, 54.0, 48.0, 40.0, 36.0, 19.0, 21.0, 14.0, 9.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.267692565917969e-05, -4.113186150789261e-05, -3.958679735660553e-05, -3.804173320531845e-05, -3.649666905403137e-05, -3.495160490274429e-05, -3.3406540751457214e-05, -3.1861476600170135e-05, -3.0316412448883057e-05, -2.8771348297595978e-05, -2.72262841463089e-05, -2.568121999502182e-05, -2.413615584373474e-05, -2.2591091692447662e-05, -2.1046027541160583e-05, -1.9500963389873505e-05, -1.7955899238586426e-05, -1.6410835087299347e-05, -1.4865770936012268e-05, -1.332070678472519e-05, -1.177564263343811e-05, -1.0230578482151031e-05, -8.685514330863953e-06, -7.140450179576874e-06, -5.595386028289795e-06, -4.050321877002716e-06, -2.505257725715637e-06, -9.601935744285583e-07, 5.848705768585205e-07, 2.1299347281455994e-06, 3.6749988794326782e-06, 5.220063030719757e-06, 6.765127182006836e-06, 8.310191333293915e-06, 9.855255484580994e-06, 1.1400319635868073e-05, 1.2945383787155151e-05, 1.449044793844223e-05, 1.603551208972931e-05, 1.7580576241016388e-05, 1.9125640392303467e-05, 2.0670704543590546e-05, 2.2215768694877625e-05, 2.3760832846164703e-05, 2.5305896997451782e-05, 2.685096114873886e-05, 2.839602530002594e-05, 2.994108945131302e-05, 3.14861536026001e-05, 3.3031217753887177e-05, 3.4576281905174255e-05, 3.6121346056461334e-05, 3.766641020774841e-05, 3.921147435903549e-05, 4.075653851032257e-05, 4.230160266160965e-05, 4.384666681289673e-05, 4.539173096418381e-05, 4.6936795115470886e-05, 4.8481859266757965e-05, 5.0026923418045044e-05, 5.157198756933212e-05, 5.31170517206192e-05, 5.466211587190628e-05, 5.620718002319336e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 11.0, 11.0, 14.0, 30.0, 27.0, 38.0, 57.0, 71.0, 124.0, 193.0, 367.0, 675.0, 1498.0, 3428.0, 8485.0, 23879.0, 87509.0, 406768.0, 393522.0, 84252.0, 22911.0, 8170.0, 3343.0, 1455.0, 686.0, 362.0, 213.0, 118.0, 73.0, 62.0, 44.0, 27.0, 26.0, 17.0, 14.0, 13.0, 11.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1226806640625, -0.11858940124511719, -0.11449813842773438, -0.11040687561035156, -0.10631561279296875, -0.10222434997558594, -0.09813308715820312, -0.09404182434082031, -0.0899505615234375, -0.08585929870605469, -0.08176803588867188, -0.07767677307128906, -0.07358551025390625, -0.06949424743652344, -0.06540298461914062, -0.06131172180175781, -0.057220458984375, -0.05312919616699219, -0.049037933349609375, -0.04494667053222656, -0.04085540771484375, -0.03676414489746094, -0.032672882080078125, -0.028581619262695312, -0.0244903564453125, -0.020399093627929688, -0.016307830810546875, -0.012216567993164062, -0.00812530517578125, -0.0040340423583984375, 5.7220458984375e-05, 0.0041484832763671875, 0.00823974609375, 0.012331008911132812, 0.016422271728515625, 0.020513534545898438, 0.02460479736328125, 0.028696060180664062, 0.032787322998046875, 0.03687858581542969, 0.0409698486328125, 0.04506111145019531, 0.049152374267578125, 0.05324363708496094, 0.05733489990234375, 0.06142616271972656, 0.06551742553710938, 0.06960868835449219, 0.073699951171875, 0.07779121398925781, 0.08188247680664062, 0.08597373962402344, 0.09006500244140625, 0.09415626525878906, 0.09824752807617188, 0.10233879089355469, 0.1064300537109375, 0.11052131652832031, 0.11461257934570312, 0.11870384216308594, 0.12279510498046875, 0.12688636779785156, 0.13097763061523438, 0.1350688934326172, 0.13916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 5.0, 4.0, 2.0, 3.0, 10.0, 9.0, 6.0, 7.0, 11.0, 20.0, 29.0, 33.0, 61.0, 59.0, 81.0, 95.0, 96.0, 107.0, 82.0, 58.0, 56.0, 41.0, 30.0, 23.0, 15.0, 12.0, 8.0, 10.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.036712646484375, -0.03546857833862305, -0.034224510192871094, -0.03298044204711914, -0.03173637390136719, -0.030492305755615234, -0.02924823760986328, -0.028004169464111328, -0.026760101318359375, -0.025516033172607422, -0.02427196502685547, -0.023027896881103516, -0.021783828735351562, -0.02053976058959961, -0.019295692443847656, -0.018051624298095703, -0.01680755615234375, -0.015563488006591797, -0.014319419860839844, -0.01307535171508789, -0.011831283569335938, -0.010587215423583984, -0.009343147277832031, -0.008099079132080078, -0.006855010986328125, -0.005610942840576172, -0.004366874694824219, -0.0031228065490722656, -0.0018787384033203125, -0.0006346702575683594, 0.0006093978881835938, 0.0018534660339355469, 0.0030975341796875, 0.004341602325439453, 0.005585670471191406, 0.006829738616943359, 0.008073806762695312, 0.009317874908447266, 0.010561943054199219, 0.011806011199951172, 0.013050079345703125, 0.014294147491455078, 0.015538215637207031, 0.016782283782958984, 0.018026351928710938, 0.01927042007446289, 0.020514488220214844, 0.021758556365966797, 0.02300262451171875, 0.024246692657470703, 0.025490760803222656, 0.02673482894897461, 0.027978897094726562, 0.029222965240478516, 0.03046703338623047, 0.03171110153198242, 0.032955169677734375, 0.03419923782348633, 0.03544330596923828, 0.036687374114990234, 0.03793144226074219, 0.03917551040649414, 0.040419578552246094, 0.04166364669799805, 0.04290771484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 11.0, 14.0, 36.0, 58.0, 106.0, 121.0, 140.0, 168.0, 123.0, 86.0, 62.0, 37.0, 14.0, 9.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1071770191192627, -1.060936689376831, -1.014696478843689, -0.9684562087059021, -0.9222159385681152, -0.8759756684303284, -0.8297353982925415, -0.7834951281547546, -0.7372548580169678, -0.6910145878791809, -0.644774317741394, -0.5985340476036072, -0.5522937774658203, -0.5060535073280334, -0.4598132371902466, -0.4135729670524597, -0.36733269691467285, -0.321092426776886, -0.2748521566390991, -0.22861188650131226, -0.1823716163635254, -0.13613134622573853, -0.08989107608795166, -0.043650805950164795, 0.0025894641876220703, 0.048829734325408936, 0.0950700044631958, 0.14131027460098267, 0.18755054473876953, 0.2337908148765564, 0.28003108501434326, 0.3262713551521301, 0.372511625289917, 0.41875189542770386, 0.4649921655654907, 0.5112324357032776, 0.5574727058410645, 0.6037129759788513, 0.6499532461166382, 0.696193516254425, 0.7424337863922119, 0.7886740565299988, 0.8349143266677856, 0.8811545968055725, 0.9273948669433594, 0.9736351370811462, 1.019875407218933, 1.0661156177520752, 1.1123559474945068, 1.1585962772369385, 1.2048364877700806, 1.2510766983032227, 1.2973170280456543, 1.343557357788086, 1.389797568321228, 1.4360377788543701, 1.4822781085968018, 1.5285184383392334, 1.5747586488723755, 1.6209988594055176, 1.6672391891479492, 1.7134795188903809, 1.759719729423523, 1.805959939956665, 1.8522002696990967]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 4.0, 14.0, 18.0, 14.0, 26.0, 23.0, 30.0, 34.0, 48.0, 52.0, 54.0, 52.0, 54.0, 53.0, 58.0, 42.0, 44.0, 47.0, 50.0, 44.0, 33.0, 36.0, 22.0, 25.0, 17.0, 21.0, 14.0, 11.0, 9.0, 8.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7224306464195251, -0.7024909853935242, -0.6825513243675232, -0.6626116633415222, -0.6426719427108765, -0.6227322816848755, -0.6027926206588745, -0.5828529596328735, -0.5629132986068726, -0.5429736375808716, -0.5230339765548706, -0.5030943155288696, -0.48315462470054626, -0.4632149636745453, -0.4432752728462219, -0.42333561182022095, -0.40339595079421997, -0.383456289768219, -0.363516628742218, -0.34357693791389465, -0.3236372768878937, -0.3036976158618927, -0.28375792503356934, -0.26381826400756836, -0.24387860298156738, -0.2239389419555664, -0.20399926602840424, -0.18405959010124207, -0.1641199290752411, -0.1441802680492401, -0.12424059212207794, -0.10430091619491577, -0.08436119556427002, -0.06442152708768845, -0.04448185861110687, -0.0245421901345253, -0.004602521657943726, 0.015337146818637848, 0.03527681529521942, 0.05521649122238159, 0.07515615224838257, 0.09509582072496414, 0.11503548920154572, 0.13497516512870789, 0.15491482615470886, 0.17485448718070984, 0.194794163107872, 0.21473383903503418, 0.23467350006103516, 0.25461316108703613, 0.2745528221130371, 0.2944925129413605, 0.31443217396736145, 0.3343718349933624, 0.3543115258216858, 0.37425118684768677, 0.39419084787368774, 0.4141305088996887, 0.4340701699256897, 0.45400986075401306, 0.47394952178001404, 0.493889182806015, 0.5138288736343384, 0.5337685346603394, 0.5537081956863403]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 13.0, 22.0, 39.0, 70.0, 133.0, 277.0, 700.0, 1754.0, 5247.0, 18080.0, 108959.0, 813058.0, 78205.0, 15012.0, 4268.0, 1558.0, 584.0, 256.0, 142.0, 66.0, 38.0, 29.0, 11.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0439682006835938, -1.0127410888671875, -0.9815139770507812, -0.950286865234375, -0.9190597534179688, -0.8878326416015625, -0.8566055297851562, -0.82537841796875, -0.7941513061523438, -0.7629241943359375, -0.7316970825195312, -0.700469970703125, -0.6692428588867188, -0.6380157470703125, -0.6067886352539062, -0.5755615234375, -0.5443344116210938, -0.5131072998046875, -0.48188018798828125, -0.450653076171875, -0.41942596435546875, -0.3881988525390625, -0.35697174072265625, -0.32574462890625, -0.29451751708984375, -0.2632904052734375, -0.23206329345703125, -0.200836181640625, -0.16960906982421875, -0.1383819580078125, -0.10715484619140625, -0.075927734375, -0.04470062255859375, -0.0134735107421875, 0.01775360107421875, 0.048980712890625, 0.08020782470703125, 0.1114349365234375, 0.14266204833984375, 0.17388916015625, 0.20511627197265625, 0.2363433837890625, 0.26757049560546875, 0.298797607421875, 0.33002471923828125, 0.3612518310546875, 0.39247894287109375, 0.4237060546875, 0.45493316650390625, 0.4861602783203125, 0.5173873901367188, 0.548614501953125, 0.5798416137695312, 0.6110687255859375, 0.6422958374023438, 0.67352294921875, 0.7047500610351562, 0.7359771728515625, 0.7672042846679688, 0.798431396484375, 0.8296585083007812, 0.8608856201171875, 0.8921127319335938, 0.92333984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 6.0, 8.0, 10.0, 19.0, 30.0, 35.0, 47.0, 63.0, 89.0, 83.0, 89.0, 102.0, 75.0, 62.0, 76.0, 50.0, 49.0, 31.0, 22.0, 21.0, 11.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.03125, -2.964385986328125, -2.89752197265625, -2.830657958984375, -2.7637939453125, -2.696929931640625, -2.63006591796875, -2.563201904296875, -2.496337890625, -2.429473876953125, -2.36260986328125, -2.295745849609375, -2.2288818359375, -2.162017822265625, -2.09515380859375, -2.028289794921875, -1.96142578125, -1.894561767578125, -1.82769775390625, -1.760833740234375, -1.6939697265625, -1.627105712890625, -1.56024169921875, -1.493377685546875, -1.426513671875, -1.359649658203125, -1.29278564453125, -1.225921630859375, -1.1590576171875, -1.092193603515625, -1.02532958984375, -0.958465576171875, -0.8916015625, -0.824737548828125, -0.75787353515625, -0.691009521484375, -0.6241455078125, -0.557281494140625, -0.49041748046875, -0.423553466796875, -0.356689453125, -0.289825439453125, -0.22296142578125, -0.156097412109375, -0.0892333984375, -0.022369384765625, 0.04449462890625, 0.111358642578125, 0.17822265625, 0.245086669921875, 0.31195068359375, 0.378814697265625, 0.4456787109375, 0.512542724609375, 0.57940673828125, 0.646270751953125, 0.713134765625, 0.779998779296875, 0.84686279296875, 0.913726806640625, 0.9805908203125, 1.047454833984375, 1.11431884765625, 1.181182861328125, 1.248046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 8.0, 12.0, 21.0, 20.0, 36.0, 48.0, 65.0, 119.0, 257.0, 10181.0, 1035466.0, 1889.0, 169.0, 97.0, 67.0, 39.0, 25.0, 16.0, 13.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3828125, -6.2022705078125, -6.021728515625, -5.8411865234375, -5.66064453125, -5.4801025390625, -5.299560546875, -5.1190185546875, -4.9384765625, -4.7579345703125, -4.577392578125, -4.3968505859375, -4.21630859375, -4.0357666015625, -3.855224609375, -3.6746826171875, -3.494140625, -3.3135986328125, -3.133056640625, -2.9525146484375, -2.77197265625, -2.5914306640625, -2.410888671875, -2.2303466796875, -2.0498046875, -1.8692626953125, -1.688720703125, -1.5081787109375, -1.32763671875, -1.1470947265625, -0.966552734375, -0.7860107421875, -0.60546875, -0.4249267578125, -0.244384765625, -0.0638427734375, 0.11669921875, 0.2972412109375, 0.477783203125, 0.6583251953125, 0.8388671875, 1.0194091796875, 1.199951171875, 1.3804931640625, 1.56103515625, 1.7415771484375, 1.922119140625, 2.1026611328125, 2.283203125, 2.4637451171875, 2.644287109375, 2.8248291015625, 3.00537109375, 3.1859130859375, 3.366455078125, 3.5469970703125, 3.7275390625, 3.9080810546875, 4.088623046875, 4.2691650390625, 4.44970703125, 4.6302490234375, 4.810791015625, 4.9913330078125, 5.171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 14.0, 22.0, 19.0, 32.0, 38.0, 57.0, 58.0, 89.0, 104.0, 125.0, 93.0, 80.0, 84.0, 66.0, 42.0, 25.0, 21.0, 9.0, 15.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.58203125, -3.483673095703125, -3.38531494140625, -3.286956787109375, -3.1885986328125, -3.090240478515625, -2.99188232421875, -2.893524169921875, -2.795166015625, -2.696807861328125, -2.59844970703125, -2.500091552734375, -2.4017333984375, -2.303375244140625, -2.20501708984375, -2.106658935546875, -2.00830078125, -1.909942626953125, -1.81158447265625, -1.713226318359375, -1.6148681640625, -1.516510009765625, -1.41815185546875, -1.319793701171875, -1.221435546875, -1.123077392578125, -1.02471923828125, -0.926361083984375, -0.8280029296875, -0.729644775390625, -0.63128662109375, -0.532928466796875, -0.4345703125, -0.336212158203125, -0.23785400390625, -0.139495849609375, -0.0411376953125, 0.057220458984375, 0.15557861328125, 0.253936767578125, 0.352294921875, 0.450653076171875, 0.54901123046875, 0.647369384765625, 0.7457275390625, 0.844085693359375, 0.94244384765625, 1.040802001953125, 1.13916015625, 1.237518310546875, 1.33587646484375, 1.434234619140625, 1.5325927734375, 1.630950927734375, 1.72930908203125, 1.827667236328125, 1.926025390625, 2.024383544921875, 2.12274169921875, 2.221099853515625, 2.3194580078125, 2.417816162109375, 2.51617431640625, 2.614532470703125, 2.712890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 21.0, 31.0, 46.0, 80.0, 134.0, 304.0, 754.0, 2884.0, 15471.0, 276747.0, 720610.0, 25774.0, 4025.0, 955.0, 324.0, 154.0, 93.0, 43.0, 27.0, 10.0, 13.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.266357421875, -0.2543144226074219, -0.24227142333984375, -0.23022842407226562, -0.2181854248046875, -0.20614242553710938, -0.19409942626953125, -0.18205642700195312, -0.170013427734375, -0.15797042846679688, -0.14592742919921875, -0.13388442993164062, -0.1218414306640625, -0.10979843139648438, -0.09775543212890625, -0.08571243286132812, -0.07366943359375, -0.061626434326171875, -0.04958343505859375, -0.037540435791015625, -0.0254974365234375, -0.013454437255859375, -0.00141143798828125, 0.010631561279296875, 0.022674560546875, 0.034717559814453125, 0.04676055908203125, 0.058803558349609375, 0.0708465576171875, 0.08288955688476562, 0.09493255615234375, 0.10697555541992188, 0.1190185546875, 0.13106155395507812, 0.14310455322265625, 0.15514755249023438, 0.1671905517578125, 0.17923355102539062, 0.19127655029296875, 0.20331954956054688, 0.215362548828125, 0.22740554809570312, 0.23944854736328125, 0.2514915466308594, 0.2635345458984375, 0.2755775451660156, 0.28762054443359375, 0.2996635437011719, 0.31170654296875, 0.3237495422363281, 0.33579254150390625, 0.3478355407714844, 0.3598785400390625, 0.3719215393066406, 0.38396453857421875, 0.3960075378417969, 0.408050537109375, 0.4200935363769531, 0.43213653564453125, 0.4441795349121094, 0.4562225341796875, 0.4682655334472656, 0.48030853271484375, 0.4923515319824219, 0.50439453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 1.0, 5.0, 9.0, 13.0, 13.0, 26.0, 47.0, 74.0, 132.0, 220.0, 165.0, 105.0, 74.0, 38.0, 26.0, 8.0, 14.0, 4.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.792213439941406e-05, -4.6581029891967773e-05, -4.5239925384521484e-05, -4.3898820877075195e-05, -4.2557716369628906e-05, -4.121661186218262e-05, -3.987550735473633e-05, -3.853440284729004e-05, -3.719329833984375e-05, -3.585219383239746e-05, -3.451108932495117e-05, -3.316998481750488e-05, -3.1828880310058594e-05, -3.0487775802612305e-05, -2.9146671295166016e-05, -2.7805566787719727e-05, -2.6464462280273438e-05, -2.512335777282715e-05, -2.378225326538086e-05, -2.244114875793457e-05, -2.110004425048828e-05, -1.9758939743041992e-05, -1.8417835235595703e-05, -1.7076730728149414e-05, -1.5735626220703125e-05, -1.4394521713256836e-05, -1.3053417205810547e-05, -1.1712312698364258e-05, -1.0371208190917969e-05, -9.03010368347168e-06, -7.68899917602539e-06, -6.3478946685791016e-06, -5.0067901611328125e-06, -3.6656856536865234e-06, -2.3245811462402344e-06, -9.834766387939453e-07, 3.5762786865234375e-07, 1.6987323760986328e-06, 3.039836883544922e-06, 4.380941390991211e-06, 5.7220458984375e-06, 7.063150405883789e-06, 8.404254913330078e-06, 9.745359420776367e-06, 1.1086463928222656e-05, 1.2427568435668945e-05, 1.3768672943115234e-05, 1.5109777450561523e-05, 1.6450881958007812e-05, 1.77919864654541e-05, 1.913309097290039e-05, 2.047419548034668e-05, 2.181529998779297e-05, 2.3156404495239258e-05, 2.4497509002685547e-05, 2.5838613510131836e-05, 2.7179718017578125e-05, 2.8520822525024414e-05, 2.9861927032470703e-05, 3.120303153991699e-05, 3.254413604736328e-05, 3.388524055480957e-05, 3.522634506225586e-05, 3.656744956970215e-05, 3.790855407714844e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 9.0, 16.0, 16.0, 16.0, 39.0, 78.0, 141.0, 266.0, 690.0, 1832.0, 6756.0, 64865.0, 908311.0, 56094.0, 6419.0, 1769.0, 604.0, 273.0, 148.0, 72.0, 45.0, 32.0, 12.0, 11.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.443359375, -0.42722320556640625, -0.4110870361328125, -0.39495086669921875, -0.378814697265625, -0.36267852783203125, -0.3465423583984375, -0.33040618896484375, -0.31427001953125, -0.29813385009765625, -0.2819976806640625, -0.26586151123046875, -0.249725341796875, -0.23358917236328125, -0.2174530029296875, -0.20131683349609375, -0.1851806640625, -0.16904449462890625, -0.1529083251953125, -0.13677215576171875, -0.120635986328125, -0.10449981689453125, -0.0883636474609375, -0.07222747802734375, -0.05609130859375, -0.03995513916015625, -0.0238189697265625, -0.00768280029296875, 0.008453369140625, 0.02458953857421875, 0.0407257080078125, 0.05686187744140625, 0.072998046875, 0.08913421630859375, 0.1052703857421875, 0.12140655517578125, 0.137542724609375, 0.15367889404296875, 0.1698150634765625, 0.18595123291015625, 0.20208740234375, 0.21822357177734375, 0.2343597412109375, 0.25049591064453125, 0.266632080078125, 0.28276824951171875, 0.2989044189453125, 0.31504058837890625, 0.3311767578125, 0.34731292724609375, 0.3634490966796875, 0.37958526611328125, 0.395721435546875, 0.41185760498046875, 0.4279937744140625, 0.44412994384765625, 0.46026611328125, 0.47640228271484375, 0.4925384521484375, 0.5086746215820312, 0.524810791015625, 0.5409469604492188, 0.5570831298828125, 0.5732192993164062, 0.58935546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 19.0, 30.0, 43.0, 67.0, 114.0, 244.0, 181.0, 110.0, 49.0, 35.0, 24.0, 18.0, 10.0, 3.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1981201171875, -0.19259071350097656, -0.18706130981445312, -0.1815319061279297, -0.17600250244140625, -0.1704730987548828, -0.16494369506835938, -0.15941429138183594, -0.1538848876953125, -0.14835548400878906, -0.14282608032226562, -0.1372966766357422, -0.13176727294921875, -0.1262378692626953, -0.12070846557617188, -0.11517906188964844, -0.109649658203125, -0.10412025451660156, -0.09859085083007812, -0.09306144714355469, -0.08753204345703125, -0.08200263977050781, -0.07647323608398438, -0.07094383239746094, -0.0654144287109375, -0.05988502502441406, -0.054355621337890625, -0.04882621765136719, -0.04329681396484375, -0.03776741027832031, -0.032238006591796875, -0.026708602905273438, -0.02117919921875, -0.015649795532226562, -0.010120391845703125, -0.0045909881591796875, 0.00093841552734375, 0.0064678192138671875, 0.011997222900390625, 0.017526626586914062, 0.0230560302734375, 0.028585433959960938, 0.034114837646484375, 0.03964424133300781, 0.04517364501953125, 0.05070304870605469, 0.056232452392578125, 0.06176185607910156, 0.067291259765625, 0.07282066345214844, 0.07835006713867188, 0.08387947082519531, 0.08940887451171875, 0.09493827819824219, 0.10046768188476562, 0.10599708557128906, 0.1115264892578125, 0.11705589294433594, 0.12258529663085938, 0.1281147003173828, 0.13364410400390625, 0.1391735076904297, 0.14470291137695312, 0.15023231506347656, 0.15576171875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 10.0, 40.0, 98.0, 165.0, 204.0, 210.0, 134.0, 90.0, 28.0, 9.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93709135055542, -5.7985615730285645, -5.660031318664551, -5.521501541137695, -5.38297176361084, -5.244441986083984, -5.105911731719971, -4.967381954193115, -4.82885217666626, -4.690322399139404, -4.551792144775391, -4.413262367248535, -4.27473258972168, -4.136202812194824, -3.9976725578308105, -3.859142780303955, -3.7206127643585205, -3.582082748413086, -3.4435529708862305, -3.305022954940796, -3.1664931774139404, -3.027963161468506, -2.8894333839416504, -2.750903367996216, -2.6123733520507812, -2.4738433361053467, -2.335313558578491, -2.1967835426330566, -2.058253765106201, -1.9197237491607666, -1.7811938524246216, -1.6426639556884766, -1.504133939743042, -1.365604043006897, -1.227074146270752, -1.0885441303253174, -0.9500142931938171, -0.8114843964576721, -0.6729544401168823, -0.5344245433807373, -0.3958946466445923, -0.25736474990844727, -0.11883482336997986, 0.01969510316848755, 0.15822499990463257, 0.2967548966407776, 0.4352848529815674, 0.5738147497177124, 0.7123446464538574, 0.8508745431900024, 0.9894044399261475, 1.127934455871582, 1.2664642333984375, 1.404994249343872, 1.543524146080017, 1.682054042816162, 1.8205839395523071, 1.9591138362884521, 2.0976438522338867, 2.236173629760742, 2.3747036457061768, 2.5132334232330322, 2.651763439178467, 2.7902932167053223, 2.928823232650757]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 10.0, 13.0, 15.0, 15.0, 15.0, 32.0, 26.0, 30.0, 28.0, 22.0, 36.0, 36.0, 41.0, 36.0, 54.0, 32.0, 35.0, 47.0, 40.0, 33.0, 29.0, 34.0, 42.0, 30.0, 32.0, 23.0, 34.0, 30.0, 16.0, 18.0, 12.0, 12.0, 15.0, 7.0, 8.0, 8.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-2.3927602767944336, -2.323352813720703, -2.2539453506469727, -2.184537649154663, -2.1151301860809326, -2.045722723007202, -1.9763151407241821, -1.906907558441162, -1.8375000953674316, -1.7680926322937012, -1.6986850500106812, -1.6292774677276611, -1.5598700046539307, -1.4904625415802002, -1.4210549592971802, -1.3516473770141602, -1.2822399139404297, -1.2128324508666992, -1.1434248685836792, -1.0740172863006592, -1.0046098232269287, -0.9352023005485535, -0.8657947778701782, -0.796387255191803, -0.7269797325134277, -0.6575722098350525, -0.5881646871566772, -0.518757164478302, -0.44934964179992676, -0.3799421191215515, -0.31053459644317627, -0.24112707376480103, -0.17171955108642578, -0.10231202840805054, -0.03290450572967529, 0.03650301694869995, 0.1059105396270752, 0.17531806230545044, 0.24472558498382568, 0.3141331076622009, 0.38354063034057617, 0.4529481530189514, 0.5223556756973267, 0.5917631983757019, 0.6611707210540771, 0.7305782437324524, 0.7999857664108276, 0.8693932890892029, 0.9388008117675781, 1.0082082748413086, 1.0776158571243286, 1.1470234394073486, 1.216430902481079, 1.2858383655548096, 1.3552459478378296, 1.4246535301208496, 1.49406099319458, 1.5634684562683105, 1.6328760385513306, 1.7022836208343506, 1.771691083908081, 1.8410985469818115, 1.9105061292648315, 1.9799137115478516, 2.049321174621582]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 9.0, 2.0, 8.0, 11.0, 17.0, 27.0, 40.0, 47.0, 64.0, 108.0, 203.0, 489.0, 1053.0, 2906.0, 8760.0, 40160.0, 469560.0, 3193536.0, 425995.0, 37843.0, 8707.0, 2739.0, 1025.0, 400.0, 210.0, 123.0, 72.0, 46.0, 25.0, 23.0, 27.0, 9.0, 11.0, 11.0, 5.0, 7.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3779296875, -1.3259124755859375, -1.273895263671875, -1.2218780517578125, -1.16986083984375, -1.1178436279296875, -1.065826416015625, -1.0138092041015625, -0.9617919921875, -0.9097747802734375, -0.857757568359375, -0.8057403564453125, -0.75372314453125, -0.7017059326171875, -0.649688720703125, -0.5976715087890625, -0.545654296875, -0.4936370849609375, -0.441619873046875, -0.3896026611328125, -0.33758544921875, -0.2855682373046875, -0.233551025390625, -0.1815338134765625, -0.1295166015625, -0.0774993896484375, -0.025482177734375, 0.0265350341796875, 0.07855224609375, 0.1305694580078125, 0.182586669921875, 0.2346038818359375, 0.28662109375, 0.3386383056640625, 0.390655517578125, 0.4426727294921875, 0.49468994140625, 0.5467071533203125, 0.598724365234375, 0.6507415771484375, 0.7027587890625, 0.7547760009765625, 0.806793212890625, 0.8588104248046875, 0.91082763671875, 0.9628448486328125, 1.014862060546875, 1.0668792724609375, 1.118896484375, 1.1709136962890625, 1.222930908203125, 1.2749481201171875, 1.32696533203125, 1.3789825439453125, 1.430999755859375, 1.4830169677734375, 1.5350341796875, 1.5870513916015625, 1.639068603515625, 1.6910858154296875, 1.74310302734375, 1.7951202392578125, 1.847137451171875, 1.8991546630859375, 1.951171875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 6.0, 5.0, 15.0, 6.0, 13.0, 17.0, 13.0, 23.0, 37.0, 38.0, 24.0, 34.0, 43.0, 58.0, 45.0, 49.0, 54.0, 52.0, 48.0, 45.0, 43.0, 36.0, 31.0, 29.0, 28.0, 36.0, 28.0, 24.0, 22.0, 19.0, 14.0, 8.0, 5.0, 7.0, 7.0, 10.0, 3.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.67333984375, -0.6512908935546875, -0.629241943359375, -0.6071929931640625, -0.58514404296875, -0.5630950927734375, -0.541046142578125, -0.5189971923828125, -0.4969482421875, -0.4748992919921875, -0.452850341796875, -0.4308013916015625, -0.40875244140625, -0.3867034912109375, -0.364654541015625, -0.3426055908203125, -0.320556640625, -0.2985076904296875, -0.276458740234375, -0.2544097900390625, -0.23236083984375, -0.2103118896484375, -0.188262939453125, -0.1662139892578125, -0.1441650390625, -0.1221160888671875, -0.100067138671875, -0.0780181884765625, -0.05596923828125, -0.0339202880859375, -0.011871337890625, 0.0101776123046875, 0.0322265625, 0.0542755126953125, 0.076324462890625, 0.0983734130859375, 0.12042236328125, 0.1424713134765625, 0.164520263671875, 0.1865692138671875, 0.2086181640625, 0.2306671142578125, 0.252716064453125, 0.2747650146484375, 0.29681396484375, 0.3188629150390625, 0.340911865234375, 0.3629608154296875, 0.385009765625, 0.4070587158203125, 0.429107666015625, 0.4511566162109375, 0.47320556640625, 0.4952545166015625, 0.517303466796875, 0.5393524169921875, 0.5614013671875, 0.5834503173828125, 0.605499267578125, 0.6275482177734375, 0.64959716796875, 0.6716461181640625, 0.693695068359375, 0.7157440185546875, 0.73779296875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 8.0, 16.0, 17.0, 44.0, 43.0, 90.0, 159.0, 321.0, 990.0, 4582.0, 43441.0, 3535116.0, 588808.0, 16815.0, 2608.0, 640.0, 264.0, 107.0, 72.0, 36.0, 39.0, 18.0, 12.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.5625, -2.4765625, -2.390625, -2.3046875, -2.21875, -2.1328125, -2.046875, -1.9609375, -1.875, -1.7890625, -1.703125, -1.6171875, -1.53125, -1.4453125, -1.359375, -1.2734375, -1.1875, -1.1015625, -1.015625, -0.9296875, -0.84375, -0.7578125, -0.671875, -0.5859375, -0.5, -0.4140625, -0.328125, -0.2421875, -0.15625, -0.0703125, 0.015625, 0.1015625, 0.1875, 0.2734375, 0.359375, 0.4453125, 0.53125, 0.6171875, 0.703125, 0.7890625, 0.875, 0.9609375, 1.046875, 1.1328125, 1.21875, 1.3046875, 1.390625, 1.4765625, 1.5625, 1.6484375, 1.734375, 1.8203125, 1.90625, 1.9921875, 2.078125, 2.1640625, 2.25, 2.3359375, 2.421875, 2.5078125, 2.59375, 2.6796875, 2.765625, 2.8515625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 8.0, 11.0, 8.0, 10.0, 18.0, 25.0, 33.0, 42.0, 47.0, 69.0, 125.0, 148.0, 204.0, 299.0, 456.0, 605.0, 554.0, 443.0, 289.0, 173.0, 132.0, 98.0, 78.0, 44.0, 34.0, 27.0, 20.0, 11.0, 12.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.364990234375, -0.353851318359375, -0.34271240234375, -0.331573486328125, -0.3204345703125, -0.309295654296875, -0.29815673828125, -0.287017822265625, -0.27587890625, -0.264739990234375, -0.25360107421875, -0.242462158203125, -0.2313232421875, -0.220184326171875, -0.20904541015625, -0.197906494140625, -0.186767578125, -0.175628662109375, -0.16448974609375, -0.153350830078125, -0.1422119140625, -0.131072998046875, -0.11993408203125, -0.108795166015625, -0.09765625, -0.086517333984375, -0.07537841796875, -0.064239501953125, -0.0531005859375, -0.041961669921875, -0.03082275390625, -0.019683837890625, -0.008544921875, 0.002593994140625, 0.01373291015625, 0.024871826171875, 0.0360107421875, 0.047149658203125, 0.05828857421875, 0.069427490234375, 0.08056640625, 0.091705322265625, 0.10284423828125, 0.113983154296875, 0.1251220703125, 0.136260986328125, 0.14739990234375, 0.158538818359375, 0.169677734375, 0.180816650390625, 0.19195556640625, 0.203094482421875, 0.2142333984375, 0.225372314453125, 0.23651123046875, 0.247650146484375, 0.2587890625, 0.269927978515625, 0.28106689453125, 0.292205810546875, 0.3033447265625, 0.314483642578125, 0.32562255859375, 0.336761474609375, 0.347900390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 8.0, 12.0, 25.0, 40.0, 58.0, 65.0, 84.0, 104.0, 85.0, 90.0, 99.0, 75.0, 61.0, 63.0, 48.0, 37.0, 20.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4661681652069092, -1.4143344163894653, -1.3625006675720215, -1.3106670379638672, -1.2588332891464233, -1.2069995403289795, -1.1551659107208252, -1.1033321619033813, -1.0514984130859375, -0.9996646642684937, -0.9478309750556946, -0.8959972858428955, -0.8441635370254517, -0.7923297882080078, -0.7404960989952087, -0.6886624097824097, -0.6368286609649658, -0.584994912147522, -0.5331612229347229, -0.48132750391960144, -0.42949378490448, -0.3776600658893585, -0.32582634687423706, -0.2739926278591156, -0.22215890884399414, -0.17032518982887268, -0.11849147081375122, -0.06665775179862976, -0.0148240327835083, 0.03700968623161316, 0.08884340524673462, 0.14067712426185608, 0.1925109624862671, 0.24434468150138855, 0.29617840051651, 0.34801211953163147, 0.39984583854675293, 0.4516795575618744, 0.5035132765769958, 0.5553469657897949, 0.6071807146072388, 0.6590144634246826, 0.7108481526374817, 0.7626818418502808, 0.8145155906677246, 0.8663493394851685, 0.9181830286979675, 0.9700167179107666, 1.0218504667282104, 1.0736842155456543, 1.1255178451538086, 1.1773515939712524, 1.2291853427886963, 1.2810190916061401, 1.332852840423584, 1.3846864700317383, 1.4365202188491821, 1.488353967666626, 1.5401875972747803, 1.5920213460922241, 1.643855094909668, 1.6956888437271118, 1.7475225925445557, 1.79935622215271, 1.8511899709701538]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 7.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 9.0, 8.0, 12.0, 12.0, 12.0, 14.0, 24.0, 21.0, 29.0, 31.0, 37.0, 33.0, 33.0, 31.0, 52.0, 48.0, 44.0, 49.0, 45.0, 53.0, 36.0, 37.0, 35.0, 40.0, 27.0, 25.0, 23.0, 19.0, 17.0, 24.0, 23.0, 13.0, 10.0, 13.0, 6.0, 4.0, 6.0, 4.0, 7.0, 7.0, 6.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6828749775886536, -0.6577270030975342, -0.6325790286064148, -0.6074310541152954, -0.582283079624176, -0.5571351051330566, -0.531987190246582, -0.5068391561508179, -0.4816912114620209, -0.4565432369709015, -0.4313952624797821, -0.4062473177909851, -0.3810993432998657, -0.35595136880874634, -0.33080339431762695, -0.30565541982650757, -0.2805074453353882, -0.2553594708442688, -0.23021149635314941, -0.20506353676319122, -0.17991556227207184, -0.15476758778095245, -0.12961962819099426, -0.10447165369987488, -0.0793236792087555, -0.05417570844292641, -0.02902773767709732, -0.0038797706365585327, 0.021268203854560852, 0.04641617834568024, 0.07156413793563843, 0.09671211242675781, 0.12186014652252197, 0.14700812101364136, 0.17215609550476074, 0.19730405509471893, 0.22245202958583832, 0.2476000040769577, 0.2727479636669159, 0.2978959381580353, 0.32304391264915466, 0.34819188714027405, 0.37333986163139343, 0.39848780632019043, 0.4236357808113098, 0.4487837553024292, 0.4739317297935486, 0.49907970428466797, 0.5242276787757874, 0.5493756532669067, 0.5745236277580261, 0.5996716022491455, 0.6248195767402649, 0.6499675512313843, 0.6751154661178589, 0.700263500213623, 0.7254114151000977, 0.750559389591217, 0.7757073640823364, 0.8008553385734558, 0.8260033130645752, 0.8511512875556946, 0.876299262046814, 0.9014471769332886, 0.9265952110290527]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 7.0, 8.0, 5.0, 13.0, 17.0, 19.0, 36.0, 55.0, 80.0, 117.0, 215.0, 362.0, 640.0, 1180.0, 2249.0, 4835.0, 13337.0, 57912.0, 348090.0, 489281.0, 98626.0, 19295.0, 6187.0, 2694.0, 1406.0, 780.0, 418.0, 220.0, 151.0, 96.0, 66.0, 29.0, 31.0, 22.0, 10.0, 14.0, 10.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.453857421875, -0.4392852783203125, -0.424713134765625, -0.4101409912109375, -0.39556884765625, -0.3809967041015625, -0.366424560546875, -0.3518524169921875, -0.3372802734375, -0.3227081298828125, -0.308135986328125, -0.2935638427734375, -0.27899169921875, -0.2644195556640625, -0.249847412109375, -0.2352752685546875, -0.220703125, -0.2061309814453125, -0.191558837890625, -0.1769866943359375, -0.16241455078125, -0.1478424072265625, -0.133270263671875, -0.1186981201171875, -0.1041259765625, -0.0895538330078125, -0.074981689453125, -0.0604095458984375, -0.04583740234375, -0.0312652587890625, -0.016693115234375, -0.0021209716796875, 0.012451171875, 0.0270233154296875, 0.041595458984375, 0.0561676025390625, 0.07073974609375, 0.0853118896484375, 0.099884033203125, 0.1144561767578125, 0.1290283203125, 0.1436004638671875, 0.158172607421875, 0.1727447509765625, 0.18731689453125, 0.2018890380859375, 0.216461181640625, 0.2310333251953125, 0.24560546875, 0.2601776123046875, 0.274749755859375, 0.2893218994140625, 0.30389404296875, 0.3184661865234375, 0.333038330078125, 0.3476104736328125, 0.3621826171875, 0.3767547607421875, 0.391326904296875, 0.4058990478515625, 0.42047119140625, 0.4350433349609375, 0.449615478515625, 0.4641876220703125, 0.478759765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 3.0, 5.0, 6.0, 6.0, 11.0, 17.0, 14.0, 21.0, 23.0, 24.0, 38.0, 33.0, 42.0, 50.0, 50.0, 52.0, 59.0, 66.0, 75.0, 47.0, 42.0, 39.0, 49.0, 20.0, 32.0, 33.0, 26.0, 36.0, 16.0, 15.0, 10.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.654296875, -0.6328964233398438, -0.6114959716796875, -0.5900955200195312, -0.568695068359375, -0.5472946166992188, -0.5258941650390625, -0.5044937133789062, -0.48309326171875, -0.46169281005859375, -0.4402923583984375, -0.41889190673828125, -0.397491455078125, -0.37609100341796875, -0.3546905517578125, -0.33329010009765625, -0.3118896484375, -0.29048919677734375, -0.2690887451171875, -0.24768829345703125, -0.226287841796875, -0.20488739013671875, -0.1834869384765625, -0.16208648681640625, -0.14068603515625, -0.11928558349609375, -0.0978851318359375, -0.07648468017578125, -0.055084228515625, -0.03368377685546875, -0.0122833251953125, 0.00911712646484375, 0.030517578125, 0.05191802978515625, 0.0733184814453125, 0.09471893310546875, 0.116119384765625, 0.13751983642578125, 0.1589202880859375, 0.18032073974609375, 0.20172119140625, 0.22312164306640625, 0.2445220947265625, 0.26592254638671875, 0.287322998046875, 0.30872344970703125, 0.3301239013671875, 0.35152435302734375, 0.3729248046875, 0.39432525634765625, 0.4157257080078125, 0.43712615966796875, 0.458526611328125, 0.47992706298828125, 0.5013275146484375, 0.5227279663085938, 0.54412841796875, 0.5655288696289062, 0.5869293212890625, 0.6083297729492188, 0.629730224609375, 0.6511306762695312, 0.6725311279296875, 0.6939315795898438, 0.71533203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 3.0, 6.0, 11.0, 8.0, 22.0, 39.0, 61.0, 106.0, 205.0, 398.0, 730.0, 1501.0, 3315.0, 9350.0, 37163.0, 210394.0, 557997.0, 180156.0, 32264.0, 8659.0, 3160.0, 1447.0, 733.0, 340.0, 189.0, 99.0, 54.0, 29.0, 25.0, 14.0, 10.0, 9.0, 8.0, 4.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.4371299743652344, -0.42406463623046875, -0.4109992980957031, -0.3979339599609375, -0.3848686218261719, -0.37180328369140625, -0.3587379455566406, -0.345672607421875, -0.3326072692871094, -0.31954193115234375, -0.3064765930175781, -0.2934112548828125, -0.2803459167480469, -0.26728057861328125, -0.2542152404785156, -0.24114990234375, -0.22808456420898438, -0.21501922607421875, -0.20195388793945312, -0.1888885498046875, -0.17582321166992188, -0.16275787353515625, -0.14969253540039062, -0.136627197265625, -0.12356185913085938, -0.11049652099609375, -0.09743118286132812, -0.0843658447265625, -0.07130050659179688, -0.05823516845703125, -0.045169830322265625, -0.0321044921875, -0.019039154052734375, -0.00597381591796875, 0.007091522216796875, 0.0201568603515625, 0.033222198486328125, 0.04628753662109375, 0.059352874755859375, 0.072418212890625, 0.08548355102539062, 0.09854888916015625, 0.11161422729492188, 0.1246795654296875, 0.13774490356445312, 0.15081024169921875, 0.16387557983398438, 0.17694091796875, 0.19000625610351562, 0.20307159423828125, 0.21613693237304688, 0.2292022705078125, 0.24226760864257812, 0.25533294677734375, 0.2683982849121094, 0.281463623046875, 0.2945289611816406, 0.30759429931640625, 0.3206596374511719, 0.3337249755859375, 0.3467903137207031, 0.35985565185546875, 0.3729209899902344, 0.385986328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 2.0, 9.0, 14.0, 14.0, 11.0, 14.0, 25.0, 26.0, 21.0, 24.0, 43.0, 37.0, 42.0, 36.0, 29.0, 37.0, 34.0, 41.0, 47.0, 43.0, 43.0, 41.0, 45.0, 36.0, 37.0, 34.0, 29.0, 27.0, 32.0, 22.0, 22.0, 16.0, 7.0, 9.0, 10.0, 7.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.09375, -1.05615234375, -1.0185546875, -0.98095703125, -0.943359375, -0.90576171875, -0.8681640625, -0.83056640625, -0.79296875, -0.75537109375, -0.7177734375, -0.68017578125, -0.642578125, -0.60498046875, -0.5673828125, -0.52978515625, -0.4921875, -0.45458984375, -0.4169921875, -0.37939453125, -0.341796875, -0.30419921875, -0.2666015625, -0.22900390625, -0.19140625, -0.15380859375, -0.1162109375, -0.07861328125, -0.041015625, -0.00341796875, 0.0341796875, 0.07177734375, 0.109375, 0.14697265625, 0.1845703125, 0.22216796875, 0.259765625, 0.29736328125, 0.3349609375, 0.37255859375, 0.41015625, 0.44775390625, 0.4853515625, 0.52294921875, 0.560546875, 0.59814453125, 0.6357421875, 0.67333984375, 0.7109375, 0.74853515625, 0.7861328125, 0.82373046875, 0.861328125, 0.89892578125, 0.9365234375, 0.97412109375, 1.01171875, 1.04931640625, 1.0869140625, 1.12451171875, 1.162109375, 1.19970703125, 1.2373046875, 1.27490234375, 1.3125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 22.0, 19.0, 28.0, 42.0, 61.0, 87.0, 157.0, 174.0, 306.0, 500.0, 791.0, 1351.0, 2505.0, 4911.0, 10836.0, 29727.0, 102475.0, 341425.0, 375191.0, 120379.0, 33928.0, 11998.0, 5334.0, 2526.0, 1400.0, 813.0, 497.0, 318.0, 209.0, 151.0, 105.0, 66.0, 53.0, 52.0, 42.0, 16.0, 12.0, 7.0, 7.0, 0.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0], "bins": [-0.10943603515625, -0.10622310638427734, -0.10301017761230469, -0.09979724884033203, -0.09658432006835938, -0.09337139129638672, -0.09015846252441406, -0.0869455337524414, -0.08373260498046875, -0.0805196762084961, -0.07730674743652344, -0.07409381866455078, -0.07088088989257812, -0.06766796112060547, -0.06445503234863281, -0.061242103576660156, -0.0580291748046875, -0.054816246032714844, -0.05160331726074219, -0.04839038848876953, -0.045177459716796875, -0.04196453094482422, -0.03875160217285156, -0.035538673400878906, -0.03232574462890625, -0.029112815856933594, -0.025899887084960938, -0.02268695831298828, -0.019474029541015625, -0.01626110076904297, -0.013048171997070312, -0.009835243225097656, -0.006622314453125, -0.0034093856811523438, -0.0001964569091796875, 0.0030164718627929688, 0.006229400634765625, 0.009442329406738281, 0.012655258178710938, 0.015868186950683594, 0.01908111572265625, 0.022294044494628906, 0.025506973266601562, 0.02871990203857422, 0.031932830810546875, 0.03514575958251953, 0.03835868835449219, 0.041571617126464844, 0.0447845458984375, 0.047997474670410156, 0.05121040344238281, 0.05442333221435547, 0.057636260986328125, 0.06084918975830078, 0.06406211853027344, 0.0672750473022461, 0.07048797607421875, 0.0737009048461914, 0.07691383361816406, 0.08012676239013672, 0.08333969116210938, 0.08655261993408203, 0.08976554870605469, 0.09297847747802734, 0.09619140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 9.0, 19.0, 25.0, 48.0, 70.0, 146.0, 153.0, 179.0, 108.0, 96.0, 51.0, 34.0, 25.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011467933654785156, -0.00011166650801897049, -0.00010865367949008942, -0.00010564085096120834, -0.00010262802243232727, -9.96151939034462e-05, -9.660236537456512e-05, -9.358953684568405e-05, -9.057670831680298e-05, -8.75638797879219e-05, -8.455105125904083e-05, -8.153822273015976e-05, -7.852539420127869e-05, -7.551256567239761e-05, -7.249973714351654e-05, -6.948690861463547e-05, -6.64740800857544e-05, -6.346125155687332e-05, -6.044842302799225e-05, -5.7435594499111176e-05, -5.44227659702301e-05, -5.140993744134903e-05, -4.8397108912467957e-05, -4.5384280383586884e-05, -4.237145185470581e-05, -3.935862332582474e-05, -3.6345794796943665e-05, -3.333296626806259e-05, -3.032013773918152e-05, -2.7307309210300446e-05, -2.4294480681419373e-05, -2.12816521525383e-05, -1.8268823623657227e-05, -1.5255995094776154e-05, -1.224316656589508e-05, -9.230338037014008e-06, -6.2175095081329346e-06, -3.2046809792518616e-06, -1.9185245037078857e-07, 2.8209760785102844e-06, 5.833804607391357e-06, 8.84663313627243e-06, 1.1859461665153503e-05, 1.4872290194034576e-05, 1.788511872291565e-05, 2.0897947251796722e-05, 2.3910775780677795e-05, 2.692360430955887e-05, 2.993643283843994e-05, 3.2949261367321014e-05, 3.596208989620209e-05, 3.897491842508316e-05, 4.1987746953964233e-05, 4.5000575482845306e-05, 4.801340401172638e-05, 5.102623254060745e-05, 5.4039061069488525e-05, 5.70518895983696e-05, 6.006471812725067e-05, 6.307754665613174e-05, 6.609037518501282e-05, 6.910320371389389e-05, 7.211603224277496e-05, 7.512886077165604e-05, 7.814168930053711e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 13.0, 14.0, 22.0, 21.0, 39.0, 54.0, 106.0, 161.0, 257.0, 494.0, 863.0, 1745.0, 3976.0, 11245.0, 40451.0, 199522.0, 534420.0, 196391.0, 39873.0, 11122.0, 3972.0, 1815.0, 844.0, 453.0, 227.0, 130.0, 107.0, 57.0, 41.0, 36.0, 14.0, 21.0, 11.0, 14.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1483154296875, -0.14360618591308594, -0.13889694213867188, -0.1341876983642578, -0.12947845458984375, -0.12476921081542969, -0.12005996704101562, -0.11535072326660156, -0.1106414794921875, -0.10593223571777344, -0.10122299194335938, -0.09651374816894531, -0.09180450439453125, -0.08709526062011719, -0.08238601684570312, -0.07767677307128906, -0.072967529296875, -0.06825828552246094, -0.06354904174804688, -0.05883979797363281, -0.05413055419921875, -0.04942131042480469, -0.044712066650390625, -0.04000282287597656, -0.0352935791015625, -0.030584335327148438, -0.025875091552734375, -0.021165847778320312, -0.01645660400390625, -0.011747360229492188, -0.007038116455078125, -0.0023288726806640625, 0.00238037109375, 0.0070896148681640625, 0.011798858642578125, 0.016508102416992188, 0.02121734619140625, 0.025926589965820312, 0.030635833740234375, 0.03534507751464844, 0.0400543212890625, 0.04476356506347656, 0.049472808837890625, 0.05418205261230469, 0.05889129638671875, 0.06360054016113281, 0.06830978393554688, 0.07301902770996094, 0.077728271484375, 0.08243751525878906, 0.08714675903320312, 0.09185600280761719, 0.09656524658203125, 0.10127449035644531, 0.10598373413085938, 0.11069297790527344, 0.1154022216796875, 0.12011146545410156, 0.12482070922851562, 0.1295299530029297, 0.13423919677734375, 0.1389484405517578, 0.14365768432617188, 0.14836692810058594, 0.153076171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 9.0, 5.0, 5.0, 4.0, 7.0, 4.0, 9.0, 18.0, 8.0, 9.0, 22.0, 33.0, 54.0, 46.0, 53.0, 52.0, 82.0, 64.0, 63.0, 67.0, 63.0, 61.0, 49.0, 37.0, 29.0, 27.0, 17.0, 19.0, 14.0, 9.0, 14.0, 8.0, 7.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.034637451171875, -0.033522605895996094, -0.03240776062011719, -0.03129291534423828, -0.030178070068359375, -0.02906322479248047, -0.027948379516601562, -0.026833534240722656, -0.02571868896484375, -0.024603843688964844, -0.023488998413085938, -0.02237415313720703, -0.021259307861328125, -0.02014446258544922, -0.019029617309570312, -0.017914772033691406, -0.0167999267578125, -0.015685081481933594, -0.014570236206054688, -0.013455390930175781, -0.012340545654296875, -0.011225700378417969, -0.010110855102539062, -0.008996009826660156, -0.00788116455078125, -0.006766319274902344, -0.0056514739990234375, -0.004536628723144531, -0.003421783447265625, -0.0023069381713867188, -0.0011920928955078125, -7.724761962890625e-05, 0.00103759765625, 0.0021524429321289062, 0.0032672882080078125, 0.004382133483886719, 0.005496978759765625, 0.006611824035644531, 0.0077266693115234375, 0.008841514587402344, 0.00995635986328125, 0.011071205139160156, 0.012186050415039062, 0.013300895690917969, 0.014415740966796875, 0.015530586242675781, 0.016645431518554688, 0.017760276794433594, 0.0188751220703125, 0.019989967346191406, 0.021104812622070312, 0.02221965789794922, 0.023334503173828125, 0.02444934844970703, 0.025564193725585938, 0.026679039001464844, 0.02779388427734375, 0.028908729553222656, 0.030023574829101562, 0.03113842010498047, 0.032253265380859375, 0.03336811065673828, 0.03448295593261719, 0.035597801208496094, 0.036712646484375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 11.0, 13.0, 27.0, 42.0, 57.0, 79.0, 126.0, 115.0, 120.0, 105.0, 98.0, 64.0, 50.0, 40.0, 23.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9416314959526062, -0.901360273361206, -0.8610890507698059, -0.8208178281784058, -0.7805466055870056, -0.7402753829956055, -0.7000041007995605, -0.6597329378128052, -0.6194616556167603, -0.5791904330253601, -0.53891921043396, -0.4986479878425598, -0.45837676525115967, -0.4181055426597595, -0.377834290266037, -0.33756306767463684, -0.2972918748855591, -0.25702065229415894, -0.2167494297027588, -0.17647819221019745, -0.1362069696187973, -0.09593574702739716, -0.055664509534835815, -0.015393286943435669, 0.024877935647964478, 0.06514915823936462, 0.10542038828134537, 0.1456916183233261, 0.18596284091472626, 0.2262340635061264, 0.26650530099868774, 0.3067765235900879, 0.3470478057861328, 0.38731902837753296, 0.4275902509689331, 0.46786147356033325, 0.5081326961517334, 0.5484039187431335, 0.5886751413345337, 0.6289464235305786, 0.669217586517334, 0.7094888091087341, 0.7497600317001343, 0.7900312542915344, 0.8303024768829346, 0.8705736994743347, 0.9108449220657349, 0.9511162042617798, 0.9913874268531799, 1.03165864944458, 1.071929931640625, 1.1122010946273804, 1.1524723768234253, 1.1927435398101807, 1.2330148220062256, 1.273285984992981, 1.3135572671890259, 1.3538285493850708, 1.3940997123718262, 1.434370994567871, 1.4746421575546265, 1.5149134397506714, 1.5551846027374268, 1.5954558849334717, 1.635727047920227]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 12.0, 10.0, 23.0, 21.0, 24.0, 16.0, 30.0, 43.0, 33.0, 40.0, 36.0, 50.0, 51.0, 54.0, 53.0, 64.0, 46.0, 62.0, 30.0, 34.0, 33.0, 25.0, 24.0, 27.0, 24.0, 24.0, 15.0, 14.0, 13.0, 7.0, 4.0, 7.0, 6.0, 6.0, 5.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6570508480072021, -0.6378562450408936, -0.618661642074585, -0.5994670391082764, -0.5802724957466125, -0.561077892780304, -0.5418832898139954, -0.5226886868476868, -0.5034940838813782, -0.4842994809150696, -0.4651049077510834, -0.4459103047847748, -0.4267157018184662, -0.40752112865448, -0.3883265256881714, -0.3691319227218628, -0.3499373495578766, -0.330742746591568, -0.3115481734275818, -0.2923535704612732, -0.2731589674949646, -0.253964364528656, -0.2347697913646698, -0.2155751883983612, -0.1963806003332138, -0.1771860122680664, -0.1579914093017578, -0.1387968212366104, -0.11960222572088242, -0.10040763020515442, -0.08121304214000702, -0.062018439173698425, -0.042823851108551025, -0.023629257455468178, -0.00443466380238533, 0.014759927988052368, 0.033954523503780365, 0.05314911901950836, 0.07234370708465576, 0.09153831005096436, 0.11073289811611176, 0.12992748618125916, 0.14912208914756775, 0.16831667721271515, 0.18751126527786255, 0.20670586824417114, 0.22590045630931854, 0.24509505927562714, 0.26428964734077454, 0.28348425030708313, 0.30267882347106934, 0.32187342643737793, 0.3410680294036865, 0.3602626323699951, 0.3794572055339813, 0.3986518085002899, 0.4178463816642761, 0.4370409846305847, 0.4562355577945709, 0.4754301607608795, 0.4946247637271881, 0.5138193368911743, 0.5330139398574829, 0.5522085428237915, 0.5714031457901001]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 13.0, 16.0, 13.0, 34.0, 61.0, 70.0, 153.0, 279.0, 451.0, 909.0, 2082.0, 4828.0, 12821.0, 43178.0, 235999.0, 622344.0, 89354.0, 22377.0, 7736.0, 2992.0, 1346.0, 643.0, 329.0, 192.0, 119.0, 72.0, 39.0, 23.0, 28.0, 12.0, 13.0, 11.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.96875, -0.940460205078125, -0.91217041015625, -0.883880615234375, -0.8555908203125, -0.827301025390625, -0.79901123046875, -0.770721435546875, -0.742431640625, -0.714141845703125, -0.68585205078125, -0.657562255859375, -0.6292724609375, -0.600982666015625, -0.57269287109375, -0.544403076171875, -0.51611328125, -0.487823486328125, -0.45953369140625, -0.431243896484375, -0.4029541015625, -0.374664306640625, -0.34637451171875, -0.318084716796875, -0.289794921875, -0.261505126953125, -0.23321533203125, -0.204925537109375, -0.1766357421875, -0.148345947265625, -0.12005615234375, -0.091766357421875, -0.0634765625, -0.035186767578125, -0.00689697265625, 0.021392822265625, 0.0496826171875, 0.077972412109375, 0.10626220703125, 0.134552001953125, 0.162841796875, 0.191131591796875, 0.21942138671875, 0.247711181640625, 0.2760009765625, 0.304290771484375, 0.33258056640625, 0.360870361328125, 0.38916015625, 0.417449951171875, 0.44573974609375, 0.474029541015625, 0.5023193359375, 0.530609130859375, 0.55889892578125, 0.587188720703125, 0.615478515625, 0.643768310546875, 0.67205810546875, 0.700347900390625, 0.7286376953125, 0.756927490234375, 0.78521728515625, 0.813507080078125, 0.841796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 16.0, 11.0, 26.0, 32.0, 45.0, 61.0, 65.0, 66.0, 101.0, 106.0, 94.0, 86.0, 61.0, 52.0, 43.0, 38.0, 23.0, 23.0, 11.0, 11.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.2872467041015625, -2.224884033203125, -2.1625213623046875, -2.10015869140625, -2.0377960205078125, -1.975433349609375, -1.9130706787109375, -1.8507080078125, -1.7883453369140625, -1.725982666015625, -1.6636199951171875, -1.60125732421875, -1.5388946533203125, -1.476531982421875, -1.4141693115234375, -1.351806640625, -1.2894439697265625, -1.227081298828125, -1.1647186279296875, -1.10235595703125, -1.0399932861328125, -0.977630615234375, -0.9152679443359375, -0.8529052734375, -0.7905426025390625, -0.728179931640625, -0.6658172607421875, -0.60345458984375, -0.5410919189453125, -0.478729248046875, -0.4163665771484375, -0.35400390625, -0.2916412353515625, -0.229278564453125, -0.1669158935546875, -0.10455322265625, -0.0421905517578125, 0.020172119140625, 0.0825347900390625, 0.1448974609375, 0.2072601318359375, 0.269622802734375, 0.3319854736328125, 0.39434814453125, 0.4567108154296875, 0.519073486328125, 0.5814361572265625, 0.643798828125, 0.7061614990234375, 0.768524169921875, 0.8308868408203125, 0.89324951171875, 0.9556121826171875, 1.017974853515625, 1.0803375244140625, 1.1427001953125, 1.2050628662109375, 1.267425537109375, 1.3297882080078125, 1.39215087890625, 1.4545135498046875, 1.516876220703125, 1.5792388916015625, 1.6416015625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 5.0, 6.0, 1.0, 8.0, 9.0, 15.0, 21.0, 22.0, 20.0, 37.0, 59.0, 65.0, 97.0, 211.0, 386.0, 1419.0, 15401.0, 917149.0, 108492.0, 3712.0, 682.0, 260.0, 150.0, 84.0, 53.0, 44.0, 35.0, 28.0, 19.0, 12.0, 12.0, 7.0, 6.0, 5.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.849700927734375, -2.75994873046875, -2.670196533203125, -2.5804443359375, -2.490692138671875, -2.40093994140625, -2.311187744140625, -2.221435546875, -2.131683349609375, -2.04193115234375, -1.952178955078125, -1.8624267578125, -1.772674560546875, -1.68292236328125, -1.593170166015625, -1.50341796875, -1.413665771484375, -1.32391357421875, -1.234161376953125, -1.1444091796875, -1.054656982421875, -0.96490478515625, -0.875152587890625, -0.785400390625, -0.695648193359375, -0.60589599609375, -0.516143798828125, -0.4263916015625, -0.336639404296875, -0.24688720703125, -0.157135009765625, -0.0673828125, 0.022369384765625, 0.11212158203125, 0.201873779296875, 0.2916259765625, 0.381378173828125, 0.47113037109375, 0.560882568359375, 0.650634765625, 0.740386962890625, 0.83013916015625, 0.919891357421875, 1.0096435546875, 1.099395751953125, 1.18914794921875, 1.278900146484375, 1.36865234375, 1.458404541015625, 1.54815673828125, 1.637908935546875, 1.7276611328125, 1.817413330078125, 1.90716552734375, 1.996917724609375, 2.086669921875, 2.176422119140625, 2.26617431640625, 2.355926513671875, 2.4456787109375, 2.535430908203125, 2.62518310546875, 2.714935302734375, 2.8046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 2.0, 9.0, 4.0, 10.0, 6.0, 8.0, 14.0, 12.0, 18.0, 22.0, 28.0, 33.0, 43.0, 46.0, 36.0, 47.0, 52.0, 43.0, 48.0, 58.0, 45.0, 54.0, 45.0, 50.0, 50.0, 29.0, 28.0, 36.0, 20.0, 24.0, 13.0, 12.0, 10.0, 7.0, 5.0, 6.0, 7.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.53515625, -1.4888763427734375, -1.442596435546875, -1.3963165283203125, -1.35003662109375, -1.3037567138671875, -1.257476806640625, -1.2111968994140625, -1.1649169921875, -1.1186370849609375, -1.072357177734375, -1.0260772705078125, -0.97979736328125, -0.9335174560546875, -0.887237548828125, -0.8409576416015625, -0.794677734375, -0.7483978271484375, -0.702117919921875, -0.6558380126953125, -0.60955810546875, -0.5632781982421875, -0.516998291015625, -0.4707183837890625, -0.4244384765625, -0.3781585693359375, -0.331878662109375, -0.2855987548828125, -0.23931884765625, -0.1930389404296875, -0.146759033203125, -0.1004791259765625, -0.05419921875, -0.0079193115234375, 0.038360595703125, 0.0846405029296875, 0.13092041015625, 0.1772003173828125, 0.223480224609375, 0.2697601318359375, 0.3160400390625, 0.3623199462890625, 0.408599853515625, 0.4548797607421875, 0.50115966796875, 0.5474395751953125, 0.593719482421875, 0.6399993896484375, 0.686279296875, 0.7325592041015625, 0.778839111328125, 0.8251190185546875, 0.87139892578125, 0.9176788330078125, 0.963958740234375, 1.0102386474609375, 1.0565185546875, 1.1027984619140625, 1.149078369140625, 1.1953582763671875, 1.24163818359375, 1.2879180908203125, 1.334197998046875, 1.3804779052734375, 1.4267578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 6.0, 7.0, 11.0, 14.0, 13.0, 28.0, 37.0, 53.0, 109.0, 164.0, 324.0, 766.0, 1936.0, 6257.0, 27579.0, 262015.0, 684345.0, 50300.0, 9745.0, 2821.0, 1017.0, 434.0, 203.0, 123.0, 58.0, 42.0, 36.0, 27.0, 24.0, 12.0, 9.0, 5.0, 2.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.36376953125, -0.3531227111816406, -0.34247589111328125, -0.3318290710449219, -0.3211822509765625, -0.3105354309082031, -0.29988861083984375, -0.2892417907714844, -0.278594970703125, -0.2679481506347656, -0.25730133056640625, -0.24665451049804688, -0.2360076904296875, -0.22536087036132812, -0.21471405029296875, -0.20406723022460938, -0.19342041015625, -0.18277359008789062, -0.17212677001953125, -0.16147994995117188, -0.1508331298828125, -0.14018630981445312, -0.12953948974609375, -0.11889266967773438, -0.108245849609375, -0.09759902954101562, -0.08695220947265625, -0.07630538940429688, -0.0656585693359375, -0.055011749267578125, -0.04436492919921875, -0.033718109130859375, -0.0230712890625, -0.012424468994140625, -0.00177764892578125, 0.008869171142578125, 0.0195159912109375, 0.030162811279296875, 0.04080963134765625, 0.051456451416015625, 0.062103271484375, 0.07275009155273438, 0.08339691162109375, 0.09404373168945312, 0.1046905517578125, 0.11533737182617188, 0.12598419189453125, 0.13663101196289062, 0.14727783203125, 0.15792465209960938, 0.16857147216796875, 0.17921829223632812, 0.1898651123046875, 0.20051193237304688, 0.21115875244140625, 0.22180557250976562, 0.232452392578125, 0.24309921264648438, 0.25374603271484375, 0.2643928527832031, 0.2750396728515625, 0.2856864929199219, 0.29633331298828125, 0.3069801330566406, 0.317626953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 16.0, 17.0, 30.0, 32.0, 69.0, 116.0, 177.0, 193.0, 107.0, 65.0, 48.0, 31.0, 15.0, 8.0, 13.0, 4.0, 8.0, 4.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.060434341430664e-05, -4.885625094175339e-05, -4.7108158469200134e-05, -4.536006599664688e-05, -4.361197352409363e-05, -4.1863881051540375e-05, -4.011578857898712e-05, -3.836769610643387e-05, -3.6619603633880615e-05, -3.487151116132736e-05, -3.312341868877411e-05, -3.1375326216220856e-05, -2.9627233743667603e-05, -2.787914127111435e-05, -2.6131048798561096e-05, -2.4382956326007843e-05, -2.263486385345459e-05, -2.0886771380901337e-05, -1.9138678908348083e-05, -1.739058643579483e-05, -1.5642493963241577e-05, -1.3894401490688324e-05, -1.214630901813507e-05, -1.0398216545581818e-05, -8.650124073028564e-06, -6.902031600475311e-06, -5.153939127922058e-06, -3.405846655368805e-06, -1.6577541828155518e-06, 9.033828973770142e-08, 1.8384307622909546e-06, 3.5865232348442078e-06, 5.334615707397461e-06, 7.082708179950714e-06, 8.830800652503967e-06, 1.057889312505722e-05, 1.2326985597610474e-05, 1.4075078070163727e-05, 1.582317054271698e-05, 1.7571263015270233e-05, 1.9319355487823486e-05, 2.106744796037674e-05, 2.2815540432929993e-05, 2.4563632905483246e-05, 2.63117253780365e-05, 2.8059817850589752e-05, 2.9807910323143005e-05, 3.155600279569626e-05, 3.330409526824951e-05, 3.5052187740802765e-05, 3.680028021335602e-05, 3.854837268590927e-05, 4.0296465158462524e-05, 4.204455763101578e-05, 4.379265010356903e-05, 4.5540742576122284e-05, 4.728883504867554e-05, 4.903692752122879e-05, 5.0785019993782043e-05, 5.25331124663353e-05, 5.428120493888855e-05, 5.60292974114418e-05, 5.7777389883995056e-05, 5.952548235654831e-05, 6.127357482910156e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 14.0, 17.0, 26.0, 62.0, 101.0, 229.0, 485.0, 1286.0, 5366.0, 51907.0, 908130.0, 72062.0, 6295.0, 1513.0, 497.0, 245.0, 129.0, 59.0, 36.0, 36.0, 18.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6748046875, -0.654693603515625, -0.63458251953125, -0.614471435546875, -0.5943603515625, -0.574249267578125, -0.55413818359375, -0.534027099609375, -0.513916015625, -0.493804931640625, -0.47369384765625, -0.453582763671875, -0.4334716796875, -0.413360595703125, -0.39324951171875, -0.373138427734375, -0.35302734375, -0.332916259765625, -0.31280517578125, -0.292694091796875, -0.2725830078125, -0.252471923828125, -0.23236083984375, -0.212249755859375, -0.192138671875, -0.172027587890625, -0.15191650390625, -0.131805419921875, -0.1116943359375, -0.091583251953125, -0.07147216796875, -0.051361083984375, -0.03125, -0.011138916015625, 0.00897216796875, 0.029083251953125, 0.0491943359375, 0.069305419921875, 0.08941650390625, 0.109527587890625, 0.129638671875, 0.149749755859375, 0.16986083984375, 0.189971923828125, 0.2100830078125, 0.230194091796875, 0.25030517578125, 0.270416259765625, 0.29052734375, 0.310638427734375, 0.33074951171875, 0.350860595703125, 0.3709716796875, 0.391082763671875, 0.41119384765625, 0.431304931640625, 0.451416015625, 0.471527099609375, 0.49163818359375, 0.511749267578125, 0.5318603515625, 0.551971435546875, 0.57208251953125, 0.592193603515625, 0.6123046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 2.0, 3.0, 9.0, 10.0, 16.0, 16.0, 32.0, 41.0, 75.0, 98.0, 208.0, 219.0, 109.0, 65.0, 34.0, 28.0, 16.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.204833984375, -0.19843101501464844, -0.19202804565429688, -0.1856250762939453, -0.17922210693359375, -0.1728191375732422, -0.16641616821289062, -0.16001319885253906, -0.1536102294921875, -0.14720726013183594, -0.14080429077148438, -0.1344013214111328, -0.12799835205078125, -0.12159538269042969, -0.11519241333007812, -0.10878944396972656, -0.102386474609375, -0.09598350524902344, -0.08958053588867188, -0.08317756652832031, -0.07677459716796875, -0.07037162780761719, -0.06396865844726562, -0.05756568908691406, -0.0511627197265625, -0.04475975036621094, -0.038356781005859375, -0.03195381164550781, -0.02555084228515625, -0.019147872924804688, -0.012744903564453125, -0.0063419342041015625, 6.103515625e-05, 0.0064640045166015625, 0.012866973876953125, 0.019269943237304688, 0.02567291259765625, 0.03207588195800781, 0.038478851318359375, 0.04488182067871094, 0.0512847900390625, 0.05768775939941406, 0.06409072875976562, 0.07049369812011719, 0.07689666748046875, 0.08329963684082031, 0.08970260620117188, 0.09610557556152344, 0.102508544921875, 0.10891151428222656, 0.11531448364257812, 0.12171745300292969, 0.12812042236328125, 0.1345233917236328, 0.14092636108398438, 0.14732933044433594, 0.1537322998046875, 0.16013526916503906, 0.16653823852539062, 0.1729412078857422, 0.17934417724609375, 0.1857471466064453, 0.19215011596679688, 0.19855308532714844, 0.2049560546875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 6.0, 14.0, 11.0, 28.0, 34.0, 48.0, 62.0, 66.0, 83.0, 111.0, 96.0, 96.0, 92.0, 61.0, 58.0, 38.0, 25.0, 26.0, 12.0, 10.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6523833274841309, -1.5897029638290405, -1.5270226001739502, -1.4643423557281494, -1.401661992073059, -1.3389816284179688, -1.276301383972168, -1.2136210203170776, -1.1509406566619873, -1.088260293006897, -1.0255799293518066, -0.9628996849060059, -0.9002193212509155, -0.8375389575958252, -0.7748586535453796, -0.7121783494949341, -0.6494979858398438, -0.5868176221847534, -0.5241373181343079, -0.4614569842815399, -0.398776650428772, -0.33609631657600403, -0.2734159827232361, -0.21073564887046814, -0.1480553150177002, -0.08537498116493225, -0.022694647312164307, 0.03998568654060364, 0.10266602039337158, 0.16534635424613953, 0.22802668809890747, 0.2907070219516754, 0.35338711738586426, 0.4160674512386322, 0.47874778509140015, 0.5414280891418457, 0.604108452796936, 0.6667888164520264, 0.7294691205024719, 0.7921494245529175, 0.8548297882080078, 0.9175101518630981, 0.9801904559135437, 1.0428707599639893, 1.1055511236190796, 1.16823148727417, 1.2309117317199707, 1.293592095375061, 1.3562724590301514, 1.4189528226852417, 1.481633186340332, 1.5443134307861328, 1.6069937944412231, 1.6696741580963135, 1.7323544025421143, 1.7950347661972046, 1.857715129852295, 1.9203954935073853, 1.9830758571624756, 2.0457561016082764, 2.1084365844726562, 2.171116828918457, 2.233797073364258, 2.2964775562286377, 2.3591578006744385]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 7.0, 5.0, 9.0, 13.0, 12.0, 19.0, 16.0, 26.0, 30.0, 26.0, 30.0, 29.0, 36.0, 41.0, 42.0, 52.0, 42.0, 57.0, 41.0, 47.0, 40.0, 34.0, 26.0, 38.0, 29.0, 42.0, 38.0, 27.0, 26.0, 16.0, 21.0, 18.0, 8.0, 10.0, 11.0, 6.0, 4.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1389782428741455, -2.0687272548675537, -1.9984760284423828, -1.928225040435791, -1.8579739332199097, -1.7877228260040283, -1.7174718379974365, -1.6472207307815552, -1.5769696235656738, -1.5067185163497925, -1.4364674091339111, -1.3662164211273193, -1.295965313911438, -1.2257142066955566, -1.1554632186889648, -1.0852121114730835, -1.0149610042572021, -0.9447098970413208, -0.8744588494300842, -0.8042078018188477, -0.7339566946029663, -0.663705587387085, -0.5934545397758484, -0.5232034921646118, -0.45295238494873047, -0.3827013075351715, -0.31245023012161255, -0.2421991527080536, -0.17194807529449463, -0.10169699788093567, -0.03144592046737671, 0.03880515694618225, 0.10905599594116211, 0.17930707335472107, 0.24955815076828003, 0.319809228181839, 0.39006030559539795, 0.4603113830089569, 0.5305624604225159, 0.6008135080337524, 0.6710646152496338, 0.7413157224655151, 0.8115667700767517, 0.8818178176879883, 0.9520689249038696, 1.022320032119751, 1.0925710201263428, 1.1628221273422241, 1.2330732345581055, 1.3033243417739868, 1.3735754489898682, 1.44382643699646, 1.5140775442123413, 1.5843286514282227, 1.6545796394348145, 1.7248307466506958, 1.7950818538665771, 1.8653329610824585, 1.9355840682983398, 2.0058350563049316, 2.0760860443115234, 2.1463372707366943, 2.216588258743286, 2.286839485168457, 2.357090473175049]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 7.0, 14.0, 19.0, 17.0, 27.0, 31.0, 50.0, 74.0, 80.0, 106.0, 156.0, 247.0, 307.0, 536.0, 861.0, 1361.0, 2311.0, 4270.0, 8581.0, 19483.0, 55081.0, 222012.0, 1209585.0, 2018735.0, 497408.0, 96725.0, 29589.0, 12261.0, 6024.0, 3176.0, 1886.0, 1050.0, 705.0, 414.0, 301.0, 190.0, 159.0, 108.0, 79.0, 51.0, 42.0, 28.0, 28.0, 25.0, 13.0, 10.0, 8.0, 7.0, 10.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.7841796875, -0.7582473754882812, -0.7323150634765625, -0.7063827514648438, -0.680450439453125, -0.6545181274414062, -0.6285858154296875, -0.6026535034179688, -0.57672119140625, -0.5507888793945312, -0.5248565673828125, -0.49892425537109375, -0.472991943359375, -0.44705963134765625, -0.4211273193359375, -0.39519500732421875, -0.3692626953125, -0.34333038330078125, -0.3173980712890625, -0.29146575927734375, -0.265533447265625, -0.23960113525390625, -0.2136688232421875, -0.18773651123046875, -0.16180419921875, -0.13587188720703125, -0.1099395751953125, -0.08400726318359375, -0.058074951171875, -0.03214263916015625, -0.0062103271484375, 0.01972198486328125, 0.045654296875, 0.07158660888671875, 0.0975189208984375, 0.12345123291015625, 0.149383544921875, 0.17531585693359375, 0.2012481689453125, 0.22718048095703125, 0.25311279296875, 0.27904510498046875, 0.3049774169921875, 0.33090972900390625, 0.356842041015625, 0.38277435302734375, 0.4087066650390625, 0.43463897705078125, 0.4605712890625, 0.48650360107421875, 0.5124359130859375, 0.5383682250976562, 0.564300537109375, 0.5902328491210938, 0.6161651611328125, 0.6420974731445312, 0.66802978515625, 0.6939620971679688, 0.7198944091796875, 0.7458267211914062, 0.771759033203125, 0.7976913452148438, 0.8236236572265625, 0.8495559692382812, 0.87548828125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 7.0, 9.0, 17.0, 18.0, 19.0, 23.0, 22.0, 20.0, 36.0, 46.0, 51.0, 52.0, 45.0, 56.0, 38.0, 50.0, 58.0, 52.0, 40.0, 44.0, 46.0, 35.0, 35.0, 32.0, 18.0, 19.0, 16.0, 15.0, 14.0, 14.0, 7.0, 4.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.66259765625, -0.6413192749023438, -0.6200408935546875, -0.5987625122070312, -0.577484130859375, -0.5562057495117188, -0.5349273681640625, -0.5136489868164062, -0.49237060546875, -0.47109222412109375, -0.4498138427734375, -0.42853546142578125, -0.407257080078125, -0.38597869873046875, -0.3647003173828125, -0.34342193603515625, -0.3221435546875, -0.30086517333984375, -0.2795867919921875, -0.25830841064453125, -0.237030029296875, -0.21575164794921875, -0.1944732666015625, -0.17319488525390625, -0.15191650390625, -0.13063812255859375, -0.1093597412109375, -0.08808135986328125, -0.066802978515625, -0.04552459716796875, -0.0242462158203125, -0.00296783447265625, 0.018310546875, 0.03958892822265625, 0.0608673095703125, 0.08214569091796875, 0.103424072265625, 0.12470245361328125, 0.1459808349609375, 0.16725921630859375, 0.18853759765625, 0.20981597900390625, 0.2310943603515625, 0.25237274169921875, 0.273651123046875, 0.29492950439453125, 0.3162078857421875, 0.33748626708984375, 0.3587646484375, 0.38004302978515625, 0.4013214111328125, 0.42259979248046875, 0.443878173828125, 0.46515655517578125, 0.4864349365234375, 0.5077133178710938, 0.52899169921875, 0.5502700805664062, 0.5715484619140625, 0.5928268432617188, 0.614105224609375, 0.6353836059570312, 0.6566619873046875, 0.6779403686523438, 0.69921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 15.0, 19.0, 39.0, 82.0, 142.0, 306.0, 1112.0, 7759.0, 323155.0, 3827508.0, 30708.0, 2467.0, 536.0, 199.0, 81.0, 47.0, 35.0, 20.0, 10.0, 10.0, 9.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.4073486328125, -2.299072265625, -2.1907958984375, -2.08251953125, -1.9742431640625, -1.865966796875, -1.7576904296875, -1.6494140625, -1.5411376953125, -1.432861328125, -1.3245849609375, -1.21630859375, -1.1080322265625, -0.999755859375, -0.8914794921875, -0.783203125, -0.6749267578125, -0.566650390625, -0.4583740234375, -0.35009765625, -0.2418212890625, -0.133544921875, -0.0252685546875, 0.0830078125, 0.1912841796875, 0.299560546875, 0.4078369140625, 0.51611328125, 0.6243896484375, 0.732666015625, 0.8409423828125, 0.94921875, 1.0574951171875, 1.165771484375, 1.2740478515625, 1.38232421875, 1.4906005859375, 1.598876953125, 1.7071533203125, 1.8154296875, 1.9237060546875, 2.031982421875, 2.1402587890625, 2.24853515625, 2.3568115234375, 2.465087890625, 2.5733642578125, 2.681640625, 2.7899169921875, 2.898193359375, 3.0064697265625, 3.11474609375, 3.2230224609375, 3.331298828125, 3.4395751953125, 3.5478515625, 3.6561279296875, 3.764404296875, 3.8726806640625, 3.98095703125, 4.0892333984375, 4.197509765625, 4.3057861328125, 4.4140625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 14.0, 18.0, 26.0, 34.0, 51.0, 78.0, 100.0, 198.0, 304.0, 547.0, 670.0, 687.0, 484.0, 323.0, 183.0, 114.0, 66.0, 53.0, 30.0, 28.0, 9.0, 10.0, 12.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4876251220703125, -0.472808837890625, -0.4579925537109375, -0.44317626953125, -0.4283599853515625, -0.413543701171875, -0.3987274169921875, -0.3839111328125, -0.3690948486328125, -0.354278564453125, -0.3394622802734375, -0.32464599609375, -0.3098297119140625, -0.295013427734375, -0.2801971435546875, -0.265380859375, -0.2505645751953125, -0.235748291015625, -0.2209320068359375, -0.20611572265625, -0.1912994384765625, -0.176483154296875, -0.1616668701171875, -0.1468505859375, -0.1320343017578125, -0.117218017578125, -0.1024017333984375, -0.08758544921875, -0.0727691650390625, -0.057952880859375, -0.0431365966796875, -0.0283203125, -0.0135040283203125, 0.001312255859375, 0.0161285400390625, 0.03094482421875, 0.0457611083984375, 0.060577392578125, 0.0753936767578125, 0.0902099609375, 0.1050262451171875, 0.119842529296875, 0.1346588134765625, 0.14947509765625, 0.1642913818359375, 0.179107666015625, 0.1939239501953125, 0.208740234375, 0.2235565185546875, 0.238372802734375, 0.2531890869140625, 0.26800537109375, 0.2828216552734375, 0.297637939453125, 0.3124542236328125, 0.3272705078125, 0.3420867919921875, 0.356903076171875, 0.3717193603515625, 0.38653564453125, 0.4013519287109375, 0.416168212890625, 0.4309844970703125, 0.44580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 7.0, 8.0, 10.0, 17.0, 29.0, 46.0, 52.0, 59.0, 63.0, 76.0, 85.0, 80.0, 84.0, 74.0, 64.0, 51.0, 50.0, 42.0, 29.0, 15.0, 21.0, 15.0, 8.0, 8.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.216651439666748, -1.1758785247802734, -1.1351054906845093, -1.0943324565887451, -1.0535595417022705, -1.012786626815796, -0.9720135927200317, -0.9312406182289124, -0.890467643737793, -0.8496946692466736, -0.8089216947555542, -0.7681487202644348, -0.7273757457733154, -0.686602771282196, -0.6458297967910767, -0.6050568222999573, -0.5642838478088379, -0.5235108733177185, -0.4827378988265991, -0.44196492433547974, -0.40119194984436035, -0.36041897535324097, -0.3196460008621216, -0.2788730263710022, -0.2381000518798828, -0.19732707738876343, -0.15655410289764404, -0.11578112840652466, -0.07500815391540527, -0.03423517942428589, 0.006537795066833496, 0.04731076955795288, 0.08808362483978271, 0.1288565993309021, 0.16962957382202148, 0.21040254831314087, 0.25117552280426025, 0.29194849729537964, 0.332721471786499, 0.3734944462776184, 0.4142674207687378, 0.4550403952598572, 0.49581336975097656, 0.536586344242096, 0.5773593187332153, 0.6181322932243347, 0.6589052677154541, 0.6996782422065735, 0.7404512166976929, 0.7812241911888123, 0.8219971656799316, 0.862770140171051, 0.9035431146621704, 0.9443160891532898, 0.9850890636444092, 1.0258619785308838, 1.066635012626648, 1.107408046722412, 1.1481809616088867, 1.1889538764953613, 1.2297269105911255, 1.2704999446868896, 1.3112728595733643, 1.3520457744598389, 1.392818808555603]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 3.0, 12.0, 6.0, 17.0, 16.0, 13.0, 14.0, 15.0, 24.0, 27.0, 30.0, 31.0, 40.0, 32.0, 44.0, 64.0, 33.0, 34.0, 39.0, 38.0, 47.0, 53.0, 45.0, 50.0, 21.0, 39.0, 28.0, 22.0, 25.0, 19.0, 15.0, 17.0, 19.0, 12.0, 14.0, 10.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7895708084106445, -0.7645266652107239, -0.7394824624061584, -0.7144383192062378, -0.6893941164016724, -0.6643499732017517, -0.639305830001831, -0.6142616271972656, -0.5892174243927002, -0.5641732811927795, -0.5391290783882141, -0.5140849351882935, -0.489040732383728, -0.4639965891838074, -0.43895241618156433, -0.4139082431793213, -0.38886409997940063, -0.3638199269771576, -0.33877575397491455, -0.3137316107749939, -0.28868740797042847, -0.2636432647705078, -0.23859909176826477, -0.21355491876602173, -0.1885107457637787, -0.16346657276153564, -0.1384223997592926, -0.11337824165821075, -0.08833406865596771, -0.06328989565372467, -0.03824573755264282, -0.01320156455039978, 0.011842548847198486, 0.03688671812415123, 0.06193088740110397, 0.08697505295276642, 0.11201922595500946, 0.1370633989572525, 0.16210755705833435, 0.1871517300605774, 0.21219590306282043, 0.23724007606506348, 0.2622842490673065, 0.28732842206954956, 0.3123725652694702, 0.33741676807403564, 0.3624609112739563, 0.38750508427619934, 0.4125492572784424, 0.4375934302806854, 0.46263760328292847, 0.4876817464828491, 0.5127259492874146, 0.5377700924873352, 0.5628142356872559, 0.5878584384918213, 0.6129026412963867, 0.6379467844963074, 0.6629909873008728, 0.6880351305007935, 0.7130793333053589, 0.7381234765052795, 0.7631676197052002, 0.7882118225097656, 0.8132559657096863]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 9.0, 9.0, 20.0, 24.0, 44.0, 52.0, 61.0, 106.0, 134.0, 215.0, 322.0, 465.0, 728.0, 1138.0, 1820.0, 2955.0, 5184.0, 9233.0, 17070.0, 34086.0, 75939.0, 180606.0, 310327.0, 222970.0, 96208.0, 42403.0, 20398.0, 10593.0, 6079.0, 3449.0, 2131.0, 1261.0, 833.0, 543.0, 350.0, 230.0, 180.0, 105.0, 78.0, 71.0, 32.0, 32.0, 14.0, 14.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.231201171875, -0.22411727905273438, -0.21703338623046875, -0.20994949340820312, -0.2028656005859375, -0.19578170776367188, -0.18869781494140625, -0.18161392211914062, -0.174530029296875, -0.16744613647460938, -0.16036224365234375, -0.15327835083007812, -0.1461944580078125, -0.13911056518554688, -0.13202667236328125, -0.12494277954101562, -0.11785888671875, -0.11077499389648438, -0.10369110107421875, -0.09660720825195312, -0.0895233154296875, -0.08243942260742188, -0.07535552978515625, -0.06827163696289062, -0.061187744140625, -0.054103851318359375, -0.04701995849609375, -0.039936065673828125, -0.0328521728515625, -0.025768280029296875, -0.01868438720703125, -0.011600494384765625, -0.0045166015625, 0.002567291259765625, 0.00965118408203125, 0.016735076904296875, 0.0238189697265625, 0.030902862548828125, 0.03798675537109375, 0.045070648193359375, 0.052154541015625, 0.059238433837890625, 0.06632232666015625, 0.07340621948242188, 0.0804901123046875, 0.08757400512695312, 0.09465789794921875, 0.10174179077148438, 0.10882568359375, 0.11590957641601562, 0.12299346923828125, 0.13007736206054688, 0.1371612548828125, 0.14424514770507812, 0.15132904052734375, 0.15841293334960938, 0.165496826171875, 0.17258071899414062, 0.17966461181640625, 0.18674850463867188, 0.1938323974609375, 0.20091629028320312, 0.20800018310546875, 0.21508407592773438, 0.22216796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 5.0, 10.0, 6.0, 15.0, 11.0, 9.0, 22.0, 19.0, 31.0, 26.0, 31.0, 34.0, 34.0, 51.0, 37.0, 47.0, 47.0, 44.0, 34.0, 54.0, 58.0, 49.0, 39.0, 35.0, 32.0, 35.0, 36.0, 18.0, 17.0, 29.0, 14.0, 12.0, 7.0, 8.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.5205078125, -0.5052566528320312, -0.4900054931640625, -0.47475433349609375, -0.459503173828125, -0.44425201416015625, -0.4290008544921875, -0.41374969482421875, -0.39849853515625, -0.38324737548828125, -0.3679962158203125, -0.35274505615234375, -0.337493896484375, -0.32224273681640625, -0.3069915771484375, -0.29174041748046875, -0.2764892578125, -0.26123809814453125, -0.2459869384765625, -0.23073577880859375, -0.215484619140625, -0.20023345947265625, -0.1849822998046875, -0.16973114013671875, -0.15447998046875, -0.13922882080078125, -0.1239776611328125, -0.10872650146484375, -0.093475341796875, -0.07822418212890625, -0.0629730224609375, -0.04772186279296875, -0.032470703125, -0.01721954345703125, -0.0019683837890625, 0.01328277587890625, 0.028533935546875, 0.04378509521484375, 0.0590362548828125, 0.07428741455078125, 0.08953857421875, 0.10478973388671875, 0.1200408935546875, 0.13529205322265625, 0.150543212890625, 0.16579437255859375, 0.1810455322265625, 0.19629669189453125, 0.2115478515625, 0.22679901123046875, 0.2420501708984375, 0.25730133056640625, 0.272552490234375, 0.28780364990234375, 0.3030548095703125, 0.31830596923828125, 0.33355712890625, 0.34880828857421875, 0.3640594482421875, 0.37931060791015625, 0.394561767578125, 0.40981292724609375, 0.4250640869140625, 0.44031524658203125, 0.45556640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 16.0, 28.0, 28.0, 43.0, 56.0, 73.0, 87.0, 150.0, 235.0, 445.0, 760.0, 1446.0, 2872.0, 6475.0, 14582.0, 37167.0, 101503.0, 271473.0, 351811.0, 161462.0, 57837.0, 22106.0, 9075.0, 4233.0, 2003.0, 1013.0, 560.0, 312.0, 209.0, 116.0, 81.0, 60.0, 55.0, 40.0, 25.0, 17.0, 16.0, 12.0, 7.0, 6.0, 5.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2479248046875, -0.23998451232910156, -0.23204421997070312, -0.2241039276123047, -0.21616363525390625, -0.2082233428955078, -0.20028305053710938, -0.19234275817871094, -0.1844024658203125, -0.17646217346191406, -0.16852188110351562, -0.1605815887451172, -0.15264129638671875, -0.1447010040283203, -0.13676071166992188, -0.12882041931152344, -0.120880126953125, -0.11293983459472656, -0.10499954223632812, -0.09705924987792969, -0.08911895751953125, -0.08117866516113281, -0.07323837280273438, -0.06529808044433594, -0.0573577880859375, -0.04941749572753906, -0.041477203369140625, -0.03353691101074219, -0.02559661865234375, -0.017656326293945312, -0.009716033935546875, -0.0017757415771484375, 0.00616455078125, 0.014104843139648438, 0.022045135498046875, 0.029985427856445312, 0.03792572021484375, 0.04586601257324219, 0.053806304931640625, 0.06174659729003906, 0.0696868896484375, 0.07762718200683594, 0.08556747436523438, 0.09350776672363281, 0.10144805908203125, 0.10938835144042969, 0.11732864379882812, 0.12526893615722656, 0.133209228515625, 0.14114952087402344, 0.14908981323242188, 0.1570301055908203, 0.16497039794921875, 0.1729106903076172, 0.18085098266601562, 0.18879127502441406, 0.1967315673828125, 0.20467185974121094, 0.21261215209960938, 0.2205524444580078, 0.22849273681640625, 0.2364330291748047, 0.24437332153320312, 0.25231361389160156, 0.26025390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 6.0, 5.0, 7.0, 16.0, 13.0, 13.0, 12.0, 10.0, 15.0, 20.0, 26.0, 32.0, 25.0, 39.0, 37.0, 32.0, 38.0, 57.0, 46.0, 54.0, 42.0, 49.0, 43.0, 50.0, 42.0, 46.0, 31.0, 31.0, 24.0, 24.0, 21.0, 20.0, 12.0, 19.0, 11.0, 0.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.11328125, -1.078338623046875, -1.04339599609375, -1.008453369140625, -0.9735107421875, -0.938568115234375, -0.90362548828125, -0.868682861328125, -0.833740234375, -0.798797607421875, -0.76385498046875, -0.728912353515625, -0.6939697265625, -0.659027099609375, -0.62408447265625, -0.589141845703125, -0.55419921875, -0.519256591796875, -0.48431396484375, -0.449371337890625, -0.4144287109375, -0.379486083984375, -0.34454345703125, -0.309600830078125, -0.274658203125, -0.239715576171875, -0.20477294921875, -0.169830322265625, -0.1348876953125, -0.099945068359375, -0.06500244140625, -0.030059814453125, 0.0048828125, 0.039825439453125, 0.07476806640625, 0.109710693359375, 0.1446533203125, 0.179595947265625, 0.21453857421875, 0.249481201171875, 0.284423828125, 0.319366455078125, 0.35430908203125, 0.389251708984375, 0.4241943359375, 0.459136962890625, 0.49407958984375, 0.529022216796875, 0.56396484375, 0.598907470703125, 0.63385009765625, 0.668792724609375, 0.7037353515625, 0.738677978515625, 0.77362060546875, 0.808563232421875, 0.843505859375, 0.878448486328125, 0.91339111328125, 0.948333740234375, 0.9832763671875, 1.018218994140625, 1.05316162109375, 1.088104248046875, 1.123046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 10.0, 13.0, 17.0, 19.0, 29.0, 61.0, 91.0, 132.0, 204.0, 410.0, 715.0, 1580.0, 4377.0, 16202.0, 113568.0, 728328.0, 154352.0, 19693.0, 5091.0, 1822.0, 861.0, 375.0, 201.0, 120.0, 88.0, 62.0, 38.0, 25.0, 14.0, 9.0, 10.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2900390625, -0.2821063995361328, -0.2741737365722656, -0.26624107360839844, -0.25830841064453125, -0.25037574768066406, -0.24244308471679688, -0.2345104217529297, -0.2265777587890625, -0.2186450958251953, -0.21071243286132812, -0.20277976989746094, -0.19484710693359375, -0.18691444396972656, -0.17898178100585938, -0.1710491180419922, -0.163116455078125, -0.1551837921142578, -0.14725112915039062, -0.13931846618652344, -0.13138580322265625, -0.12345314025878906, -0.11552047729492188, -0.10758781433105469, -0.0996551513671875, -0.09172248840332031, -0.08378982543945312, -0.07585716247558594, -0.06792449951171875, -0.05999183654785156, -0.052059173583984375, -0.04412651062011719, -0.03619384765625, -0.028261184692382812, -0.020328521728515625, -0.012395858764648438, -0.00446319580078125, 0.0034694671630859375, 0.011402130126953125, 0.019334793090820312, 0.0272674560546875, 0.03520011901855469, 0.043132781982421875, 0.05106544494628906, 0.05899810791015625, 0.06693077087402344, 0.07486343383789062, 0.08279609680175781, 0.090728759765625, 0.09866142272949219, 0.10659408569335938, 0.11452674865722656, 0.12245941162109375, 0.13039207458496094, 0.13832473754882812, 0.1462574005126953, 0.1541900634765625, 0.1621227264404297, 0.17005538940429688, 0.17798805236816406, 0.18592071533203125, 0.19385337829589844, 0.20178604125976562, 0.2097187042236328, 0.2176513671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 22.0, 18.0, 29.0, 51.0, 89.0, 129.0, 149.0, 132.0, 128.0, 70.0, 61.0, 27.0, 25.0, 17.0, 9.0, 6.0, 3.0, 1.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.611513137817383e-05, -7.33034685254097e-05, -7.049180567264557e-05, -6.768014281988144e-05, -6.486847996711731e-05, -6.205681711435318e-05, -5.924515426158905e-05, -5.643349140882492e-05, -5.362182855606079e-05, -5.081016570329666e-05, -4.799850285053253e-05, -4.51868399977684e-05, -4.237517714500427e-05, -3.956351429224014e-05, -3.675185143947601e-05, -3.3940188586711884e-05, -3.1128525733947754e-05, -2.8316862881183624e-05, -2.5505200028419495e-05, -2.2693537175655365e-05, -1.9881874322891235e-05, -1.7070211470127106e-05, -1.4258548617362976e-05, -1.1446885764598846e-05, -8.635222911834717e-06, -5.823560059070587e-06, -3.0118972063064575e-06, -2.0023435354232788e-07, 2.6114284992218018e-06, 5.423091351985931e-06, 8.234754204750061e-06, 1.104641705751419e-05, 1.385807991027832e-05, 1.666974276304245e-05, 1.948140561580658e-05, 2.229306846857071e-05, 2.510473132133484e-05, 2.791639417409897e-05, 3.07280570268631e-05, 3.353971987962723e-05, 3.635138273239136e-05, 3.916304558515549e-05, 4.197470843791962e-05, 4.4786371290683746e-05, 4.7598034143447876e-05, 5.0409696996212006e-05, 5.3221359848976135e-05, 5.6033022701740265e-05, 5.8844685554504395e-05, 6.165634840726852e-05, 6.446801126003265e-05, 6.727967411279678e-05, 7.009133696556091e-05, 7.290299981832504e-05, 7.571466267108917e-05, 7.85263255238533e-05, 8.133798837661743e-05, 8.414965122938156e-05, 8.696131408214569e-05, 8.977297693490982e-05, 9.258463978767395e-05, 9.539630264043808e-05, 9.820796549320221e-05, 0.00010101962834596634, 0.00010383129119873047]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 16.0, 24.0, 33.0, 76.0, 121.0, 261.0, 558.0, 1451.0, 4904.0, 24670.0, 344086.0, 618959.0, 43227.0, 6750.0, 1964.0, 735.0, 304.0, 136.0, 106.0, 51.0, 19.0, 14.0, 16.0, 17.0, 7.0, 6.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.37744140625, -0.3666954040527344, -0.35594940185546875, -0.3452033996582031, -0.3344573974609375, -0.3237113952636719, -0.31296539306640625, -0.3022193908691406, -0.291473388671875, -0.2807273864746094, -0.26998138427734375, -0.2592353820800781, -0.2484893798828125, -0.23774337768554688, -0.22699737548828125, -0.21625137329101562, -0.20550537109375, -0.19475936889648438, -0.18401336669921875, -0.17326736450195312, -0.1625213623046875, -0.15177536010742188, -0.14102935791015625, -0.13028335571289062, -0.119537353515625, -0.10879135131835938, -0.09804534912109375, -0.08729934692382812, -0.0765533447265625, -0.06580734252929688, -0.05506134033203125, -0.044315338134765625, -0.0335693359375, -0.022823333740234375, -0.01207733154296875, -0.001331329345703125, 0.0094146728515625, 0.020160675048828125, 0.03090667724609375, 0.041652679443359375, 0.052398681640625, 0.06314468383789062, 0.07389068603515625, 0.08463668823242188, 0.0953826904296875, 0.10612869262695312, 0.11687469482421875, 0.12762069702148438, 0.13836669921875, 0.14911270141601562, 0.15985870361328125, 0.17060470581054688, 0.1813507080078125, 0.19209671020507812, 0.20284271240234375, 0.21358871459960938, 0.224334716796875, 0.23508071899414062, 0.24582672119140625, 0.2565727233886719, 0.2673187255859375, 0.2780647277832031, 0.28881072998046875, 0.2995567321777344, 0.310302734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 3.0, 10.0, 14.0, 18.0, 17.0, 30.0, 71.0, 99.0, 160.0, 179.0, 164.0, 91.0, 55.0, 22.0, 22.0, 14.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.0779581069946289, -0.07510566711425781, -0.07225322723388672, -0.06940078735351562, -0.06654834747314453, -0.06369590759277344, -0.060843467712402344, -0.05799102783203125, -0.055138587951660156, -0.05228614807128906, -0.04943370819091797, -0.046581268310546875, -0.04372882843017578, -0.04087638854980469, -0.038023948669433594, -0.0351715087890625, -0.032319068908691406, -0.029466629028320312, -0.02661418914794922, -0.023761749267578125, -0.02090930938720703, -0.018056869506835938, -0.015204429626464844, -0.01235198974609375, -0.009499549865722656, -0.0066471099853515625, -0.0037946701049804688, -0.000942230224609375, 0.0019102096557617188, 0.0047626495361328125, 0.007615089416503906, 0.010467529296875, 0.013319969177246094, 0.016172409057617188, 0.01902484893798828, 0.021877288818359375, 0.02472972869873047, 0.027582168579101562, 0.030434608459472656, 0.03328704833984375, 0.036139488220214844, 0.03899192810058594, 0.04184436798095703, 0.044696807861328125, 0.04754924774169922, 0.05040168762207031, 0.053254127502441406, 0.0561065673828125, 0.058959007263183594, 0.06181144714355469, 0.06466388702392578, 0.06751632690429688, 0.07036876678466797, 0.07322120666503906, 0.07607364654541016, 0.07892608642578125, 0.08177852630615234, 0.08463096618652344, 0.08748340606689453, 0.09033584594726562, 0.09318828582763672, 0.09604072570800781, 0.0988931655883789, 0.10174560546875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 9.0, 16.0, 16.0, 33.0, 55.0, 70.0, 76.0, 104.0, 106.0, 106.0, 96.0, 85.0, 66.0, 60.0, 34.0, 27.0, 13.0, 10.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6006758809089661, -0.5724876523017883, -0.5442994236946106, -0.5161111950874329, -0.4879229664802551, -0.4597347378730774, -0.43154647946357727, -0.40335825085639954, -0.3751700222492218, -0.34698179364204407, -0.31879356503486633, -0.2906053066253662, -0.2624170780181885, -0.23422886431217194, -0.206040620803833, -0.17785239219665527, -0.14966416358947754, -0.1214759349822998, -0.09328769892454147, -0.06509946286678314, -0.03691123425960541, -0.008723005652427673, 0.019465237855911255, 0.04765346646308899, 0.07584169507026672, 0.10402992367744446, 0.1322181522846222, 0.16040639579296112, 0.18859462440013885, 0.2167828530073166, 0.24497109651565552, 0.27315932512283325, 0.30134761333465576, 0.3295358419418335, 0.35772407054901123, 0.38591229915618896, 0.4141005277633667, 0.44228875637054443, 0.47047701478004456, 0.4986652433872223, 0.5268534421920776, 0.5550416707992554, 0.5832298994064331, 0.6114181280136108, 0.6396063566207886, 0.6677945852279663, 0.695982813835144, 0.7241710424423218, 0.7523593306541443, 0.780547559261322, 0.8087357878684998, 0.8369240164756775, 0.8651122450828552, 0.893300473690033, 0.9214887619018555, 0.9496769905090332, 0.9778652191162109, 1.0060534477233887, 1.0342416763305664, 1.0624299049377441, 1.0906181335449219, 1.1188063621520996, 1.1469945907592773, 1.175182819366455, 1.2033710479736328]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 12.0, 7.0, 6.0, 8.0, 5.0, 13.0, 14.0, 12.0, 20.0, 23.0, 19.0, 20.0, 30.0, 30.0, 38.0, 41.0, 43.0, 43.0, 38.0, 43.0, 43.0, 45.0, 51.0, 36.0, 45.0, 47.0, 41.0, 25.0, 32.0, 26.0, 19.0, 17.0, 25.0, 16.0, 11.0, 16.0, 9.0, 7.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.45147401094436646, -0.4374980330467224, -0.42352208495140076, -0.4095461368560791, -0.39557015895843506, -0.381594181060791, -0.36761823296546936, -0.3536422848701477, -0.33966630697250366, -0.3256903290748596, -0.31171438097953796, -0.2977384328842163, -0.28376245498657227, -0.2697864770889282, -0.25581052899360657, -0.24183456599712372, -0.22785860300064087, -0.21388264000415802, -0.19990667700767517, -0.18593071401119232, -0.17195475101470947, -0.15797878801822662, -0.14400282502174377, -0.13002686202526093, -0.11605089902877808, -0.10207493603229523, -0.08809897303581238, -0.07412301003932953, -0.06014704704284668, -0.04617108404636383, -0.03219512104988098, -0.018219158053398132, -0.004243195056915283, 0.009732767939567566, 0.023708730936050415, 0.037684693932533264, 0.05166065692901611, 0.06563661992549896, 0.07961258292198181, 0.09358854591846466, 0.10756450891494751, 0.12154047191143036, 0.1355164349079132, 0.14949239790439606, 0.1634683609008789, 0.17744432389736176, 0.1914202868938446, 0.20539624989032745, 0.2193722128868103, 0.23334817588329315, 0.247324138879776, 0.26130008697509766, 0.2752760648727417, 0.28925204277038574, 0.3032279908657074, 0.31720393896102905, 0.3311799168586731, 0.34515589475631714, 0.3591318428516388, 0.37310779094696045, 0.3870837688446045, 0.40105974674224854, 0.4150356948375702, 0.42901164293289185, 0.4429876208305359]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 10.0, 13.0, 12.0, 35.0, 34.0, 73.0, 108.0, 181.0, 294.0, 514.0, 893.0, 1836.0, 3586.0, 7416.0, 17097.0, 44663.0, 153963.0, 478989.0, 236135.0, 61706.0, 22156.0, 9619.0, 4420.0, 2211.0, 1101.0, 583.0, 330.0, 208.0, 110.0, 72.0, 44.0, 38.0, 27.0, 18.0, 18.0, 12.0, 9.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.65869140625, -0.6371994018554688, -0.6157073974609375, -0.5942153930664062, -0.572723388671875, -0.5512313842773438, -0.5297393798828125, -0.5082473754882812, -0.48675537109375, -0.46526336669921875, -0.4437713623046875, -0.42227935791015625, -0.400787353515625, -0.37929534912109375, -0.3578033447265625, -0.33631134033203125, -0.3148193359375, -0.29332733154296875, -0.2718353271484375, -0.25034332275390625, -0.228851318359375, -0.20735931396484375, -0.1858673095703125, -0.16437530517578125, -0.14288330078125, -0.12139129638671875, -0.0998992919921875, -0.07840728759765625, -0.056915283203125, -0.03542327880859375, -0.0139312744140625, 0.00756072998046875, 0.029052734375, 0.05054473876953125, 0.0720367431640625, 0.09352874755859375, 0.115020751953125, 0.13651275634765625, 0.1580047607421875, 0.17949676513671875, 0.20098876953125, 0.22248077392578125, 0.2439727783203125, 0.26546478271484375, 0.286956787109375, 0.30844879150390625, 0.3299407958984375, 0.35143280029296875, 0.3729248046875, 0.39441680908203125, 0.4159088134765625, 0.43740081787109375, 0.458892822265625, 0.48038482666015625, 0.5018768310546875, 0.5233688354492188, 0.54486083984375, 0.5663528442382812, 0.5878448486328125, 0.6093368530273438, 0.630828857421875, 0.6523208618164062, 0.6738128662109375, 0.6953048706054688, 0.716796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 8.0, 6.0, 9.0, 7.0, 14.0, 15.0, 14.0, 27.0, 36.0, 28.0, 40.0, 34.0, 46.0, 38.0, 45.0, 55.0, 55.0, 50.0, 42.0, 51.0, 54.0, 38.0, 50.0, 34.0, 29.0, 28.0, 15.0, 20.0, 20.0, 11.0, 10.0, 8.0, 12.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.1416015625, -1.1098403930664062, -1.0780792236328125, -1.0463180541992188, -1.014556884765625, -0.9827957153320312, -0.9510345458984375, -0.9192733764648438, -0.88751220703125, -0.8557510375976562, -0.8239898681640625, -0.7922286987304688, -0.760467529296875, -0.7287063598632812, -0.6969451904296875, -0.6651840209960938, -0.6334228515625, -0.6016616821289062, -0.5699005126953125, -0.5381393432617188, -0.506378173828125, -0.47461700439453125, -0.4428558349609375, -0.41109466552734375, -0.37933349609375, -0.34757232666015625, -0.3158111572265625, -0.28404998779296875, -0.252288818359375, -0.22052764892578125, -0.1887664794921875, -0.15700531005859375, -0.125244140625, -0.09348297119140625, -0.0617218017578125, -0.02996063232421875, 0.001800537109375, 0.03356170654296875, 0.0653228759765625, 0.09708404541015625, 0.12884521484375, 0.16060638427734375, 0.1923675537109375, 0.22412872314453125, 0.255889892578125, 0.28765106201171875, 0.3194122314453125, 0.35117340087890625, 0.3829345703125, 0.41469573974609375, 0.4464569091796875, 0.47821807861328125, 0.509979248046875, 0.5417404174804688, 0.5735015869140625, 0.6052627563476562, 0.63702392578125, 0.6687850952148438, 0.7005462646484375, 0.7323074340820312, 0.764068603515625, 0.7958297729492188, 0.8275909423828125, 0.8593521118164062, 0.89111328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 1.0, 4.0, 3.0, 9.0, 11.0, 11.0, 34.0, 45.0, 77.0, 131.0, 338.0, 1086.0, 7947.0, 162601.0, 837364.0, 35008.0, 2818.0, 571.0, 229.0, 105.0, 65.0, 35.0, 24.0, 13.0, 5.0, 4.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91796875, -1.852447509765625, -1.78692626953125, -1.721405029296875, -1.6558837890625, -1.590362548828125, -1.52484130859375, -1.459320068359375, -1.393798828125, -1.328277587890625, -1.26275634765625, -1.197235107421875, -1.1317138671875, -1.066192626953125, -1.00067138671875, -0.935150146484375, -0.86962890625, -0.804107666015625, -0.73858642578125, -0.673065185546875, -0.6075439453125, -0.542022705078125, -0.47650146484375, -0.410980224609375, -0.345458984375, -0.279937744140625, -0.21441650390625, -0.148895263671875, -0.0833740234375, -0.017852783203125, 0.04766845703125, 0.113189697265625, 0.1787109375, 0.244232177734375, 0.30975341796875, 0.375274658203125, 0.4407958984375, 0.506317138671875, 0.57183837890625, 0.637359619140625, 0.702880859375, 0.768402099609375, 0.83392333984375, 0.899444580078125, 0.9649658203125, 1.030487060546875, 1.09600830078125, 1.161529541015625, 1.22705078125, 1.292572021484375, 1.35809326171875, 1.423614501953125, 1.4891357421875, 1.554656982421875, 1.62017822265625, 1.685699462890625, 1.751220703125, 1.816741943359375, 1.88226318359375, 1.947784423828125, 2.0133056640625, 2.078826904296875, 2.14434814453125, 2.209869384765625, 2.275390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 12.0, 7.0, 13.0, 21.0, 21.0, 19.0, 30.0, 31.0, 46.0, 37.0, 53.0, 46.0, 57.0, 61.0, 65.0, 59.0, 70.0, 50.0, 42.0, 34.0, 46.0, 34.0, 23.0, 22.0, 28.0, 17.0, 15.0, 5.0, 8.0, 6.0, 1.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4404296875, -1.396240234375, -1.35205078125, -1.307861328125, -1.263671875, -1.219482421875, -1.17529296875, -1.131103515625, -1.0869140625, -1.042724609375, -0.99853515625, -0.954345703125, -0.91015625, -0.865966796875, -0.82177734375, -0.777587890625, -0.7333984375, -0.689208984375, -0.64501953125, -0.600830078125, -0.556640625, -0.512451171875, -0.46826171875, -0.424072265625, -0.3798828125, -0.335693359375, -0.29150390625, -0.247314453125, -0.203125, -0.158935546875, -0.11474609375, -0.070556640625, -0.0263671875, 0.017822265625, 0.06201171875, 0.106201171875, 0.150390625, 0.194580078125, 0.23876953125, 0.282958984375, 0.3271484375, 0.371337890625, 0.41552734375, 0.459716796875, 0.50390625, 0.548095703125, 0.59228515625, 0.636474609375, 0.6806640625, 0.724853515625, 0.76904296875, 0.813232421875, 0.857421875, 0.901611328125, 0.94580078125, 0.989990234375, 1.0341796875, 1.078369140625, 1.12255859375, 1.166748046875, 1.2109375, 1.255126953125, 1.29931640625, 1.343505859375, 1.3876953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 18.0, 19.0, 39.0, 50.0, 64.0, 133.0, 226.0, 474.0, 1569.0, 5858.0, 34807.0, 383829.0, 561163.0, 49652.0, 7577.0, 1891.0, 586.0, 257.0, 135.0, 72.0, 52.0, 20.0, 19.0, 3.0, 11.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.3451423645019531, -0.33530426025390625, -0.3254661560058594, -0.3156280517578125, -0.3057899475097656, -0.29595184326171875, -0.2861137390136719, -0.276275634765625, -0.2664375305175781, -0.25659942626953125, -0.24676132202148438, -0.2369232177734375, -0.22708511352539062, -0.21724700927734375, -0.20740890502929688, -0.19757080078125, -0.18773269653320312, -0.17789459228515625, -0.16805648803710938, -0.1582183837890625, -0.14838027954101562, -0.13854217529296875, -0.12870407104492188, -0.118865966796875, -0.10902786254882812, -0.09918975830078125, -0.08935165405273438, -0.0795135498046875, -0.06967544555664062, -0.05983734130859375, -0.049999237060546875, -0.0401611328125, -0.030323028564453125, -0.02048492431640625, -0.010646820068359375, -0.0008087158203125, 0.009029388427734375, 0.01886749267578125, 0.028705596923828125, 0.038543701171875, 0.048381805419921875, 0.05821990966796875, 0.06805801391601562, 0.0778961181640625, 0.08773422241210938, 0.09757232666015625, 0.10741043090820312, 0.11724853515625, 0.12708663940429688, 0.13692474365234375, 0.14676284790039062, 0.1566009521484375, 0.16643905639648438, 0.17627716064453125, 0.18611526489257812, 0.195953369140625, 0.20579147338867188, 0.21562957763671875, 0.22546768188476562, 0.2353057861328125, 0.24514389038085938, 0.25498199462890625, 0.2648200988769531, 0.274658203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 1.0, 7.0, 7.0, 7.0, 9.0, 14.0, 16.0, 14.0, 26.0, 34.0, 38.0, 45.0, 65.0, 69.0, 87.0, 105.0, 91.0, 74.0, 58.0, 57.0, 40.0, 35.0, 18.0, 17.0, 20.0, 10.0, 14.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.820657730102539e-05, -3.7212856113910675e-05, -3.621913492679596e-05, -3.5225413739681244e-05, -3.423169255256653e-05, -3.323797136545181e-05, -3.22442501783371e-05, -3.125052899122238e-05, -3.0256807804107666e-05, -2.926308661699295e-05, -2.8269365429878235e-05, -2.727564424276352e-05, -2.6281923055648804e-05, -2.5288201868534088e-05, -2.4294480681419373e-05, -2.3300759494304657e-05, -2.230703830718994e-05, -2.1313317120075226e-05, -2.031959593296051e-05, -1.9325874745845795e-05, -1.833215355873108e-05, -1.7338432371616364e-05, -1.6344711184501648e-05, -1.5350989997386932e-05, -1.4357268810272217e-05, -1.3363547623157501e-05, -1.2369826436042786e-05, -1.137610524892807e-05, -1.0382384061813354e-05, -9.388662874698639e-06, -8.394941687583923e-06, -7.401220500469208e-06, -6.407499313354492e-06, -5.413778126239777e-06, -4.420056939125061e-06, -3.4263357520103455e-06, -2.43261456489563e-06, -1.4388933777809143e-06, -4.4517219066619873e-07, 5.485489964485168e-07, 1.5422701835632324e-06, 2.535991370677948e-06, 3.5297125577926636e-06, 4.523433744907379e-06, 5.517154932022095e-06, 6.51087611913681e-06, 7.504597306251526e-06, 8.498318493366241e-06, 9.492039680480957e-06, 1.0485760867595673e-05, 1.1479482054710388e-05, 1.2473203241825104e-05, 1.346692442893982e-05, 1.4460645616054535e-05, 1.545436680316925e-05, 1.6448087990283966e-05, 1.744180917739868e-05, 1.8435530364513397e-05, 1.9429251551628113e-05, 2.042297273874283e-05, 2.1416693925857544e-05, 2.241041511297226e-05, 2.3404136300086975e-05, 2.439785748720169e-05, 2.5391578674316406e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 7.0, 5.0, 10.0, 15.0, 19.0, 30.0, 59.0, 107.0, 210.0, 515.0, 1360.0, 4677.0, 28212.0, 464922.0, 510321.0, 30700.0, 4909.0, 1467.0, 491.0, 222.0, 110.0, 60.0, 30.0, 21.0, 15.0, 13.0, 10.0, 3.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.40673828125, -0.3931884765625, -0.379638671875, -0.3660888671875, -0.3525390625, -0.3389892578125, -0.325439453125, -0.3118896484375, -0.29833984375, -0.2847900390625, -0.271240234375, -0.2576904296875, -0.244140625, -0.2305908203125, -0.217041015625, -0.2034912109375, -0.18994140625, -0.1763916015625, -0.162841796875, -0.1492919921875, -0.1357421875, -0.1221923828125, -0.108642578125, -0.0950927734375, -0.08154296875, -0.0679931640625, -0.054443359375, -0.0408935546875, -0.02734375, -0.0137939453125, -0.000244140625, 0.0133056640625, 0.02685546875, 0.0404052734375, 0.053955078125, 0.0675048828125, 0.0810546875, 0.0946044921875, 0.108154296875, 0.1217041015625, 0.13525390625, 0.1488037109375, 0.162353515625, 0.1759033203125, 0.189453125, 0.2030029296875, 0.216552734375, 0.2301025390625, 0.24365234375, 0.2572021484375, 0.270751953125, 0.2843017578125, 0.2978515625, 0.3114013671875, 0.324951171875, 0.3385009765625, 0.35205078125, 0.3656005859375, 0.379150390625, 0.3927001953125, 0.40625, 0.4197998046875, 0.433349609375, 0.4468994140625, 0.46044921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 7.0, 16.0, 17.0, 35.0, 50.0, 66.0, 98.0, 129.0, 133.0, 139.0, 87.0, 71.0, 45.0, 32.0, 28.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2032470703125, -0.19715309143066406, -0.19105911254882812, -0.1849651336669922, -0.17887115478515625, -0.1727771759033203, -0.16668319702148438, -0.16058921813964844, -0.1544952392578125, -0.14840126037597656, -0.14230728149414062, -0.1362133026123047, -0.13011932373046875, -0.12402534484863281, -0.11793136596679688, -0.11183738708496094, -0.105743408203125, -0.09964942932128906, -0.09355545043945312, -0.08746147155761719, -0.08136749267578125, -0.07527351379394531, -0.06917953491210938, -0.06308555603027344, -0.0569915771484375, -0.05089759826660156, -0.044803619384765625, -0.03870964050292969, -0.03261566162109375, -0.026521682739257812, -0.020427703857421875, -0.014333724975585938, -0.00823974609375, -0.0021457672119140625, 0.003948211669921875, 0.010042190551757812, 0.01613616943359375, 0.022230148315429688, 0.028324127197265625, 0.03441810607910156, 0.0405120849609375, 0.04660606384277344, 0.052700042724609375, 0.05879402160644531, 0.06488800048828125, 0.07098197937011719, 0.07707595825195312, 0.08316993713378906, 0.089263916015625, 0.09535789489746094, 0.10145187377929688, 0.10754585266113281, 0.11363983154296875, 0.11973381042480469, 0.12582778930664062, 0.13192176818847656, 0.1380157470703125, 0.14410972595214844, 0.15020370483398438, 0.1562976837158203, 0.16239166259765625, 0.1684856414794922, 0.17457962036132812, 0.18067359924316406, 0.186767578125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 10.0, 30.0, 47.0, 71.0, 100.0, 149.0, 141.0, 138.0, 119.0, 83.0, 48.0, 26.0, 15.0, 13.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.666508674621582, -3.582791328430176, -3.4990737438201904, -3.415356397628784, -3.331639051437378, -3.2479214668273926, -3.1642041206359863, -3.08048677444458, -2.996769428253174, -2.9130520820617676, -2.8293344974517822, -2.745617151260376, -2.6618998050689697, -2.5781822204589844, -2.494464874267578, -2.410747528076172, -2.3270299434661865, -2.2433125972747803, -2.159595012664795, -2.0758776664733887, -1.9921603202819824, -1.9084428548812866, -1.8247253894805908, -1.7410080432891846, -1.6572905778884888, -1.573573112487793, -1.4898557662963867, -1.406138300895691, -1.3224208354949951, -1.2387034893035889, -1.154986023902893, -1.0712685585021973, -0.9875510931015015, -0.9038336873054504, -0.8201162815093994, -0.7363988161087036, -0.6526814103126526, -0.5689640045166016, -0.48524653911590576, -0.40152913331985474, -0.3178117275238037, -0.2340943068265915, -0.15037688612937927, -0.06665945053100586, 0.017057955265045166, 0.10077536106109619, 0.184492826461792, 0.268210232257843, 0.35192763805389404, 0.43564504384994507, 0.5193624496459961, 0.6030799150466919, 0.6867973208427429, 0.770514726638794, 0.8542321920394897, 0.9379495978355408, 1.0216670036315918, 1.1053844690322876, 1.1891018152236938, 1.2728192806243896, 1.356536626815796, 1.4402540922164917, 1.5239715576171875, 1.6076889038085938, 1.6914063692092896]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 8.0, 14.0, 10.0, 14.0, 16.0, 24.0, 18.0, 22.0, 23.0, 27.0, 32.0, 37.0, 37.0, 40.0, 33.0, 42.0, 34.0, 45.0, 34.0, 38.0, 54.0, 46.0, 38.0, 36.0, 33.0, 25.0, 34.0, 32.0, 27.0, 17.0, 15.0, 17.0, 18.0, 13.0, 11.0, 7.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.075371742248535, -2.0160861015319824, -1.9568005800247192, -1.897515058517456, -1.8382294178009033, -1.7789438962936401, -1.719658374786377, -1.6603727340698242, -1.601087212562561, -1.5418016910552979, -1.4825160503387451, -1.423230528831482, -1.3639450073242188, -1.304659366607666, -1.2453738451004028, -1.1860883235931396, -1.126802682876587, -1.0675171613693237, -1.008231520652771, -0.9489459991455078, -0.8896604180335999, -0.8303748369216919, -0.7710893154144287, -0.7118037343025208, -0.6525181531906128, -0.5932325720787048, -0.5339469909667969, -0.4746614694595337, -0.41537588834762573, -0.3560903072357178, -0.2968047559261322, -0.23751920461654663, -0.17823362350463867, -0.1189480572938919, -0.05966249108314514, -0.00037692487239837646, 0.05890864133834839, 0.11819422245025635, 0.17747977375984192, 0.2367653250694275, 0.29605090618133545, 0.3553364872932434, 0.414622038602829, 0.47390758991241455, 0.5331931710243225, 0.5924787521362305, 0.6517642736434937, 0.7110498547554016, 0.7703354358673096, 0.8296210169792175, 0.8889065980911255, 0.9481921195983887, 1.0074777603149414, 1.0667632818222046, 1.1260488033294678, 1.1853344440460205, 1.2446199655532837, 1.3039054870605469, 1.3631911277770996, 1.4224766492843628, 1.481762170791626, 1.5410478115081787, 1.600333333015442, 1.659618854522705, 1.7189044952392578]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 4.0, 16.0, 15.0, 21.0, 26.0, 37.0, 35.0, 89.0, 124.0, 192.0, 410.0, 833.0, 2009.0, 4908.0, 15662.0, 87331.0, 1804943.0, 2152950.0, 98059.0, 17078.0, 5465.0, 2089.0, 929.0, 406.0, 227.0, 123.0, 88.0, 53.0, 41.0, 20.0, 21.0, 8.0, 9.0, 10.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6123046875, -1.5687713623046875, -1.525238037109375, -1.4817047119140625, -1.43817138671875, -1.3946380615234375, -1.351104736328125, -1.3075714111328125, -1.2640380859375, -1.2205047607421875, -1.176971435546875, -1.1334381103515625, -1.08990478515625, -1.0463714599609375, -1.002838134765625, -0.9593048095703125, -0.915771484375, -0.8722381591796875, -0.828704833984375, -0.7851715087890625, -0.74163818359375, -0.6981048583984375, -0.654571533203125, -0.6110382080078125, -0.5675048828125, -0.5239715576171875, -0.480438232421875, -0.4369049072265625, -0.39337158203125, -0.3498382568359375, -0.306304931640625, -0.2627716064453125, -0.21923828125, -0.1757049560546875, -0.132171630859375, -0.0886383056640625, -0.04510498046875, -0.0015716552734375, 0.041961669921875, 0.0854949951171875, 0.1290283203125, 0.1725616455078125, 0.216094970703125, 0.2596282958984375, 0.30316162109375, 0.3466949462890625, 0.390228271484375, 0.4337615966796875, 0.477294921875, 0.5208282470703125, 0.564361572265625, 0.6078948974609375, 0.65142822265625, 0.6949615478515625, 0.738494873046875, 0.7820281982421875, 0.8255615234375, 0.8690948486328125, 0.912628173828125, 0.9561614990234375, 0.99969482421875, 1.0432281494140625, 1.086761474609375, 1.1302947998046875, 1.173828125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 4.0, 4.0, 11.0, 9.0, 19.0, 12.0, 14.0, 23.0, 24.0, 16.0, 29.0, 30.0, 31.0, 36.0, 43.0, 26.0, 42.0, 39.0, 52.0, 38.0, 40.0, 39.0, 60.0, 48.0, 34.0, 37.0, 33.0, 29.0, 26.0, 21.0, 13.0, 20.0, 10.0, 16.0, 12.0, 10.0, 6.0, 3.0, 6.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4208984375, -0.40557098388671875, -0.3902435302734375, -0.37491607666015625, -0.359588623046875, -0.34426116943359375, -0.3289337158203125, -0.31360626220703125, -0.29827880859375, -0.28295135498046875, -0.2676239013671875, -0.25229644775390625, -0.236968994140625, -0.22164154052734375, -0.2063140869140625, -0.19098663330078125, -0.1756591796875, -0.16033172607421875, -0.1450042724609375, -0.12967681884765625, -0.114349365234375, -0.09902191162109375, -0.0836944580078125, -0.06836700439453125, -0.05303955078125, -0.03771209716796875, -0.0223846435546875, -0.00705718994140625, 0.008270263671875, 0.02359771728515625, 0.0389251708984375, 0.05425262451171875, 0.069580078125, 0.08490753173828125, 0.1002349853515625, 0.11556243896484375, 0.130889892578125, 0.14621734619140625, 0.1615447998046875, 0.17687225341796875, 0.19219970703125, 0.20752716064453125, 0.2228546142578125, 0.23818206787109375, 0.253509521484375, 0.26883697509765625, 0.2841644287109375, 0.29949188232421875, 0.3148193359375, 0.33014678955078125, 0.3454742431640625, 0.36080169677734375, 0.376129150390625, 0.39145660400390625, 0.4067840576171875, 0.42211151123046875, 0.43743896484375, 0.45276641845703125, 0.4680938720703125, 0.48342132568359375, 0.498748779296875, 0.5140762329101562, 0.5294036865234375, 0.5447311401367188, 0.56005859375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 10.0, 8.0, 7.0, 10.0, 15.0, 43.0, 69.0, 90.0, 174.0, 491.0, 2270.0, 23487.0, 3339438.0, 813528.0, 12327.0, 1525.0, 417.0, 152.0, 78.0, 46.0, 28.0, 23.0, 16.0, 11.0, 2.0, 9.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.619140625, -2.5369873046875, -2.454833984375, -2.3726806640625, -2.29052734375, -2.2083740234375, -2.126220703125, -2.0440673828125, -1.9619140625, -1.8797607421875, -1.797607421875, -1.7154541015625, -1.63330078125, -1.5511474609375, -1.468994140625, -1.3868408203125, -1.3046875, -1.2225341796875, -1.140380859375, -1.0582275390625, -0.97607421875, -0.8939208984375, -0.811767578125, -0.7296142578125, -0.6474609375, -0.5653076171875, -0.483154296875, -0.4010009765625, -0.31884765625, -0.2366943359375, -0.154541015625, -0.0723876953125, 0.009765625, 0.0919189453125, 0.174072265625, 0.2562255859375, 0.33837890625, 0.4205322265625, 0.502685546875, 0.5848388671875, 0.6669921875, 0.7491455078125, 0.831298828125, 0.9134521484375, 0.99560546875, 1.0777587890625, 1.159912109375, 1.2420654296875, 1.32421875, 1.4063720703125, 1.488525390625, 1.5706787109375, 1.65283203125, 1.7349853515625, 1.817138671875, 1.8992919921875, 1.9814453125, 2.0635986328125, 2.145751953125, 2.2279052734375, 2.31005859375, 2.3922119140625, 2.474365234375, 2.5565185546875, 2.638671875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 10.0, 4.0, 4.0, 11.0, 10.0, 14.0, 22.0, 34.0, 47.0, 47.0, 76.0, 112.0, 211.0, 334.0, 449.0, 498.0, 566.0, 510.0, 344.0, 247.0, 159.0, 101.0, 69.0, 39.0, 33.0, 21.0, 28.0, 13.0, 11.0, 16.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.337890625, -0.3280372619628906, -0.31818389892578125, -0.3083305358886719, -0.2984771728515625, -0.2886238098144531, -0.27877044677734375, -0.2689170837402344, -0.259063720703125, -0.24921035766601562, -0.23935699462890625, -0.22950363159179688, -0.2196502685546875, -0.20979690551757812, -0.19994354248046875, -0.19009017944335938, -0.18023681640625, -0.17038345336914062, -0.16053009033203125, -0.15067672729492188, -0.1408233642578125, -0.13097000122070312, -0.12111663818359375, -0.11126327514648438, -0.101409912109375, -0.09155654907226562, -0.08170318603515625, -0.07184982299804688, -0.0619964599609375, -0.052143096923828125, -0.04228973388671875, -0.032436370849609375, -0.0225830078125, -0.012729644775390625, -0.00287628173828125, 0.006977081298828125, 0.0168304443359375, 0.026683807373046875, 0.03653717041015625, 0.046390533447265625, 0.056243896484375, 0.06609725952148438, 0.07595062255859375, 0.08580398559570312, 0.0956573486328125, 0.10551071166992188, 0.11536407470703125, 0.12521743774414062, 0.13507080078125, 0.14492416381835938, 0.15477752685546875, 0.16463088989257812, 0.1744842529296875, 0.18433761596679688, 0.19419097900390625, 0.20404434204101562, 0.213897705078125, 0.22375106811523438, 0.23360443115234375, 0.24345779418945312, 0.2533111572265625, 0.2631645202636719, 0.27301788330078125, 0.2828712463378906, 0.292724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 2.0, 13.0, 12.0, 10.0, 15.0, 27.0, 21.0, 26.0, 30.0, 32.0, 39.0, 54.0, 56.0, 57.0, 55.0, 59.0, 46.0, 55.0, 54.0, 34.0, 48.0, 41.0, 36.0, 38.0, 30.0, 25.0, 18.0, 12.0, 10.0, 15.0, 9.0, 5.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7114796042442322, -0.6886913776397705, -0.6659030914306641, -0.6431148052215576, -0.620326578617096, -0.5975383520126343, -0.5747500658035278, -0.5519617795944214, -0.5291735529899597, -0.506385326385498, -0.4835970401763916, -0.46080878376960754, -0.4380205273628235, -0.41523227095603943, -0.39244401454925537, -0.3696557581424713, -0.34686750173568726, -0.3240792453289032, -0.30129098892211914, -0.2785027325153351, -0.255714476108551, -0.23292621970176697, -0.2101379632949829, -0.18734970688819885, -0.1645614504814148, -0.14177319407463074, -0.11898493766784668, -0.09619668126106262, -0.07340842485427856, -0.05062016844749451, -0.02783191204071045, -0.005043655633926392, 0.01774466037750244, 0.0405329167842865, 0.06332117319107056, 0.08610942959785461, 0.10889768600463867, 0.13168594241142273, 0.1544741988182068, 0.17726245522499084, 0.2000507116317749, 0.22283896803855896, 0.24562722444534302, 0.2684154808521271, 0.29120373725891113, 0.3139919936656952, 0.33678025007247925, 0.3595685064792633, 0.38235676288604736, 0.4051450192928314, 0.4279332756996155, 0.45072153210639954, 0.4735097885131836, 0.49629804491996765, 0.5190863013267517, 0.5418745279312134, 0.5646628141403198, 0.5874511003494263, 0.6102393269538879, 0.6330275535583496, 0.655815839767456, 0.6786041259765625, 0.7013923525810242, 0.7241805791854858, 0.7469688653945923]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 12.0, 5.0, 6.0, 12.0, 15.0, 9.0, 11.0, 12.0, 19.0, 20.0, 22.0, 23.0, 38.0, 28.0, 30.0, 25.0, 50.0, 40.0, 41.0, 41.0, 36.0, 54.0, 42.0, 39.0, 43.0, 36.0, 38.0, 28.0, 39.0, 22.0, 32.0, 16.0, 17.0, 16.0, 15.0, 16.0, 15.0, 4.0, 7.0, 7.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6414443254470825, -0.6223491430282593, -0.603253960609436, -0.5841587781906128, -0.5650635957717896, -0.5459684133529663, -0.5268732309341431, -0.5077780485153198, -0.4886828362941742, -0.46958765387535095, -0.4504924714565277, -0.43139728903770447, -0.41230207681655884, -0.3932068943977356, -0.37411171197891235, -0.3550165295600891, -0.33592134714126587, -0.3168261647224426, -0.2977309823036194, -0.27863579988479614, -0.2595406174659729, -0.24044542014598846, -0.22135022282600403, -0.2022550404071808, -0.18315985798835754, -0.1640646755695343, -0.14496949315071106, -0.12587429583072662, -0.10677911341190338, -0.08768393099308014, -0.0685887411236763, -0.04949355125427246, -0.030398309230804443, -0.011303123086690903, 0.007792063057422638, 0.02688724920153618, 0.04598243534564972, 0.06507761776447296, 0.0841728076338768, 0.10326799750328064, 0.12236317992210388, 0.14145836234092712, 0.16055354475975037, 0.1796487420797348, 0.19874392449855804, 0.2178391069173813, 0.23693430423736572, 0.25602948665618896, 0.2751246690750122, 0.29421985149383545, 0.3133150339126587, 0.33241021633148193, 0.3515053987503052, 0.3706005811691284, 0.38969579339027405, 0.4087909758090973, 0.42788615822792053, 0.4469813406467438, 0.466076523065567, 0.48517170548439026, 0.5042669177055359, 0.5233621001243591, 0.5424572825431824, 0.5615524649620056, 0.5806476473808289]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 12.0, 6.0, 12.0, 18.0, 29.0, 35.0, 44.0, 84.0, 74.0, 132.0, 178.0, 299.0, 448.0, 689.0, 1224.0, 2030.0, 3930.0, 8616.0, 26019.0, 125414.0, 489423.0, 303829.0, 58182.0, 14828.0, 5887.0, 2930.0, 1554.0, 880.0, 597.0, 392.0, 224.0, 153.0, 100.0, 85.0, 42.0, 43.0, 30.0, 28.0, 15.0, 9.0, 14.0, 8.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2357177734375, -0.2278003692626953, -0.21988296508789062, -0.21196556091308594, -0.20404815673828125, -0.19613075256347656, -0.18821334838867188, -0.1802959442138672, -0.1723785400390625, -0.1644611358642578, -0.15654373168945312, -0.14862632751464844, -0.14070892333984375, -0.13279151916503906, -0.12487411499023438, -0.11695671081542969, -0.109039306640625, -0.10112190246582031, -0.09320449829101562, -0.08528709411621094, -0.07736968994140625, -0.06945228576660156, -0.061534881591796875, -0.05361747741699219, -0.0457000732421875, -0.03778266906738281, -0.029865264892578125, -0.021947860717773438, -0.01403045654296875, -0.0061130523681640625, 0.001804351806640625, 0.009721755981445312, 0.01763916015625, 0.025556564331054688, 0.033473968505859375, 0.04139137268066406, 0.04930877685546875, 0.05722618103027344, 0.06514358520507812, 0.07306098937988281, 0.0809783935546875, 0.08889579772949219, 0.09681320190429688, 0.10473060607910156, 0.11264801025390625, 0.12056541442871094, 0.12848281860351562, 0.1364002227783203, 0.144317626953125, 0.1522350311279297, 0.16015243530273438, 0.16806983947753906, 0.17598724365234375, 0.18390464782714844, 0.19182205200195312, 0.1997394561767578, 0.2076568603515625, 0.2155742645263672, 0.22349166870117188, 0.23140907287597656, 0.23932647705078125, 0.24724388122558594, 0.2551612854003906, 0.2630786895751953, 0.27099609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 5.0, 7.0, 14.0, 4.0, 15.0, 11.0, 18.0, 22.0, 16.0, 32.0, 30.0, 27.0, 33.0, 39.0, 37.0, 40.0, 46.0, 44.0, 45.0, 62.0, 41.0, 45.0, 39.0, 39.0, 35.0, 31.0, 37.0, 22.0, 30.0, 22.0, 20.0, 10.0, 13.0, 11.0, 9.0, 10.0, 13.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.414794921875, -0.4024810791015625, -0.390167236328125, -0.3778533935546875, -0.36553955078125, -0.3532257080078125, -0.340911865234375, -0.3285980224609375, -0.3162841796875, -0.3039703369140625, -0.291656494140625, -0.2793426513671875, -0.26702880859375, -0.2547149658203125, -0.242401123046875, -0.2300872802734375, -0.2177734375, -0.2054595947265625, -0.193145751953125, -0.1808319091796875, -0.16851806640625, -0.1562042236328125, -0.143890380859375, -0.1315765380859375, -0.1192626953125, -0.1069488525390625, -0.094635009765625, -0.0823211669921875, -0.07000732421875, -0.0576934814453125, -0.045379638671875, -0.0330657958984375, -0.020751953125, -0.0084381103515625, 0.003875732421875, 0.0161895751953125, 0.02850341796875, 0.0408172607421875, 0.053131103515625, 0.0654449462890625, 0.0777587890625, 0.0900726318359375, 0.102386474609375, 0.1147003173828125, 0.12701416015625, 0.1393280029296875, 0.151641845703125, 0.1639556884765625, 0.17626953125, 0.1885833740234375, 0.200897216796875, 0.2132110595703125, 0.22552490234375, 0.2378387451171875, 0.250152587890625, 0.2624664306640625, 0.2747802734375, 0.2870941162109375, 0.299407958984375, 0.3117218017578125, 0.32403564453125, 0.3363494873046875, 0.348663330078125, 0.3609771728515625, 0.373291015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 10.0, 8.0, 14.0, 16.0, 33.0, 84.0, 154.0, 277.0, 787.0, 2383.0, 11759.0, 123790.0, 757381.0, 135391.0, 12461.0, 2573.0, 742.0, 336.0, 161.0, 68.0, 38.0, 31.0, 13.0, 15.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.48773193359375, -0.4739990234375, -0.46026611328125, -0.446533203125, -0.43280029296875, -0.4190673828125, -0.40533447265625, -0.3916015625, -0.37786865234375, -0.3641357421875, -0.35040283203125, -0.336669921875, -0.32293701171875, -0.3092041015625, -0.29547119140625, -0.28173828125, -0.26800537109375, -0.2542724609375, -0.24053955078125, -0.226806640625, -0.21307373046875, -0.1993408203125, -0.18560791015625, -0.171875, -0.15814208984375, -0.1444091796875, -0.13067626953125, -0.116943359375, -0.10321044921875, -0.0894775390625, -0.07574462890625, -0.06201171875, -0.04827880859375, -0.0345458984375, -0.02081298828125, -0.007080078125, 0.00665283203125, 0.0203857421875, 0.03411865234375, 0.0478515625, 0.06158447265625, 0.0753173828125, 0.08905029296875, 0.102783203125, 0.11651611328125, 0.1302490234375, 0.14398193359375, 0.15771484375, 0.17144775390625, 0.1851806640625, 0.19891357421875, 0.212646484375, 0.22637939453125, 0.2401123046875, 0.25384521484375, 0.267578125, 0.28131103515625, 0.2950439453125, 0.30877685546875, 0.322509765625, 0.33624267578125, 0.3499755859375, 0.36370849609375, 0.37744140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 7.0, 8.0, 13.0, 19.0, 15.0, 26.0, 17.0, 25.0, 31.0, 27.0, 30.0, 31.0, 46.0, 50.0, 45.0, 56.0, 49.0, 43.0, 33.0, 58.0, 35.0, 33.0, 38.0, 33.0, 36.0, 24.0, 30.0, 21.0, 26.0, 11.0, 8.0, 8.0, 8.0, 11.0, 11.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.158203125, -1.1236572265625, -1.089111328125, -1.0545654296875, -1.02001953125, -0.9854736328125, -0.950927734375, -0.9163818359375, -0.8818359375, -0.8472900390625, -0.812744140625, -0.7781982421875, -0.74365234375, -0.7091064453125, -0.674560546875, -0.6400146484375, -0.60546875, -0.5709228515625, -0.536376953125, -0.5018310546875, -0.46728515625, -0.4327392578125, -0.398193359375, -0.3636474609375, -0.3291015625, -0.2945556640625, -0.260009765625, -0.2254638671875, -0.19091796875, -0.1563720703125, -0.121826171875, -0.0872802734375, -0.052734375, -0.0181884765625, 0.016357421875, 0.0509033203125, 0.08544921875, 0.1199951171875, 0.154541015625, 0.1890869140625, 0.2236328125, 0.2581787109375, 0.292724609375, 0.3272705078125, 0.36181640625, 0.3963623046875, 0.430908203125, 0.4654541015625, 0.5, 0.5345458984375, 0.569091796875, 0.6036376953125, 0.63818359375, 0.6727294921875, 0.707275390625, 0.7418212890625, 0.7763671875, 0.8109130859375, 0.845458984375, 0.8800048828125, 0.91455078125, 0.9490966796875, 0.983642578125, 1.0181884765625, 1.052734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 4.0, 11.0, 20.0, 38.0, 54.0, 98.0, 169.0, 303.0, 562.0, 1053.0, 2473.0, 6162.0, 20930.0, 109270.0, 518139.0, 316315.0, 52851.0, 12315.0, 4144.0, 1712.0, 866.0, 465.0, 262.0, 126.0, 75.0, 57.0, 21.0, 25.0, 7.0, 7.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12176513671875, -0.1179351806640625, -0.114105224609375, -0.1102752685546875, -0.1064453125, -0.1026153564453125, -0.098785400390625, -0.0949554443359375, -0.09112548828125, -0.0872955322265625, -0.083465576171875, -0.0796356201171875, -0.0758056640625, -0.0719757080078125, -0.068145751953125, -0.0643157958984375, -0.06048583984375, -0.0566558837890625, -0.052825927734375, -0.0489959716796875, -0.045166015625, -0.0413360595703125, -0.037506103515625, -0.0336761474609375, -0.02984619140625, -0.0260162353515625, -0.022186279296875, -0.0183563232421875, -0.0145263671875, -0.0106964111328125, -0.006866455078125, -0.0030364990234375, 0.00079345703125, 0.0046234130859375, 0.008453369140625, 0.0122833251953125, 0.01611328125, 0.0199432373046875, 0.023773193359375, 0.0276031494140625, 0.03143310546875, 0.0352630615234375, 0.039093017578125, 0.0429229736328125, 0.0467529296875, 0.0505828857421875, 0.054412841796875, 0.0582427978515625, 0.06207275390625, 0.0659027099609375, 0.069732666015625, 0.0735626220703125, 0.077392578125, 0.0812225341796875, 0.085052490234375, 0.0888824462890625, 0.09271240234375, 0.0965423583984375, 0.100372314453125, 0.1042022705078125, 0.1080322265625, 0.1118621826171875, 0.115692138671875, 0.1195220947265625, 0.12335205078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 9.0, 13.0, 15.0, 18.0, 27.0, 53.0, 71.0, 78.0, 104.0, 128.0, 102.0, 98.0, 82.0, 55.0, 29.0, 34.0, 15.0, 14.0, 11.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.389617919921875e-05, -6.201118230819702e-05, -6.012618541717529e-05, -5.8241188526153564e-05, -5.6356191635131836e-05, -5.447119474411011e-05, -5.258619785308838e-05, -5.070120096206665e-05, -4.881620407104492e-05, -4.693120718002319e-05, -4.5046210289001465e-05, -4.3161213397979736e-05, -4.127621650695801e-05, -3.939121961593628e-05, -3.750622272491455e-05, -3.562122583389282e-05, -3.3736228942871094e-05, -3.1851232051849365e-05, -2.9966235160827637e-05, -2.8081238269805908e-05, -2.619624137878418e-05, -2.431124448776245e-05, -2.2426247596740723e-05, -2.0541250705718994e-05, -1.8656253814697266e-05, -1.6771256923675537e-05, -1.4886260032653809e-05, -1.300126314163208e-05, -1.1116266250610352e-05, -9.231269359588623e-06, -7.3462724685668945e-06, -5.461275577545166e-06, -3.5762786865234375e-06, -1.691281795501709e-06, 1.9371509552001953e-07, 2.078711986541748e-06, 3.9637088775634766e-06, 5.848705768585205e-06, 7.733702659606934e-06, 9.618699550628662e-06, 1.150369644165039e-05, 1.3388693332672119e-05, 1.5273690223693848e-05, 1.7158687114715576e-05, 1.9043684005737305e-05, 2.0928680896759033e-05, 2.2813677787780762e-05, 2.469867467880249e-05, 2.658367156982422e-05, 2.8468668460845947e-05, 3.0353665351867676e-05, 3.2238662242889404e-05, 3.412365913391113e-05, 3.600865602493286e-05, 3.789365291595459e-05, 3.977864980697632e-05, 4.166364669799805e-05, 4.3548643589019775e-05, 4.5433640480041504e-05, 4.731863737106323e-05, 4.920363426208496e-05, 5.108863115310669e-05, 5.297362804412842e-05, 5.4858624935150146e-05, 5.6743621826171875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 12.0, 10.0, 19.0, 25.0, 34.0, 59.0, 82.0, 131.0, 174.0, 304.0, 425.0, 773.0, 1228.0, 2092.0, 3611.0, 6396.0, 12420.0, 25215.0, 53398.0, 117848.0, 227050.0, 270822.0, 171222.0, 80170.0, 36663.0, 17485.0, 8967.0, 4885.0, 2756.0, 1558.0, 1005.0, 594.0, 374.0, 239.0, 162.0, 101.0, 66.0, 54.0, 35.0, 22.0, 26.0, 10.0, 7.0, 9.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.05908203125, -0.0573573112487793, -0.055632591247558594, -0.05390787124633789, -0.05218315124511719, -0.050458431243896484, -0.04873371124267578, -0.04700899124145508, -0.045284271240234375, -0.04355955123901367, -0.04183483123779297, -0.040110111236572266, -0.03838539123535156, -0.03666067123413086, -0.034935951232910156, -0.03321123123168945, -0.03148651123046875, -0.029761791229248047, -0.028037071228027344, -0.02631235122680664, -0.024587631225585938, -0.022862911224365234, -0.02113819122314453, -0.019413471221923828, -0.017688751220703125, -0.015964031219482422, -0.014239311218261719, -0.012514591217041016, -0.010789871215820312, -0.00906515121459961, -0.007340431213378906, -0.005615711212158203, -0.0038909912109375, -0.002166271209716797, -0.00044155120849609375, 0.0012831687927246094, 0.0030078887939453125, 0.004732608795166016, 0.006457328796386719, 0.008182048797607422, 0.009906768798828125, 0.011631488800048828, 0.013356208801269531, 0.015080928802490234, 0.016805648803710938, 0.01853036880493164, 0.020255088806152344, 0.021979808807373047, 0.02370452880859375, 0.025429248809814453, 0.027153968811035156, 0.02887868881225586, 0.030603408813476562, 0.032328128814697266, 0.03405284881591797, 0.03577756881713867, 0.037502288818359375, 0.03922700881958008, 0.04095172882080078, 0.042676448822021484, 0.04440116882324219, 0.04612588882446289, 0.047850608825683594, 0.0495753288269043, 0.051300048828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 11.0, 10.0, 13.0, 8.0, 10.0, 16.0, 18.0, 30.0, 33.0, 32.0, 40.0, 69.0, 56.0, 62.0, 62.0, 73.0, 73.0, 38.0, 61.0, 53.0, 31.0, 30.0, 36.0, 28.0, 21.0, 14.0, 12.0, 9.0, 8.0, 8.0, 3.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0203399658203125, -0.0197451114654541, -0.019150257110595703, -0.018555402755737305, -0.017960548400878906, -0.017365694046020508, -0.01677083969116211, -0.01617598533630371, -0.015581130981445312, -0.014986276626586914, -0.014391422271728516, -0.013796567916870117, -0.013201713562011719, -0.01260685920715332, -0.012012004852294922, -0.011417150497436523, -0.010822296142578125, -0.010227441787719727, -0.009632587432861328, -0.00903773307800293, -0.008442878723144531, -0.007848024368286133, -0.007253170013427734, -0.006658315658569336, -0.0060634613037109375, -0.005468606948852539, -0.004873752593994141, -0.004278898239135742, -0.0036840438842773438, -0.0030891895294189453, -0.002494335174560547, -0.0018994808197021484, -0.00130462646484375, -0.0007097721099853516, -0.00011491775512695312, 0.0004799365997314453, 0.0010747909545898438, 0.0016696453094482422, 0.0022644996643066406, 0.002859354019165039, 0.0034542083740234375, 0.004049062728881836, 0.004643917083740234, 0.005238771438598633, 0.005833625793457031, 0.00642848014831543, 0.007023334503173828, 0.0076181888580322266, 0.008213043212890625, 0.008807897567749023, 0.009402751922607422, 0.00999760627746582, 0.010592460632324219, 0.011187314987182617, 0.011782169342041016, 0.012377023696899414, 0.012971878051757812, 0.013566732406616211, 0.01416158676147461, 0.014756441116333008, 0.015351295471191406, 0.015946149826049805, 0.016541004180908203, 0.0171358585357666, 0.017730712890625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 6.0, 10.0, 23.0, 25.0, 23.0, 39.0, 43.0, 32.0, 41.0, 48.0, 37.0, 53.0, 67.0, 63.0, 44.0, 46.0, 50.0, 38.0, 49.0, 22.0, 37.0, 26.0, 33.0, 28.0, 17.0, 16.0, 12.0, 11.0, 6.0, 13.0, 5.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3567678928375244, -0.3444017469882965, -0.3320356011390686, -0.3196694552898407, -0.3073033094406128, -0.2949371635913849, -0.282571017742157, -0.2702048718929291, -0.25783872604370117, -0.24547258019447327, -0.23310643434524536, -0.22074028849601746, -0.20837414264678955, -0.19600799679756165, -0.18364185094833374, -0.17127570509910583, -0.15890955924987793, -0.14654341340065002, -0.13417726755142212, -0.12181112170219421, -0.10944497585296631, -0.0970788300037384, -0.0847126841545105, -0.07234653830528259, -0.05998039245605469, -0.04761424660682678, -0.03524810075759888, -0.02288195490837097, -0.010515809059143066, 0.0018503367900848389, 0.014216482639312744, 0.02658262848854065, 0.03894874453544617, 0.05131489038467407, 0.06368103623390198, 0.07604718208312988, 0.08841332793235779, 0.1007794737815857, 0.1131456196308136, 0.1255117654800415, 0.1378779113292694, 0.15024405717849731, 0.16261020302772522, 0.17497634887695312, 0.18734249472618103, 0.19970864057540894, 0.21207478642463684, 0.22444093227386475, 0.23680707812309265, 0.24917322397232056, 0.26153936982154846, 0.27390551567077637, 0.2862716615200043, 0.2986378073692322, 0.3110039532184601, 0.323370099067688, 0.3357362449169159, 0.3481023907661438, 0.3604685366153717, 0.3728346824645996, 0.3852008283138275, 0.3975669741630554, 0.4099331200122833, 0.42229926586151123, 0.43466541171073914]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 9.0, 9.0, 17.0, 13.0, 15.0, 18.0, 12.0, 25.0, 26.0, 22.0, 36.0, 28.0, 38.0, 39.0, 42.0, 48.0, 45.0, 41.0, 36.0, 45.0, 47.0, 41.0, 42.0, 35.0, 37.0, 38.0, 26.0, 20.0, 26.0, 19.0, 15.0, 13.0, 22.0, 11.0, 9.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37559691071510315, -0.3638674020767212, -0.35213789343833923, -0.3404083847999573, -0.3286789059638977, -0.31694939732551575, -0.3052198886871338, -0.29349038004875183, -0.2817608714103699, -0.2700313627719879, -0.25830185413360596, -0.2465723603963852, -0.23484285175800323, -0.22311334311962128, -0.2113838493824005, -0.19965434074401855, -0.1879248321056366, -0.17619532346725464, -0.16446581482887268, -0.15273632109165192, -0.14100681245326996, -0.129277303814888, -0.11754780262708664, -0.10581830143928528, -0.09408879280090332, -0.08235928416252136, -0.07062978297472, -0.05890027806162834, -0.04717077314853668, -0.03544126823544502, -0.023711763322353363, -0.011982262134552002, -0.00025278329849243164, 0.011476721614599228, 0.023206226527690887, 0.03493573144078255, 0.04666523635387421, 0.058394741266965866, 0.07012424618005753, 0.08185374736785889, 0.09358325600624084, 0.1053127646446228, 0.11704226583242416, 0.12877176702022552, 0.14050127565860748, 0.15223078429698944, 0.1639602780342102, 0.17568978667259216, 0.18741929531097412, 0.19914880394935608, 0.21087831258773804, 0.2226078063249588, 0.23433731496334076, 0.24606682360172272, 0.2577963173389435, 0.26952582597732544, 0.2812553346157074, 0.29298484325408936, 0.3047143518924713, 0.31644386053085327, 0.32817333936691284, 0.3399028480052948, 0.35163235664367676, 0.3633618652820587, 0.3750913739204407]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 6.0, 11.0, 7.0, 12.0, 17.0, 25.0, 48.0, 60.0, 91.0, 137.0, 204.0, 276.0, 442.0, 842.0, 1508.0, 2749.0, 5279.0, 9712.0, 18771.0, 36939.0, 81212.0, 221925.0, 375843.0, 164908.0, 64048.0, 30096.0, 15462.0, 8007.0, 4341.0, 2413.0, 1255.0, 744.0, 416.0, 236.0, 150.0, 108.0, 75.0, 47.0, 29.0, 23.0, 18.0, 15.0, 11.0, 10.0, 8.0, 1.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.509765625, -0.49297332763671875, -0.4761810302734375, -0.45938873291015625, -0.442596435546875, -0.42580413818359375, -0.4090118408203125, -0.39221954345703125, -0.37542724609375, -0.35863494873046875, -0.3418426513671875, -0.32505035400390625, -0.308258056640625, -0.29146575927734375, -0.2746734619140625, -0.25788116455078125, -0.2410888671875, -0.22429656982421875, -0.2075042724609375, -0.19071197509765625, -0.173919677734375, -0.15712738037109375, -0.1403350830078125, -0.12354278564453125, -0.10675048828125, -0.08995819091796875, -0.0731658935546875, -0.05637359619140625, -0.039581298828125, -0.02278900146484375, -0.0059967041015625, 0.01079559326171875, 0.027587890625, 0.04438018798828125, 0.0611724853515625, 0.07796478271484375, 0.094757080078125, 0.11154937744140625, 0.1283416748046875, 0.14513397216796875, 0.16192626953125, 0.17871856689453125, 0.1955108642578125, 0.21230316162109375, 0.229095458984375, 0.24588775634765625, 0.2626800537109375, 0.27947235107421875, 0.2962646484375, 0.31305694580078125, 0.3298492431640625, 0.34664154052734375, 0.363433837890625, 0.38022613525390625, 0.3970184326171875, 0.41381072998046875, 0.43060302734375, 0.44739532470703125, 0.4641876220703125, 0.48097991943359375, 0.497772216796875, 0.5145645141601562, 0.5313568115234375, 0.5481491088867188, 0.56494140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 8.0, 1.0, 7.0, 4.0, 14.0, 13.0, 9.0, 18.0, 21.0, 18.0, 24.0, 25.0, 24.0, 29.0, 25.0, 46.0, 39.0, 36.0, 43.0, 41.0, 46.0, 45.0, 40.0, 51.0, 43.0, 46.0, 43.0, 34.0, 20.0, 29.0, 27.0, 12.0, 25.0, 29.0, 10.0, 11.0, 19.0, 8.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6337890625, -0.6126861572265625, -0.591583251953125, -0.5704803466796875, -0.54937744140625, -0.5282745361328125, -0.507171630859375, -0.4860687255859375, -0.4649658203125, -0.4438629150390625, -0.422760009765625, -0.4016571044921875, -0.38055419921875, -0.3594512939453125, -0.338348388671875, -0.3172454833984375, -0.296142578125, -0.2750396728515625, -0.253936767578125, -0.2328338623046875, -0.21173095703125, -0.1906280517578125, -0.169525146484375, -0.1484222412109375, -0.1273193359375, -0.1062164306640625, -0.085113525390625, -0.0640106201171875, -0.04290771484375, -0.0218048095703125, -0.000701904296875, 0.0204010009765625, 0.04150390625, 0.0626068115234375, 0.083709716796875, 0.1048126220703125, 0.12591552734375, 0.1470184326171875, 0.168121337890625, 0.1892242431640625, 0.2103271484375, 0.2314300537109375, 0.252532958984375, 0.2736358642578125, 0.29473876953125, 0.3158416748046875, 0.336944580078125, 0.3580474853515625, 0.379150390625, 0.4002532958984375, 0.421356201171875, 0.4424591064453125, 0.46356201171875, 0.4846649169921875, 0.505767822265625, 0.5268707275390625, 0.5479736328125, 0.5690765380859375, 0.590179443359375, 0.6112823486328125, 0.63238525390625, 0.6534881591796875, 0.674591064453125, 0.6956939697265625, 0.716796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 20.0, 23.0, 34.0, 39.0, 55.0, 86.0, 117.0, 172.0, 246.0, 371.0, 633.0, 1173.0, 2175.0, 4408.0, 9898.0, 23919.0, 64609.0, 200282.0, 431732.0, 200440.0, 64891.0, 23925.0, 9668.0, 4479.0, 2137.0, 1187.0, 614.0, 381.0, 239.0, 164.0, 117.0, 79.0, 67.0, 43.0, 27.0, 25.0, 21.0, 9.0, 10.0, 7.0, 7.0, 5.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7412109375, -0.719085693359375, -0.69696044921875, -0.674835205078125, -0.6527099609375, -0.630584716796875, -0.60845947265625, -0.586334228515625, -0.564208984375, -0.542083740234375, -0.51995849609375, -0.497833251953125, -0.4757080078125, -0.453582763671875, -0.43145751953125, -0.409332275390625, -0.38720703125, -0.365081787109375, -0.34295654296875, -0.320831298828125, -0.2987060546875, -0.276580810546875, -0.25445556640625, -0.232330322265625, -0.210205078125, -0.188079833984375, -0.16595458984375, -0.143829345703125, -0.1217041015625, -0.099578857421875, -0.07745361328125, -0.055328369140625, -0.033203125, -0.011077880859375, 0.01104736328125, 0.033172607421875, 0.0552978515625, 0.077423095703125, 0.09954833984375, 0.121673583984375, 0.143798828125, 0.165924072265625, 0.18804931640625, 0.210174560546875, 0.2322998046875, 0.254425048828125, 0.27655029296875, 0.298675537109375, 0.32080078125, 0.342926025390625, 0.36505126953125, 0.387176513671875, 0.4093017578125, 0.431427001953125, 0.45355224609375, 0.475677490234375, 0.497802734375, 0.519927978515625, 0.54205322265625, 0.564178466796875, 0.5863037109375, 0.608428955078125, 0.63055419921875, 0.652679443359375, 0.6748046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 8.0, 7.0, 10.0, 13.0, 14.0, 17.0, 20.0, 24.0, 24.0, 25.0, 34.0, 34.0, 44.0, 43.0, 49.0, 42.0, 45.0, 52.0, 53.0, 55.0, 46.0, 51.0, 41.0, 22.0, 30.0, 25.0, 25.0, 23.0, 19.0, 19.0, 9.0, 16.0, 11.0, 8.0, 5.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6748886108398438, -0.6510467529296875, -0.6272048950195312, -0.603363037109375, -0.5795211791992188, -0.5556793212890625, -0.5318374633789062, -0.50799560546875, -0.48415374755859375, -0.4603118896484375, -0.43647003173828125, -0.412628173828125, -0.38878631591796875, -0.3649444580078125, -0.34110260009765625, -0.3172607421875, -0.29341888427734375, -0.2695770263671875, -0.24573516845703125, -0.221893310546875, -0.19805145263671875, -0.1742095947265625, -0.15036773681640625, -0.12652587890625, -0.10268402099609375, -0.0788421630859375, -0.05500030517578125, -0.031158447265625, -0.00731658935546875, 0.0165252685546875, 0.04036712646484375, 0.064208984375, 0.08805084228515625, 0.1118927001953125, 0.13573455810546875, 0.159576416015625, 0.18341827392578125, 0.2072601318359375, 0.23110198974609375, 0.25494384765625, 0.27878570556640625, 0.3026275634765625, 0.32646942138671875, 0.350311279296875, 0.37415313720703125, 0.3979949951171875, 0.42183685302734375, 0.4456787109375, 0.46952056884765625, 0.4933624267578125, 0.5172042846679688, 0.541046142578125, 0.5648880004882812, 0.5887298583984375, 0.6125717163085938, 0.63641357421875, 0.6602554321289062, 0.6840972900390625, 0.7079391479492188, 0.731781005859375, 0.7556228637695312, 0.7794647216796875, 0.8033065795898438, 0.8271484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 9.0, 6.0, 14.0, 16.0, 23.0, 38.0, 52.0, 70.0, 99.0, 109.0, 164.0, 259.0, 367.0, 488.0, 794.0, 1299.0, 2034.0, 3581.0, 6285.0, 11827.0, 24890.0, 57311.0, 147059.0, 341027.0, 263632.0, 103917.0, 41881.0, 18866.0, 9416.0, 5028.0, 2926.0, 1743.0, 1123.0, 719.0, 447.0, 329.0, 216.0, 136.0, 103.0, 67.0, 42.0, 42.0, 35.0, 16.0, 12.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.09649658203125, -0.09336566925048828, -0.09023475646972656, -0.08710384368896484, -0.08397293090820312, -0.0808420181274414, -0.07771110534667969, -0.07458019256591797, -0.07144927978515625, -0.06831836700439453, -0.06518745422363281, -0.062056541442871094, -0.058925628662109375, -0.055794715881347656, -0.05266380310058594, -0.04953289031982422, -0.0464019775390625, -0.04327106475830078, -0.04014015197753906, -0.037009239196777344, -0.033878326416015625, -0.030747413635253906, -0.027616500854492188, -0.02448558807373047, -0.02135467529296875, -0.01822376251220703, -0.015092849731445312, -0.011961936950683594, -0.008831024169921875, -0.005700111389160156, -0.0025691986083984375, 0.0005617141723632812, 0.003692626953125, 0.006823539733886719, 0.009954452514648438, 0.013085365295410156, 0.016216278076171875, 0.019347190856933594, 0.022478103637695312, 0.02560901641845703, 0.02873992919921875, 0.03187084197998047, 0.03500175476074219, 0.038132667541503906, 0.041263580322265625, 0.044394493103027344, 0.04752540588378906, 0.05065631866455078, 0.0537872314453125, 0.05691814422607422, 0.06004905700683594, 0.06317996978759766, 0.06631088256835938, 0.0694417953491211, 0.07257270812988281, 0.07570362091064453, 0.07883453369140625, 0.08196544647216797, 0.08509635925292969, 0.0882272720336914, 0.09135818481445312, 0.09448909759521484, 0.09762001037597656, 0.10075092315673828, 0.1038818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 15.0, 12.0, 7.0, 18.0, 32.0, 27.0, 39.0, 53.0, 70.0, 79.0, 99.0, 99.0, 83.0, 80.0, 69.0, 41.0, 30.0, 26.0, 23.0, 21.0, 9.0, 14.0, 7.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.36766242980957e-05, -3.269221633672714e-05, -3.170780837535858e-05, -3.072340041399002e-05, -2.973899245262146e-05, -2.87545844912529e-05, -2.777017652988434e-05, -2.6785768568515778e-05, -2.5801360607147217e-05, -2.4816952645778656e-05, -2.3832544684410095e-05, -2.2848136723041534e-05, -2.1863728761672974e-05, -2.0879320800304413e-05, -1.9894912838935852e-05, -1.891050487756729e-05, -1.792609691619873e-05, -1.694168895483017e-05, -1.595728099346161e-05, -1.4972873032093048e-05, -1.3988465070724487e-05, -1.3004057109355927e-05, -1.2019649147987366e-05, -1.1035241186618805e-05, -1.0050833225250244e-05, -9.066425263881683e-06, -8.082017302513123e-06, -7.097609341144562e-06, -6.113201379776001e-06, -5.12879341840744e-06, -4.144385457038879e-06, -3.1599774956703186e-06, -2.175569534301758e-06, -1.191161572933197e-06, -2.0675361156463623e-07, 7.776543498039246e-07, 1.7620623111724854e-06, 2.746470272541046e-06, 3.730878233909607e-06, 4.715286195278168e-06, 5.6996941566467285e-06, 6.684102118015289e-06, 7.66851007938385e-06, 8.652918040752411e-06, 9.637326002120972e-06, 1.0621733963489532e-05, 1.1606141924858093e-05, 1.2590549886226654e-05, 1.3574957847595215e-05, 1.4559365808963776e-05, 1.5543773770332336e-05, 1.6528181731700897e-05, 1.7512589693069458e-05, 1.849699765443802e-05, 1.948140561580658e-05, 2.046581357717514e-05, 2.14502215385437e-05, 2.2434629499912262e-05, 2.3419037461280823e-05, 2.4403445422649384e-05, 2.5387853384017944e-05, 2.6372261345386505e-05, 2.7356669306755066e-05, 2.8341077268123627e-05, 2.9325485229492188e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 1.0, 10.0, 4.0, 9.0, 9.0, 23.0, 20.0, 31.0, 32.0, 61.0, 95.0, 128.0, 155.0, 268.0, 444.0, 802.0, 1543.0, 3182.0, 8317.0, 26965.0, 132229.0, 658751.0, 167550.0, 30983.0, 9477.0, 3613.0, 1626.0, 861.0, 480.0, 273.0, 193.0, 116.0, 87.0, 60.0, 41.0, 20.0, 17.0, 16.0, 19.0, 19.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.299560546875, -0.2903594970703125, -0.281158447265625, -0.2719573974609375, -0.26275634765625, -0.2535552978515625, -0.244354248046875, -0.2351531982421875, -0.2259521484375, -0.2167510986328125, -0.207550048828125, -0.1983489990234375, -0.18914794921875, -0.1799468994140625, -0.170745849609375, -0.1615447998046875, -0.15234375, -0.1431427001953125, -0.133941650390625, -0.1247406005859375, -0.11553955078125, -0.1063385009765625, -0.097137451171875, -0.0879364013671875, -0.0787353515625, -0.0695343017578125, -0.060333251953125, -0.0511322021484375, -0.04193115234375, -0.0327301025390625, -0.023529052734375, -0.0143280029296875, -0.005126953125, 0.0040740966796875, 0.013275146484375, 0.0224761962890625, 0.03167724609375, 0.0408782958984375, 0.050079345703125, 0.0592803955078125, 0.0684814453125, 0.0776824951171875, 0.086883544921875, 0.0960845947265625, 0.10528564453125, 0.1144866943359375, 0.123687744140625, 0.1328887939453125, 0.14208984375, 0.1512908935546875, 0.160491943359375, 0.1696929931640625, 0.17889404296875, 0.1880950927734375, 0.197296142578125, 0.2064971923828125, 0.2156982421875, 0.2248992919921875, 0.234100341796875, 0.2433013916015625, 0.25250244140625, 0.2617034912109375, 0.270904541015625, 0.2801055908203125, 0.289306640625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 2.0, 5.0, 11.0, 11.0, 12.0, 29.0, 64.0, 98.0, 126.0, 139.0, 130.0, 133.0, 72.0, 51.0, 42.0, 23.0, 15.0, 8.0, 15.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1343994140625, -0.129241943359375, -0.12408447265625, -0.118927001953125, -0.11376953125, -0.108612060546875, -0.10345458984375, -0.098297119140625, -0.0931396484375, -0.087982177734375, -0.08282470703125, -0.077667236328125, -0.072509765625, -0.067352294921875, -0.06219482421875, -0.057037353515625, -0.0518798828125, -0.046722412109375, -0.04156494140625, -0.036407470703125, -0.03125, -0.026092529296875, -0.02093505859375, -0.015777587890625, -0.0106201171875, -0.005462646484375, -0.00030517578125, 0.004852294921875, 0.010009765625, 0.015167236328125, 0.02032470703125, 0.025482177734375, 0.0306396484375, 0.035797119140625, 0.04095458984375, 0.046112060546875, 0.05126953125, 0.056427001953125, 0.06158447265625, 0.066741943359375, 0.0718994140625, 0.077056884765625, 0.08221435546875, 0.087371826171875, 0.092529296875, 0.097686767578125, 0.10284423828125, 0.108001708984375, 0.1131591796875, 0.118316650390625, 0.12347412109375, 0.128631591796875, 0.1337890625, 0.138946533203125, 0.14410400390625, 0.149261474609375, 0.1544189453125, 0.159576416015625, 0.16473388671875, 0.169891357421875, 0.175048828125, 0.180206298828125, 0.18536376953125, 0.190521240234375, 0.1956787109375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 12.0, 14.0, 24.0, 44.0, 59.0, 85.0, 75.0, 113.0, 109.0, 101.0, 80.0, 82.0, 60.0, 34.0, 32.0, 23.0, 17.0, 5.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.334603190422058, -1.2885206937789917, -1.2424380779266357, -1.1963555812835693, -1.1502729654312134, -1.104190468788147, -1.058107852935791, -1.0120253562927246, -0.9659427404403687, -0.9198601841926575, -0.8737776279449463, -0.8276950716972351, -0.7816125154495239, -0.7355299592018127, -0.6894474029541016, -0.6433649063110352, -0.597282350063324, -0.5511997938156128, -0.5051172375679016, -0.45903468132019043, -0.41295212507247925, -0.36686956882476807, -0.3207870423793793, -0.2747044861316681, -0.2286219298839569, -0.18253937363624573, -0.13645681738853455, -0.09037427604198456, -0.044291719794273376, 0.0017908364534378052, 0.04787337779998779, 0.09395593404769897, 0.14003849029541016, 0.18612104654312134, 0.23220360279083252, 0.2782861590385437, 0.3243687152862549, 0.37045127153396606, 0.41653379797935486, 0.46261635422706604, 0.5086989402770996, 0.5547814965248108, 0.600864052772522, 0.6469466090202332, 0.6930291652679443, 0.7391117215156555, 0.7851942777633667, 0.8312767744064331, 0.8773593306541443, 0.9234418869018555, 0.9695244431495667, 1.0156069993972778, 1.0616894960403442, 1.1077721118927002, 1.1538546085357666, 1.1999372243881226, 1.246019721031189, 1.2921022176742554, 1.3381848335266113, 1.3842673301696777, 1.4303499460220337, 1.4764324426651, 1.522515058517456, 1.5685975551605225, 1.6146801710128784]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 12.0, 3.0, 6.0, 10.0, 11.0, 25.0, 19.0, 23.0, 20.0, 38.0, 20.0, 27.0, 35.0, 35.0, 35.0, 32.0, 46.0, 45.0, 45.0, 46.0, 45.0, 34.0, 47.0, 38.0, 43.0, 29.0, 39.0, 27.0, 26.0, 15.0, 18.0, 21.0, 15.0, 23.0, 8.0, 6.0, 15.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0049383640289307, -0.9675004482269287, -0.9300625920295715, -0.8926246762275696, -0.8551868200302124, -0.8177489042282104, -0.7803109884262085, -0.7428730726242065, -0.7054352164268494, -0.6679973006248474, -0.6305594444274902, -0.5931215286254883, -0.5556836128234863, -0.5182457566261292, -0.4808078408241272, -0.44336995482444763, -0.40593206882476807, -0.3684941828250885, -0.33105629682540894, -0.293618381023407, -0.2561804950237274, -0.21874260902404785, -0.1813047081232071, -0.14386680722236633, -0.10642892122268677, -0.0689910277724266, -0.03155313432216644, 0.0058847591280937195, 0.04332265257835388, 0.08076053857803345, 0.1181984394788742, 0.15563634037971497, 0.19307422637939453, 0.2305121123790741, 0.26794999837875366, 0.3053879141807556, 0.3428258001804352, 0.38026368618011475, 0.4177016019821167, 0.45513948798179626, 0.49257737398147583, 0.5300152897834778, 0.567453145980835, 0.6048910617828369, 0.6423289775848389, 0.679766833782196, 0.717204749584198, 0.7546426057815552, 0.7920805215835571, 0.8295184373855591, 0.8669562935829163, 0.9043942093849182, 0.9418320655822754, 0.9792699813842773, 1.0167078971862793, 1.0541458129882812, 1.0915837287902832, 1.1290216445922852, 1.166459560394287, 1.2038973569869995, 1.2413352727890015, 1.2787731885910034, 1.3162111043930054, 1.3536490201950073, 1.3910868167877197]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 15.0, 14.0, 18.0, 18.0, 25.0, 37.0, 50.0, 66.0, 78.0, 96.0, 132.0, 151.0, 175.0, 209.0, 284.0, 288.0, 377.0, 476.0, 553.0, 733.0, 932.0, 1300.0, 1039761.0, 996.0, 739.0, 522.0, 440.0, 398.0, 316.0, 273.0, 229.0, 177.0, 133.0, 129.0, 106.0, 72.0, 61.0, 57.0, 37.0, 28.0, 31.0, 21.0, 17.0, 6.0, 11.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2057493925094604, -1.1642473936080933, -1.1227455139160156, -1.0812435150146484, -1.0397415161132812, -0.9982396364212036, -0.9567376375198364, -0.915235698223114, -0.8737337589263916, -0.8322318196296692, -0.7907298803329468, -0.7492278814315796, -0.7077259421348572, -0.6662240028381348, -0.6247220039367676, -0.5832200646400452, -0.5417181253433228, -0.5002161860466003, -0.45871421694755554, -0.41721224784851074, -0.37571030855178833, -0.3342083692550659, -0.2927064001560211, -0.2512044310569763, -0.2097024917602539, -0.1682005375623703, -0.1266985833644867, -0.08519662916660309, -0.04369467496871948, -0.0021927207708358765, 0.03930923342704773, 0.08081120252609253, 0.12231326103210449, 0.1638152152299881, 0.2053171694278717, 0.2468191236257553, 0.2883210778236389, 0.32982301712036133, 0.37132498621940613, 0.4128269553184509, 0.45432889461517334, 0.49583083391189575, 0.5373327732086182, 0.5788347721099854, 0.6203367114067078, 0.6618386507034302, 0.7033406496047974, 0.7448425889015198, 0.7863445281982422, 0.8278464674949646, 0.869348406791687, 0.9108504056930542, 0.9523523449897766, 0.993854284286499, 1.0353562831878662, 1.0768582820892334, 1.118360161781311, 1.1598621606826782, 1.2013640403747559, 1.242866039276123, 1.2843680381774902, 1.3258699178695679, 1.367371916770935, 1.4088737964630127, 1.4503757953643799]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 14.0, 14.0, 22.0, 22.0, 42.0, 127.0, 302.0, 868.0, 2666.0, 9021.0, 51408944.0, 37870.0, 7559.0, 2524.0, 842.0, 279.0, 99.0, 49.0, 34.0, 13.0, 7.0, 8.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.55303955078125, -9.197623252868652, -8.842206954956055, -8.486791610717773, -8.131375312805176, -7.775959014892578, -7.420543193817139, -7.065127372741699, -6.709711074829102, -6.354294776916504, -5.9988789558410645, -5.643463134765625, -5.288046836853027, -4.93263053894043, -4.57721471786499, -4.221798896789551, -3.866382598876953, -3.5109665393829346, -3.155550479888916, -2.8001344203948975, -2.444718360900879, -2.0893023014068604, -1.7338862419128418, -1.3784701824188232, -1.0230541229248047, -0.6676380634307861, -0.3122220039367676, 0.04319405555725098, 0.39861011505126953, 0.7540261745452881, 1.1094422340393066, 1.4648582935333252, 1.8202743530273438, 2.1756904125213623, 2.531106472015381, 2.8865225315093994, 3.241938591003418, 3.5973546504974365, 3.952770709991455, 4.3081865310668945, 4.663602828979492, 5.01901912689209, 5.374434947967529, 5.729850769042969, 6.085267066955566, 6.440683364868164, 6.7960991859436035, 7.151515007019043, 7.506931304931641, 7.862347602844238, 8.217763900756836, 8.573179244995117, 8.928595542907715, 9.284011840820312, 9.639427185058594, 9.994843482971191, 10.350259780883789, 10.705676078796387, 11.061092376708984, 11.416507720947266, 11.771924018859863, 12.127340316772461, 12.482755661010742, 12.83817195892334, 13.193588256835938]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 17.0, 14.0, 21.0, 49.0, 66.0, 115.0, 170.0, 232.0, 368.0, 582.0, 899.0, 1450.0, 2280.0, 3798.0, 6144.0, 9954.0, 15841.0, 25818.0, 41834.0, 65299.0, 100480.0, 147505.0, 208603.0, 276450.0, 378769.0, 2079189.0, 1690914.0, 359471.0, 269230.0, 200362.0, 143228.0, 96825.0, 62038.0, 39117.0, 24465.0, 14980.0, 9528.0, 5728.0, 3550.0, 2231.0, 1365.0, 865.0, 556.0, 352.0, 231.0, 146.0, 106.0, 64.0, 45.0, 27.0, 28.0, 20.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.890625, -0.8627471923828125, -0.834869384765625, -0.8069915771484375, -0.77911376953125, -0.7512359619140625, -0.723358154296875, -0.6954803466796875, -0.6676025390625, -0.6397247314453125, -0.611846923828125, -0.5839691162109375, -0.55609130859375, -0.5282135009765625, -0.500335693359375, -0.4724578857421875, -0.444580078125, -0.4167022705078125, -0.388824462890625, -0.3609466552734375, -0.33306884765625, -0.3051910400390625, -0.277313232421875, -0.2494354248046875, -0.2215576171875, -0.1936798095703125, -0.165802001953125, -0.1379241943359375, -0.11004638671875, -0.0821685791015625, -0.054290771484375, -0.0264129638671875, 0.00146484375, 0.0293426513671875, 0.057220458984375, 0.0850982666015625, 0.11297607421875, 0.1408538818359375, 0.168731689453125, 0.1966094970703125, 0.2244873046875, 0.2523651123046875, 0.280242919921875, 0.3081207275390625, 0.33599853515625, 0.3638763427734375, 0.391754150390625, 0.4196319580078125, 0.447509765625, 0.4753875732421875, 0.503265380859375, 0.5311431884765625, 0.55902099609375, 0.5868988037109375, 0.614776611328125, 0.6426544189453125, 0.6705322265625, 0.6984100341796875, 0.726287841796875, 0.7541656494140625, 0.78204345703125, 0.8099212646484375, 0.837799072265625, 0.8656768798828125, 0.8935546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 8.0, 4.0, 11.0, 15.0, 16.0, 15.0, 22.0, 25.0, 23.0, 30.0, 27.0, 30.0, 31.0, 35.0, 33.0, 48.0, 43.0, 189.0, 832.0, 128.0, 51.0, 41.0, 50.0, 18.0, 43.0, 20.0, 30.0, 36.0, 35.0, 16.0, 21.0, 17.0, 16.0, 10.0, 13.0, 10.0, 6.0, 3.0, 2.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.73394775390625, -6.5264892578125, -6.31903076171875, -6.111572265625, -5.90411376953125, -5.6966552734375, -5.48919677734375, -5.28173828125, -5.07427978515625, -4.8668212890625, -4.65936279296875, -4.451904296875, -4.24444580078125, -4.0369873046875, -3.82952880859375, -3.6220703125, -3.41461181640625, -3.2071533203125, -2.99969482421875, -2.792236328125, -2.58477783203125, -2.3773193359375, -2.16986083984375, -1.96240234375, -1.75494384765625, -1.5474853515625, -1.34002685546875, -1.132568359375, -0.92510986328125, -0.7176513671875, -0.51019287109375, -0.302734375, -0.09527587890625, 0.1121826171875, 0.31964111328125, 0.527099609375, 0.73455810546875, 0.9420166015625, 1.14947509765625, 1.35693359375, 1.56439208984375, 1.7718505859375, 1.97930908203125, 2.186767578125, 2.39422607421875, 2.6016845703125, 2.80914306640625, 3.0166015625, 3.22406005859375, 3.4315185546875, 3.63897705078125, 3.846435546875, 4.05389404296875, 4.2613525390625, 4.46881103515625, 4.67626953125, 4.88372802734375, 5.0911865234375, 5.29864501953125, 5.506103515625, 5.71356201171875, 5.9210205078125, 6.12847900390625, 6.3359375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 30.0, 58.0, 96.0, 161.0, 241.0, 443.0, 591.0, 1075.0, 1749.0, 2974.0, 4680.0, 7437.0, 12000.0, 18663.0, 28855.0, 43203.0, 62772.0, 88461.0, 120951.0, 158691.0, 198718.0, 238872.0, 323125.0, 1506428.0, 2031334.0, 391971.0, 248195.0, 208364.0, 167579.0, 128296.0, 94789.0, 67990.0, 46351.0, 31339.0, 20587.0, 13064.0, 8236.0, 5123.0, 3116.0, 1878.0, 1160.0, 721.0, 426.0, 243.0, 160.0, 80.0, 58.0, 44.0, 19.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.5211563110351562, -0.5032501220703125, -0.48534393310546875, -0.467437744140625, -0.44953155517578125, -0.4316253662109375, -0.41371917724609375, -0.39581298828125, -0.37790679931640625, -0.3600006103515625, -0.34209442138671875, -0.324188232421875, -0.30628204345703125, -0.2883758544921875, -0.27046966552734375, -0.2525634765625, -0.23465728759765625, -0.2167510986328125, -0.19884490966796875, -0.180938720703125, -0.16303253173828125, -0.1451263427734375, -0.12722015380859375, -0.10931396484375, -0.09140777587890625, -0.0735015869140625, -0.05559539794921875, -0.037689208984375, -0.01978302001953125, -0.0018768310546875, 0.01602935791015625, 0.033935546875, 0.05184173583984375, 0.0697479248046875, 0.08765411376953125, 0.105560302734375, 0.12346649169921875, 0.1413726806640625, 0.15927886962890625, 0.17718505859375, 0.19509124755859375, 0.2129974365234375, 0.23090362548828125, 0.248809814453125, 0.26671600341796875, 0.2846221923828125, 0.30252838134765625, 0.3204345703125, 0.33834075927734375, 0.3562469482421875, 0.37415313720703125, 0.392059326171875, 0.40996551513671875, 0.4278717041015625, 0.44577789306640625, 0.46368408203125, 0.48159027099609375, 0.4994964599609375, 0.5174026489257812, 0.535308837890625, 0.5532150268554688, 0.5711212158203125, 0.5890274047851562, 0.60693359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 8.0, 7.0, 10.0, 7.0, 15.0, 19.0, 26.0, 20.0, 31.0, 33.0, 36.0, 39.0, 41.0, 46.0, 37.0, 50.0, 251.0, 825.0, 108.0, 53.0, 43.0, 42.0, 51.0, 41.0, 28.0, 31.0, 32.0, 21.0, 21.0, 17.0, 11.0, 8.0, 6.0, 4.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.90899658203125, -4.7359619140625, -4.56292724609375, -4.389892578125, -4.21685791015625, -4.0438232421875, -3.87078857421875, -3.69775390625, -3.52471923828125, -3.3516845703125, -3.17864990234375, -3.005615234375, -2.83258056640625, -2.6595458984375, -2.48651123046875, -2.3134765625, -2.14044189453125, -1.9674072265625, -1.79437255859375, -1.621337890625, -1.44830322265625, -1.2752685546875, -1.10223388671875, -0.92919921875, -0.75616455078125, -0.5831298828125, -0.41009521484375, -0.237060546875, -0.06402587890625, 0.1090087890625, 0.28204345703125, 0.455078125, 0.62811279296875, 0.8011474609375, 0.97418212890625, 1.147216796875, 1.32025146484375, 1.4932861328125, 1.66632080078125, 1.83935546875, 2.01239013671875, 2.1854248046875, 2.35845947265625, 2.531494140625, 2.70452880859375, 2.8775634765625, 3.05059814453125, 3.2236328125, 3.39666748046875, 3.5697021484375, 3.74273681640625, 3.915771484375, 4.08880615234375, 4.2618408203125, 4.43487548828125, 4.60791015625, 4.78094482421875, 4.9539794921875, 5.12701416015625, 5.300048828125, 5.47308349609375, 5.6461181640625, 5.81915283203125, 5.9921875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 18.0, 29.0, 22.0, 48.0, 61.0, 88.0, 94.0, 143.0, 174.0, 213.0, 308.0, 377.0, 549.0, 803.0, 1175.0, 1902.0, 3712.0, 8208.0, 20655.0, 55281.0, 144832.0, 329701.0, 614494.0, 3831153.0, 661069.0, 354890.0, 158285.0, 61118.0, 23057.0, 8821.0, 4008.0, 2006.0, 1200.0, 776.0, 527.0, 439.0, 310.0, 229.0, 161.0, 125.0, 86.0, 66.0, 54.0, 41.0, 30.0, 27.0, 18.0, 12.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.3330078125, -1.29327392578125, -1.2535400390625, -1.21380615234375, -1.174072265625, -1.13433837890625, -1.0946044921875, -1.05487060546875, -1.01513671875, -0.97540283203125, -0.9356689453125, -0.89593505859375, -0.856201171875, -0.81646728515625, -0.7767333984375, -0.73699951171875, -0.697265625, -0.65753173828125, -0.6177978515625, -0.57806396484375, -0.538330078125, -0.49859619140625, -0.4588623046875, -0.41912841796875, -0.37939453125, -0.33966064453125, -0.2999267578125, -0.26019287109375, -0.220458984375, -0.18072509765625, -0.1409912109375, -0.10125732421875, -0.0615234375, -0.02178955078125, 0.0179443359375, 0.05767822265625, 0.097412109375, 0.13714599609375, 0.1768798828125, 0.21661376953125, 0.25634765625, 0.29608154296875, 0.3358154296875, 0.37554931640625, 0.415283203125, 0.45501708984375, 0.4947509765625, 0.53448486328125, 0.57421875, 0.61395263671875, 0.6536865234375, 0.69342041015625, 0.733154296875, 0.77288818359375, 0.8126220703125, 0.85235595703125, 0.89208984375, 0.93182373046875, 0.9715576171875, 1.01129150390625, 1.051025390625, 1.09075927734375, 1.1304931640625, 1.17022705078125, 1.2099609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 11.0, 6.0, 16.0, 12.0, 15.0, 21.0, 25.0, 28.0, 29.0, 36.0, 35.0, 28.0, 31.0, 32.0, 43.0, 48.0, 179.0, 711.0, 237.0, 56.0, 39.0, 41.0, 46.0, 49.0, 36.0, 29.0, 25.0, 24.0, 25.0, 17.0, 14.0, 16.0, 13.0, 9.0, 8.0, 8.0, 4.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.5859375, -3.475860595703125, -3.36578369140625, -3.255706787109375, -3.1456298828125, -3.035552978515625, -2.92547607421875, -2.815399169921875, -2.705322265625, -2.595245361328125, -2.48516845703125, -2.375091552734375, -2.2650146484375, -2.154937744140625, -2.04486083984375, -1.934783935546875, -1.82470703125, -1.714630126953125, -1.60455322265625, -1.494476318359375, -1.3843994140625, -1.274322509765625, -1.16424560546875, -1.054168701171875, -0.944091796875, -0.834014892578125, -0.72393798828125, -0.613861083984375, -0.5037841796875, -0.393707275390625, -0.28363037109375, -0.173553466796875, -0.0634765625, 0.046600341796875, 0.15667724609375, 0.266754150390625, 0.3768310546875, 0.486907958984375, 0.59698486328125, 0.707061767578125, 0.817138671875, 0.927215576171875, 1.03729248046875, 1.147369384765625, 1.2574462890625, 1.367523193359375, 1.47760009765625, 1.587677001953125, 1.69775390625, 1.807830810546875, 1.91790771484375, 2.027984619140625, 2.1380615234375, 2.248138427734375, 2.35821533203125, 2.468292236328125, 2.578369140625, 2.688446044921875, 2.79852294921875, 2.908599853515625, 3.0186767578125, 3.128753662109375, 3.23883056640625, 3.348907470703125, 3.458984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 12.0, 21.0, 31.0, 49.0, 65.0, 131.0, 158.0, 160.0, 148.0, 94.0, 60.0, 30.0, 17.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-14.953716278076172, -14.661749839782715, -14.369783401489258, -14.077817916870117, -13.78585147857666, -13.493885040283203, -13.201918601989746, -12.909952163696289, -12.617986679077148, -12.326020240783691, -12.034053802490234, -11.742088317871094, -11.450121879577637, -11.15815544128418, -10.866189002990723, -10.574222564697266, -10.282257080078125, -9.990290641784668, -9.698324203491211, -9.40635871887207, -9.114392280578613, -8.822425842285156, -8.5304594039917, -8.238492965698242, -7.946526527404785, -7.654560089111328, -7.362594127655029, -7.070627689361572, -6.778661727905273, -6.486695289611816, -6.194728851318359, -5.9027628898620605, -5.61079740524292, -5.318830966949463, -5.026865005493164, -4.734898567199707, -4.442932605743408, -4.150966167449951, -3.8589999675750732, -3.5670337677001953, -3.2750675678253174, -2.9831013679504395, -2.6911351680755615, -2.3991689682006836, -2.1072025299072266, -1.8152364492416382, -1.5232701301574707, -1.2313039302825928, -0.9393377304077148, -0.6473715305328369, -0.3554052710533142, -0.0634390115737915, 0.22852718830108643, 0.5204933881759644, 0.8124597072601318, 1.1044259071350098, 1.3963921070098877, 1.6883583068847656, 1.9803245067596436, 2.2722907066345215, 2.5642571449279785, 2.8562231063842773, 3.1481895446777344, 3.4401557445526123, 3.7321219444274902]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 3.0, 7.0, 7.0, 14.0, 13.0, 10.0, 23.0, 19.0, 23.0, 29.0, 29.0, 40.0, 37.0, 41.0, 42.0, 62.0, 42.0, 61.0, 47.0, 39.0, 41.0, 46.0, 37.0, 26.0, 27.0, 34.0, 35.0, 20.0, 25.0, 27.0, 24.0, 14.0, 15.0, 6.0, 5.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74615478515625, -6.553769588470459, -6.36138391494751, -6.168998718261719, -5.9766130447387695, -5.7842278480529785, -5.5918426513671875, -5.399456977844238, -5.207071781158447, -5.014686584472656, -4.822300910949707, -4.629915714263916, -4.437530517578125, -4.245144844055176, -4.052759647369385, -3.8603742122650146, -3.6679887771606445, -3.4756033420562744, -3.2832179069519043, -3.0908327102661133, -2.898447275161743, -2.706061840057373, -2.513676643371582, -2.321291208267212, -2.128905773162842, -1.9365203380584717, -1.7441350221633911, -1.5517497062683105, -1.3593642711639404, -1.1669788360595703, -0.9745935201644897, -0.7822082042694092, -0.5898227691650391, -0.3974373936653137, -0.20505201816558838, -0.012666642665863037, 0.1797187328338623, 0.37210410833358765, 0.564489483833313, 0.7568747997283936, 0.9492602348327637, 1.1416456699371338, 1.3340309858322144, 1.526416301727295, 1.718801736831665, 1.9111871719360352, 2.103572368621826, 2.2959578037261963, 2.4883432388305664, 2.6807286739349365, 2.8731141090393066, 3.0654993057250977, 3.2578847408294678, 3.450270175933838, 3.642655372619629, 3.835040807723999, 4.027426242828369, 4.21981143951416, 4.412197113037109, 4.6045823097229, 4.796967506408691, 4.989353179931641, 5.181738376617432, 5.374123573303223, 5.566509246826172]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 14.0, 13.0, 28.0, 34.0, 74.0, 110.0, 175.0, 291.0, 512.0, 866.0, 1751.0, 4437.0, 11706.0, 37141.0, 393429.0, 3264917.0, 414782.0, 42178.0, 13260.0, 5084.0, 1973.0, 749.0, 330.0, 184.0, 78.0, 47.0, 32.0, 23.0, 16.0, 15.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34130859375, -0.3322105407714844, -0.32311248779296875, -0.3140144348144531, -0.3049163818359375, -0.2958183288574219, -0.28672027587890625, -0.2776222229003906, -0.268524169921875, -0.2594261169433594, -0.25032806396484375, -0.24123001098632812, -0.2321319580078125, -0.22303390502929688, -0.21393585205078125, -0.20483779907226562, -0.19573974609375, -0.18664169311523438, -0.17754364013671875, -0.16844558715820312, -0.1593475341796875, -0.15024948120117188, -0.14115142822265625, -0.13205337524414062, -0.122955322265625, -0.11385726928710938, -0.10475921630859375, -0.09566116333007812, -0.0865631103515625, -0.07746505737304688, -0.06836700439453125, -0.059268951416015625, -0.0501708984375, -0.041072845458984375, -0.03197479248046875, -0.022876739501953125, -0.0137786865234375, -0.004680633544921875, 0.00441741943359375, 0.013515472412109375, 0.022613525390625, 0.031711578369140625, 0.04080963134765625, 0.049907684326171875, 0.0590057373046875, 0.06810379028320312, 0.07720184326171875, 0.08629989624023438, 0.09539794921875, 0.10449600219726562, 0.11359405517578125, 0.12269210815429688, 0.1317901611328125, 0.14088821411132812, 0.14998626708984375, 0.15908432006835938, 0.168182373046875, 0.17728042602539062, 0.18637847900390625, 0.19547653198242188, 0.2045745849609375, 0.21367263793945312, 0.22277069091796875, 0.23186874389648438, 0.240966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 12.0, 7.0, 11.0, 6.0, 14.0, 23.0, 22.0, 25.0, 26.0, 45.0, 49.0, 45.0, 74.0, 59.0, 68.0, 72.0, 50.0, 51.0, 39.0, 44.0, 42.0, 37.0, 34.0, 16.0, 23.0, 22.0, 11.0, 21.0, 10.0, 7.0, 12.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12383174896240234, -0.12022209167480469, -0.11661243438720703, -0.11300277709960938, -0.10939311981201172, -0.10578346252441406, -0.1021738052368164, -0.09856414794921875, -0.0949544906616211, -0.09134483337402344, -0.08773517608642578, -0.08412551879882812, -0.08051586151123047, -0.07690620422363281, -0.07329654693603516, -0.0696868896484375, -0.06607723236083984, -0.06246757507324219, -0.05885791778564453, -0.055248260498046875, -0.05163860321044922, -0.04802894592285156, -0.044419288635253906, -0.04080963134765625, -0.037199974060058594, -0.03359031677246094, -0.02998065948486328, -0.026371002197265625, -0.02276134490966797, -0.019151687622070312, -0.015542030334472656, -0.011932373046875, -0.008322715759277344, -0.0047130584716796875, -0.0011034011840820312, 0.002506256103515625, 0.006115913391113281, 0.009725570678710938, 0.013335227966308594, 0.01694488525390625, 0.020554542541503906, 0.024164199829101562, 0.02777385711669922, 0.031383514404296875, 0.03499317169189453, 0.03860282897949219, 0.042212486267089844, 0.0458221435546875, 0.049431800842285156, 0.05304145812988281, 0.05665111541748047, 0.060260772705078125, 0.06387042999267578, 0.06748008728027344, 0.0710897445678711, 0.07469940185546875, 0.0783090591430664, 0.08191871643066406, 0.08552837371826172, 0.08913803100585938, 0.09274768829345703, 0.09635734558105469, 0.09996700286865234, 0.10357666015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 6.0, 18.0, 12.0, 16.0, 22.0, 19.0, 44.0, 47.0, 99.0, 139.0, 266.0, 527.0, 1517.0, 5068.0, 21882.0, 151318.0, 1854339.0, 1964621.0, 162985.0, 23060.0, 5335.0, 1675.0, 615.0, 251.0, 109.0, 78.0, 44.0, 28.0, 27.0, 25.0, 15.0, 10.0, 8.0, 6.0, 7.0, 1.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1749267578125, -0.16928672790527344, -0.16364669799804688, -0.1580066680908203, -0.15236663818359375, -0.1467266082763672, -0.14108657836914062, -0.13544654846191406, -0.1298065185546875, -0.12416648864746094, -0.11852645874023438, -0.11288642883300781, -0.10724639892578125, -0.10160636901855469, -0.09596633911132812, -0.09032630920410156, -0.084686279296875, -0.07904624938964844, -0.07340621948242188, -0.06776618957519531, -0.06212615966796875, -0.05648612976074219, -0.050846099853515625, -0.04520606994628906, -0.0395660400390625, -0.03392601013183594, -0.028285980224609375, -0.022645950317382812, -0.01700592041015625, -0.011365890502929688, -0.005725860595703125, -8.58306884765625e-05, 0.00555419921875, 0.011194229125976562, 0.016834259033203125, 0.022474288940429688, 0.02811431884765625, 0.03375434875488281, 0.039394378662109375, 0.04503440856933594, 0.0506744384765625, 0.05631446838378906, 0.061954498291015625, 0.06759452819824219, 0.07323455810546875, 0.07887458801269531, 0.08451461791992188, 0.09015464782714844, 0.095794677734375, 0.10143470764160156, 0.10707473754882812, 0.11271476745605469, 0.11835479736328125, 0.12399482727050781, 0.12963485717773438, 0.13527488708496094, 0.1409149169921875, 0.14655494689941406, 0.15219497680664062, 0.1578350067138672, 0.16347503662109375, 0.1691150665283203, 0.17475509643554688, 0.18039512634277344, 0.18603515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 4.0, 1.0, 9.0, 3.0, 8.0, 26.0, 27.0, 33.0, 47.0, 73.0, 100.0, 149.0, 258.0, 332.0, 459.0, 550.0, 557.0, 408.0, 347.0, 231.0, 146.0, 80.0, 72.0, 43.0, 26.0, 20.0, 18.0, 12.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1431884765625, -0.1395092010498047, -0.13582992553710938, -0.13215065002441406, -0.12847137451171875, -0.12479209899902344, -0.12111282348632812, -0.11743354797363281, -0.1137542724609375, -0.11007499694824219, -0.10639572143554688, -0.10271644592285156, -0.09903717041015625, -0.09535789489746094, -0.09167861938476562, -0.08799934387207031, -0.084320068359375, -0.08064079284667969, -0.07696151733398438, -0.07328224182128906, -0.06960296630859375, -0.06592369079589844, -0.062244415283203125, -0.05856513977050781, -0.0548858642578125, -0.05120658874511719, -0.047527313232421875, -0.04384803771972656, -0.04016876220703125, -0.03648948669433594, -0.032810211181640625, -0.029130935668945312, -0.02545166015625, -0.021772384643554688, -0.018093109130859375, -0.014413833618164062, -0.01073455810546875, -0.0070552825927734375, -0.003376007080078125, 0.0003032684326171875, 0.0039825439453125, 0.0076618194580078125, 0.011341094970703125, 0.015020370483398438, 0.01869964599609375, 0.022378921508789062, 0.026058197021484375, 0.029737472534179688, 0.033416748046875, 0.03709602355957031, 0.040775299072265625, 0.04445457458496094, 0.04813385009765625, 0.05181312561035156, 0.055492401123046875, 0.05917167663574219, 0.0628509521484375, 0.06653022766113281, 0.07020950317382812, 0.07388877868652344, 0.07756805419921875, 0.08124732971191406, 0.08492660522460938, 0.08860588073730469, 0.09228515625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 13.0, 27.0, 54.0, 97.0, 124.0, 155.0, 164.0, 142.0, 90.0, 64.0, 41.0, 15.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.9826609492301941, -0.9622719287872314, -0.9418829083442688, -0.9214938879013062, -0.9011048674583435, -0.8807158470153809, -0.860326886177063, -0.8399378657341003, -0.8195488452911377, -0.799159824848175, -0.7787708044052124, -0.7583817839622498, -0.7379927635192871, -0.7176038026809692, -0.6972147226333618, -0.676825761795044, -0.6564366817474365, -0.6360476613044739, -0.6156586408615112, -0.5952696204185486, -0.5748805999755859, -0.5544916391372681, -0.5341025590896606, -0.5137135982513428, -0.4933245778083801, -0.4729355573654175, -0.45254653692245483, -0.4321575164794922, -0.41176852583885193, -0.3913795053958893, -0.37099048495292664, -0.3506014943122864, -0.33021244406700134, -0.3098234236240387, -0.28943440318107605, -0.2690454125404358, -0.24865639209747314, -0.2282673716545105, -0.20787835121154785, -0.1874893456697464, -0.16710032522678375, -0.1467113047838211, -0.12632229924201965, -0.105933278799057, -0.08554426580667496, -0.06515525281429291, -0.04476623237133026, -0.02437722682952881, -0.003988206386566162, 0.016400808468461037, 0.036789823323488235, 0.057178840041160583, 0.07756785303354263, 0.09795686602592468, 0.11834588646888733, 0.13873489201068878, 0.15912391245365143, 0.17951293289661407, 0.19990193843841553, 0.22029095888137817, 0.24067997932434082, 0.26106899976730347, 0.2814580202102661, 0.30184701085090637, 0.322236031293869]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 6.0, 10.0, 6.0, 4.0, 8.0, 16.0, 12.0, 17.0, 22.0, 21.0, 25.0, 28.0, 30.0, 30.0, 31.0, 35.0, 34.0, 46.0, 51.0, 46.0, 38.0, 44.0, 35.0, 39.0, 40.0, 39.0, 30.0, 33.0, 13.0, 24.0, 27.0, 21.0, 23.0, 14.0, 10.0, 12.0, 15.0, 12.0, 10.0, 9.0, 10.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22161346673965454, -0.2146337479352951, -0.20765402913093567, -0.20067429542541504, -0.1936945766210556, -0.18671485781669617, -0.17973512411117554, -0.1727554053068161, -0.16577568650245667, -0.15879596769809723, -0.1518162488937378, -0.14483651518821716, -0.13785679638385773, -0.1308770775794983, -0.12389735132455826, -0.11691762506961823, -0.10993790626525879, -0.10295818746089935, -0.09597846120595932, -0.08899873495101929, -0.08201901614665985, -0.07503929734230042, -0.06805957108736038, -0.06107984855771065, -0.05410012602806091, -0.04712040349841118, -0.040140680968761444, -0.03316095843911171, -0.026181235909461975, -0.01920151337981224, -0.012221790850162506, -0.005242068320512772, 0.0017376542091369629, 0.008717376738786697, 0.015697099268436432, 0.022676821798086166, 0.0296565443277359, 0.036636266857385635, 0.04361598938703537, 0.050595711916685104, 0.05757543444633484, 0.06455515325069427, 0.07153487950563431, 0.07851460576057434, 0.08549432456493378, 0.09247404336929321, 0.09945376962423325, 0.10643349587917328, 0.11341321468353271, 0.12039293348789215, 0.1273726522922516, 0.13435238599777222, 0.14133210480213165, 0.1483118236064911, 0.15529155731201172, 0.16227127611637115, 0.1692509949207306, 0.17623071372509003, 0.18321043252944946, 0.1901901662349701, 0.19716988503932953, 0.20414960384368896, 0.2111293375492096, 0.21810905635356903, 0.22508877515792847]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 12.0, 14.0, 22.0, 19.0, 32.0, 34.0, 64.0, 84.0, 144.0, 226.0, 331.0, 546.0, 1034.0, 2115.0, 5042.0, 14682.0, 53402.0, 220324.0, 472709.0, 204701.0, 49758.0, 13867.0, 4860.0, 2084.0, 1040.0, 510.0, 288.0, 200.0, 129.0, 77.0, 54.0, 34.0, 29.0, 21.0, 14.0, 6.0, 11.0, 3.0, 7.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1611328125, -0.15526771545410156, -0.14940261840820312, -0.1435375213623047, -0.13767242431640625, -0.1318073272705078, -0.12594223022460938, -0.12007713317871094, -0.1142120361328125, -0.10834693908691406, -0.10248184204101562, -0.09661674499511719, -0.09075164794921875, -0.08488655090332031, -0.07902145385742188, -0.07315635681152344, -0.067291259765625, -0.06142616271972656, -0.055561065673828125, -0.04969596862792969, -0.04383087158203125, -0.03796577453613281, -0.032100677490234375, -0.026235580444335938, -0.0203704833984375, -0.014505386352539062, -0.008640289306640625, -0.0027751922607421875, 0.00308990478515625, 0.008955001831054688, 0.014820098876953125, 0.020685195922851562, 0.02655029296875, 0.03241539001464844, 0.038280487060546875, 0.04414558410644531, 0.05001068115234375, 0.05587577819824219, 0.061740875244140625, 0.06760597229003906, 0.0734710693359375, 0.07933616638183594, 0.08520126342773438, 0.09106636047363281, 0.09693145751953125, 0.10279655456542969, 0.10866165161132812, 0.11452674865722656, 0.120391845703125, 0.12625694274902344, 0.13212203979492188, 0.1379871368408203, 0.14385223388671875, 0.1497173309326172, 0.15558242797851562, 0.16144752502441406, 0.1673126220703125, 0.17317771911621094, 0.17904281616210938, 0.1849079132080078, 0.19077301025390625, 0.1966381072998047, 0.20250320434570312, 0.20836830139160156, 0.2142333984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 15.0, 6.0, 9.0, 13.0, 19.0, 25.0, 29.0, 42.0, 57.0, 51.0, 67.0, 68.0, 72.0, 60.0, 75.0, 69.0, 42.0, 53.0, 37.0, 38.0, 39.0, 24.0, 22.0, 19.0, 12.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14507007598876953, -0.14084815979003906, -0.1366262435913086, -0.13240432739257812, -0.12818241119384766, -0.12396049499511719, -0.11973857879638672, -0.11551666259765625, -0.11129474639892578, -0.10707283020019531, -0.10285091400146484, -0.09862899780273438, -0.0944070816040039, -0.09018516540527344, -0.08596324920654297, -0.0817413330078125, -0.07751941680908203, -0.07329750061035156, -0.0690755844116211, -0.06485366821289062, -0.060631752014160156, -0.05640983581542969, -0.05218791961669922, -0.04796600341796875, -0.04374408721923828, -0.03952217102050781, -0.035300254821777344, -0.031078338623046875, -0.026856422424316406, -0.022634506225585938, -0.01841259002685547, -0.014190673828125, -0.009968757629394531, -0.0057468414306640625, -0.0015249252319335938, 0.002696990966796875, 0.006918907165527344, 0.011140823364257812, 0.015362739562988281, 0.01958465576171875, 0.02380657196044922, 0.028028488159179688, 0.032250404357910156, 0.036472320556640625, 0.040694236755371094, 0.04491615295410156, 0.04913806915283203, 0.0533599853515625, 0.05758190155029297, 0.06180381774902344, 0.0660257339477539, 0.07024765014648438, 0.07446956634521484, 0.07869148254394531, 0.08291339874267578, 0.08713531494140625, 0.09135723114013672, 0.09557914733886719, 0.09980106353759766, 0.10402297973632812, 0.1082448959350586, 0.11246681213378906, 0.11668872833251953, 0.12091064453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 8.0, 11.0, 11.0, 21.0, 27.0, 28.0, 30.0, 28.0, 47.0, 83.0, 211.0, 575.0, 1909.0, 7135.0, 27826.0, 109954.0, 323175.0, 373911.0, 150516.0, 39140.0, 9864.0, 2659.0, 799.0, 254.0, 97.0, 53.0, 36.0, 21.0, 19.0, 19.0, 13.0, 15.0, 7.0, 9.0, 9.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18603515625, -0.18005752563476562, -0.17407989501953125, -0.16810226440429688, -0.1621246337890625, -0.15614700317382812, -0.15016937255859375, -0.14419174194335938, -0.138214111328125, -0.13223648071289062, -0.12625885009765625, -0.12028121948242188, -0.1143035888671875, -0.10832595825195312, -0.10234832763671875, -0.09637069702148438, -0.09039306640625, -0.08441543579101562, -0.07843780517578125, -0.07246017456054688, -0.0664825439453125, -0.060504913330078125, -0.05452728271484375, -0.048549652099609375, -0.042572021484375, -0.036594390869140625, -0.03061676025390625, -0.024639129638671875, -0.0186614990234375, -0.012683868408203125, -0.00670623779296875, -0.000728607177734375, 0.0052490234375, 0.011226654052734375, 0.01720428466796875, 0.023181915283203125, 0.0291595458984375, 0.035137176513671875, 0.04111480712890625, 0.047092437744140625, 0.053070068359375, 0.059047698974609375, 0.06502532958984375, 0.07100296020507812, 0.0769805908203125, 0.08295822143554688, 0.08893585205078125, 0.09491348266601562, 0.10089111328125, 0.10686874389648438, 0.11284637451171875, 0.11882400512695312, 0.1248016357421875, 0.13077926635742188, 0.13675689697265625, 0.14273452758789062, 0.148712158203125, 0.15468978881835938, 0.16066741943359375, 0.16664505004882812, 0.1726226806640625, 0.17860031127929688, 0.18457794189453125, 0.19055557250976562, 0.196533203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 4.0, 9.0, 8.0, 11.0, 11.0, 14.0, 17.0, 19.0, 17.0, 19.0, 27.0, 28.0, 33.0, 28.0, 42.0, 45.0, 35.0, 41.0, 44.0, 47.0, 45.0, 32.0, 45.0, 37.0, 36.0, 30.0, 31.0, 30.0, 27.0, 24.0, 23.0, 35.0, 20.0, 13.0, 15.0, 12.0, 8.0, 10.0, 5.0, 6.0, 6.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.22346115112304688, -0.21608734130859375, -0.20871353149414062, -0.2013397216796875, -0.19396591186523438, -0.18659210205078125, -0.17921829223632812, -0.171844482421875, -0.16447067260742188, -0.15709686279296875, -0.14972305297851562, -0.1423492431640625, -0.13497543334960938, -0.12760162353515625, -0.12022781372070312, -0.11285400390625, -0.10548019409179688, -0.09810638427734375, -0.09073257446289062, -0.0833587646484375, -0.07598495483398438, -0.06861114501953125, -0.061237335205078125, -0.053863525390625, -0.046489715576171875, -0.03911590576171875, -0.031742095947265625, -0.0243682861328125, -0.016994476318359375, -0.00962066650390625, -0.002246856689453125, 0.005126953125, 0.012500762939453125, 0.01987457275390625, 0.027248382568359375, 0.0346221923828125, 0.041996002197265625, 0.04936981201171875, 0.056743621826171875, 0.064117431640625, 0.07149124145507812, 0.07886505126953125, 0.08623886108398438, 0.0936126708984375, 0.10098648071289062, 0.10836029052734375, 0.11573410034179688, 0.12310791015625, 0.13048171997070312, 0.13785552978515625, 0.14522933959960938, 0.1526031494140625, 0.15997695922851562, 0.16735076904296875, 0.17472457885742188, 0.182098388671875, 0.18947219848632812, 0.19684600830078125, 0.20421981811523438, 0.2115936279296875, 0.21896743774414062, 0.22634124755859375, 0.23371505737304688, 0.2410888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 10.0, 11.0, 7.0, 17.0, 28.0, 56.0, 77.0, 150.0, 280.0, 599.0, 1571.0, 5155.0, 24333.0, 247080.0, 668733.0, 83936.0, 11655.0, 2969.0, 962.0, 406.0, 238.0, 111.0, 65.0, 33.0, 28.0, 12.0, 10.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11767578125, -0.11391448974609375, -0.1101531982421875, -0.10639190673828125, -0.102630615234375, -0.09886932373046875, -0.0951080322265625, -0.09134674072265625, -0.08758544921875, -0.08382415771484375, -0.0800628662109375, -0.07630157470703125, -0.072540283203125, -0.06877899169921875, -0.0650177001953125, -0.06125640869140625, -0.0574951171875, -0.05373382568359375, -0.0499725341796875, -0.04621124267578125, -0.042449951171875, -0.03868865966796875, -0.0349273681640625, -0.03116607666015625, -0.02740478515625, -0.02364349365234375, -0.0198822021484375, -0.01612091064453125, -0.012359619140625, -0.00859832763671875, -0.0048370361328125, -0.00107574462890625, 0.002685546875, 0.00644683837890625, 0.0102081298828125, 0.01396942138671875, 0.017730712890625, 0.02149200439453125, 0.0252532958984375, 0.02901458740234375, 0.03277587890625, 0.03653717041015625, 0.0402984619140625, 0.04405975341796875, 0.047821044921875, 0.05158233642578125, 0.0553436279296875, 0.05910491943359375, 0.0628662109375, 0.06662750244140625, 0.0703887939453125, 0.07415008544921875, 0.077911376953125, 0.08167266845703125, 0.0854339599609375, 0.08919525146484375, 0.09295654296875, 0.09671783447265625, 0.1004791259765625, 0.10424041748046875, 0.108001708984375, 0.11176300048828125, 0.1155242919921875, 0.11928558349609375, 0.123046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 5.0, 1.0, 10.0, 14.0, 12.0, 18.0, 13.0, 25.0, 29.0, 37.0, 26.0, 46.0, 37.0, 52.0, 32.0, 66.0, 68.0, 39.0, 60.0, 42.0, 46.0, 32.0, 49.0, 48.0, 28.0, 31.0, 19.0, 15.0, 16.0, 19.0, 9.0, 11.0, 5.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.245208740234375e-06, -5.0924718379974365e-06, -4.939734935760498e-06, -4.7869980335235596e-06, -4.634261131286621e-06, -4.481524229049683e-06, -4.328787326812744e-06, -4.176050424575806e-06, -4.023313522338867e-06, -3.870576620101929e-06, -3.7178397178649902e-06, -3.5651028156280518e-06, -3.4123659133911133e-06, -3.259629011154175e-06, -3.1068921089172363e-06, -2.954155206680298e-06, -2.8014183044433594e-06, -2.648681402206421e-06, -2.4959444999694824e-06, -2.343207597732544e-06, -2.1904706954956055e-06, -2.037733793258667e-06, -1.8849968910217285e-06, -1.73225998878479e-06, -1.5795230865478516e-06, -1.426786184310913e-06, -1.2740492820739746e-06, -1.1213123798370361e-06, -9.685754776000977e-07, -8.158385753631592e-07, -6.631016731262207e-07, -5.103647708892822e-07, -3.5762786865234375e-07, -2.0489096641540527e-07, -5.21540641784668e-08, 1.0058283805847168e-07, 2.5331974029541016e-07, 4.0605664253234863e-07, 5.587935447692871e-07, 7.115304470062256e-07, 8.642673492431641e-07, 1.0170042514801025e-06, 1.169741153717041e-06, 1.3224780559539795e-06, 1.475214958190918e-06, 1.6279518604278564e-06, 1.780688762664795e-06, 1.9334256649017334e-06, 2.086162567138672e-06, 2.2388994693756104e-06, 2.391636371612549e-06, 2.5443732738494873e-06, 2.6971101760864258e-06, 2.8498470783233643e-06, 3.0025839805603027e-06, 3.155320882797241e-06, 3.3080577850341797e-06, 3.460794687271118e-06, 3.6135315895080566e-06, 3.766268491744995e-06, 3.919005393981934e-06, 4.071742296218872e-06, 4.2244791984558105e-06, 4.377216100692749e-06, 4.5299530029296875e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 11.0, 17.0, 31.0, 27.0, 61.0, 69.0, 90.0, 154.0, 276.0, 453.0, 614.0, 1133.0, 2242.0, 3953.0, 8338.0, 20948.0, 61783.0, 208318.0, 420759.0, 215980.0, 63745.0, 21509.0, 8799.0, 4142.0, 2104.0, 1110.0, 709.0, 427.0, 232.0, 175.0, 95.0, 75.0, 53.0, 43.0, 31.0, 16.0, 12.0, 10.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060455322265625, -0.05853700637817383, -0.056618690490722656, -0.054700374603271484, -0.05278205871582031, -0.05086374282836914, -0.04894542694091797, -0.0470271110534668, -0.045108795166015625, -0.04319047927856445, -0.04127216339111328, -0.03935384750366211, -0.03743553161621094, -0.035517215728759766, -0.033598899841308594, -0.03168058395385742, -0.02976226806640625, -0.027843952178955078, -0.025925636291503906, -0.024007320404052734, -0.022089004516601562, -0.02017068862915039, -0.01825237274169922, -0.016334056854248047, -0.014415740966796875, -0.012497425079345703, -0.010579109191894531, -0.00866079330444336, -0.0067424774169921875, -0.004824161529541016, -0.0029058456420898438, -0.0009875297546386719, 0.0009307861328125, 0.002849102020263672, 0.004767417907714844, 0.006685733795166016, 0.008604049682617188, 0.01052236557006836, 0.012440681457519531, 0.014358997344970703, 0.016277313232421875, 0.018195629119873047, 0.02011394500732422, 0.02203226089477539, 0.023950576782226562, 0.025868892669677734, 0.027787208557128906, 0.029705524444580078, 0.03162384033203125, 0.03354215621948242, 0.035460472106933594, 0.037378787994384766, 0.03929710388183594, 0.04121541976928711, 0.04313373565673828, 0.04505205154418945, 0.046970367431640625, 0.0488886833190918, 0.05080699920654297, 0.05272531509399414, 0.05464363098144531, 0.056561946868896484, 0.058480262756347656, 0.06039857864379883, 0.06231689453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 15.0, 11.0, 29.0, 36.0, 51.0, 87.0, 121.0, 142.0, 141.0, 126.0, 83.0, 42.0, 30.0, 22.0, 16.0, 9.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.14498424530029297, -0.14116477966308594, -0.1373453140258789, -0.13352584838867188, -0.12970638275146484, -0.1258869171142578, -0.12206745147705078, -0.11824798583984375, -0.11442852020263672, -0.11060905456542969, -0.10678958892822266, -0.10297012329101562, -0.0991506576538086, -0.09533119201660156, -0.09151172637939453, -0.0876922607421875, -0.08387279510498047, -0.08005332946777344, -0.0762338638305664, -0.07241439819335938, -0.06859493255615234, -0.06477546691894531, -0.06095600128173828, -0.05713653564453125, -0.05331707000732422, -0.04949760437011719, -0.045678138732910156, -0.041858673095703125, -0.038039207458496094, -0.03421974182128906, -0.03040027618408203, -0.026580810546875, -0.02276134490966797, -0.018941879272460938, -0.015122413635253906, -0.011302947998046875, -0.007483482360839844, -0.0036640167236328125, 0.00015544891357421875, 0.00397491455078125, 0.007794380187988281, 0.011613845825195312, 0.015433311462402344, 0.019252777099609375, 0.023072242736816406, 0.026891708374023438, 0.03071117401123047, 0.0345306396484375, 0.03835010528564453, 0.04216957092285156, 0.045989036560058594, 0.049808502197265625, 0.053627967834472656, 0.05744743347167969, 0.06126689910888672, 0.06508636474609375, 0.06890583038330078, 0.07272529602050781, 0.07654476165771484, 0.08036422729492188, 0.0841836929321289, 0.08800315856933594, 0.09182262420654297, 0.09564208984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 17.0, 82.0, 259.0, 401.0, 187.0, 49.0, 13.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.7434539794921875, -5.63785457611084, -5.53225564956665, -5.426656246185303, -5.321056842803955, -5.215457439422607, -5.109858512878418, -5.00425910949707, -4.898659706115723, -4.793060302734375, -4.6874613761901855, -4.581861972808838, -4.47626256942749, -4.370663166046143, -4.265064239501953, -4.1594648361206055, -4.053865432739258, -3.9482662677764893, -3.8426668643951416, -3.737067699432373, -3.6314682960510254, -3.525869131088257, -3.4202699661254883, -3.3146705627441406, -3.209071636199951, -3.1034724712371826, -2.997873067855835, -2.8922739028930664, -2.7866744995117188, -2.68107533454895, -2.5754761695861816, -2.469876766204834, -2.3642771244049072, -2.2586779594421387, -2.153078556060791, -2.0474793910980225, -1.9418799877166748, -1.8362808227539062, -1.7306815385818481, -1.62508225440979, -1.519482970237732, -1.4138836860656738, -1.3082844018936157, -1.2026851177215576, -1.097085952758789, -0.9914866089820862, -0.8858873844146729, -0.7802881002426147, -0.6746888160705566, -0.5690895318984985, -0.4634902775287628, -0.3578910231590271, -0.252291738986969, -0.1466924548149109, -0.04109323024749756, 0.06450605392456055, 0.17010533809661865, 0.27570462226867676, 0.3813038766384125, 0.4869031310081482, 0.5925024151802063, 0.6981016993522644, 0.8037009239196777, 0.9093002080917358, 1.014899492263794]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 6.0, 9.0, 11.0, 16.0, 19.0, 19.0, 15.0, 16.0, 20.0, 27.0, 25.0, 33.0, 25.0, 35.0, 47.0, 54.0, 60.0, 38.0, 60.0, 40.0, 47.0, 45.0, 43.0, 45.0, 38.0, 30.0, 29.0, 30.0, 22.0, 13.0, 15.0, 8.0, 11.0, 6.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.203584909439087, -1.1623998880386353, -1.121214747428894, -1.0800297260284424, -1.0388447046279907, -0.9976596236228943, -0.9564745426177979, -0.9152895212173462, -0.8741044998168945, -0.8329194188117981, -0.7917343974113464, -0.75054931640625, -0.7093642950057983, -0.6681792140007019, -0.6269941329956055, -0.5858091115951538, -0.5446240305900574, -0.5034389495849609, -0.4622539281845093, -0.42106884717941284, -0.3798838257789612, -0.33869874477386475, -0.2975136935710907, -0.25632864236831665, -0.2151435911655426, -0.17395853996276855, -0.1327734887599945, -0.09158842265605927, -0.05040337145328522, -0.00921832025051117, 0.03196674585342407, 0.07315179705619812, 0.11433684825897217, 0.15552189946174622, 0.19670695066452026, 0.2378920167684555, 0.27907705307006836, 0.3202621340751648, 0.36144718527793884, 0.4026322364807129, 0.44381728768348694, 0.485002338886261, 0.5261874198913574, 0.5673724412918091, 0.6085575222969055, 0.6497425436973572, 0.6909276247024536, 0.7321126461029053, 0.7732977271080017, 0.8144828081130981, 0.8556678295135498, 0.8968529105186462, 0.9380379319190979, 0.9792230129241943, 1.020408034324646, 1.0615930557250977, 1.1027781963348389, 1.1439632177352905, 1.1851483583450317, 1.2263333797454834, 1.267518401145935, 1.3087034225463867, 1.349888563156128, 1.3910735845565796, 1.4322586059570312]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 11.0, 9.0, 15.0, 12.0, 19.0, 24.0, 26.0, 51.0, 90.0, 157.0, 337.0, 829.0, 2613.0, 12911.0, 145487.0, 3716373.0, 290619.0, 19228.0, 3631.0, 1001.0, 388.0, 157.0, 82.0, 57.0, 40.0, 21.0, 21.0, 15.0, 9.0, 6.0, 4.0, 5.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.615234375, -0.5984230041503906, -0.5816116333007812, -0.5648002624511719, -0.5479888916015625, -0.5311775207519531, -0.5143661499023438, -0.4975547790527344, -0.480743408203125, -0.4639320373535156, -0.44712066650390625, -0.4303092956542969, -0.4134979248046875, -0.3966865539550781, -0.37987518310546875, -0.3630638122558594, -0.34625244140625, -0.3294410705566406, -0.31262969970703125, -0.2958183288574219, -0.2790069580078125, -0.2621955871582031, -0.24538421630859375, -0.22857284545898438, -0.211761474609375, -0.19495010375976562, -0.17813873291015625, -0.16132736206054688, -0.1445159912109375, -0.12770462036132812, -0.11089324951171875, -0.09408187866210938, -0.0772705078125, -0.060459136962890625, -0.04364776611328125, -0.026836395263671875, -0.0100250244140625, 0.006786346435546875, 0.02359771728515625, 0.040409088134765625, 0.057220458984375, 0.07403182983398438, 0.09084320068359375, 0.10765457153320312, 0.1244659423828125, 0.14127731323242188, 0.15808868408203125, 0.17490005493164062, 0.19171142578125, 0.20852279663085938, 0.22533416748046875, 0.24214553833007812, 0.2589569091796875, 0.2757682800292969, 0.29257965087890625, 0.3093910217285156, 0.326202392578125, 0.3430137634277344, 0.35982513427734375, 0.3766365051269531, 0.3934478759765625, 0.4102592468261719, 0.42707061767578125, 0.4438819885253906, 0.460693359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 13.0, 11.0, 14.0, 21.0, 20.0, 17.0, 27.0, 36.0, 38.0, 35.0, 48.0, 61.0, 60.0, 52.0, 80.0, 54.0, 58.0, 51.0, 42.0, 44.0, 29.0, 22.0, 20.0, 34.0, 27.0, 10.0, 17.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12926101684570312, -0.12558746337890625, -0.12191390991210938, -0.1182403564453125, -0.11456680297851562, -0.11089324951171875, -0.10721969604492188, -0.103546142578125, -0.09987258911132812, -0.09619903564453125, -0.09252548217773438, -0.0888519287109375, -0.08517837524414062, -0.08150482177734375, -0.07783126831054688, -0.07415771484375, -0.07048416137695312, -0.06681060791015625, -0.06313705444335938, -0.0594635009765625, -0.055789947509765625, -0.05211639404296875, -0.048442840576171875, -0.044769287109375, -0.041095733642578125, -0.03742218017578125, -0.033748626708984375, -0.0300750732421875, -0.026401519775390625, -0.02272796630859375, -0.019054412841796875, -0.015380859375, -0.011707305908203125, -0.00803375244140625, -0.004360198974609375, -0.0006866455078125, 0.002986907958984375, 0.00666046142578125, 0.010334014892578125, 0.014007568359375, 0.017681121826171875, 0.02135467529296875, 0.025028228759765625, 0.0287017822265625, 0.032375335693359375, 0.03604888916015625, 0.039722442626953125, 0.04339599609375, 0.047069549560546875, 0.05074310302734375, 0.054416656494140625, 0.0580902099609375, 0.061763763427734375, 0.06543731689453125, 0.06911087036132812, 0.072784423828125, 0.07645797729492188, 0.08013153076171875, 0.08380508422851562, 0.0874786376953125, 0.09115219116210938, 0.09482574462890625, 0.09849929809570312, 0.1021728515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 10.0, 4.0, 13.0, 17.0, 23.0, 31.0, 34.0, 63.0, 110.0, 221.0, 450.0, 801.0, 1777.0, 4418.0, 11305.0, 32804.0, 111905.0, 455067.0, 1888724.0, 1284308.0, 289354.0, 75252.0, 22976.0, 8446.0, 3320.0, 1361.0, 664.0, 348.0, 183.0, 89.0, 70.0, 34.0, 27.0, 16.0, 16.0, 7.0, 6.0, 2.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.214019775390625, -0.20684814453125, -0.199676513671875, -0.1925048828125, -0.185333251953125, -0.17816162109375, -0.170989990234375, -0.163818359375, -0.156646728515625, -0.14947509765625, -0.142303466796875, -0.1351318359375, -0.127960205078125, -0.12078857421875, -0.113616943359375, -0.1064453125, -0.099273681640625, -0.09210205078125, -0.084930419921875, -0.0777587890625, -0.070587158203125, -0.06341552734375, -0.056243896484375, -0.049072265625, -0.041900634765625, -0.03472900390625, -0.027557373046875, -0.0203857421875, -0.013214111328125, -0.00604248046875, 0.001129150390625, 0.00830078125, 0.015472412109375, 0.02264404296875, 0.029815673828125, 0.0369873046875, 0.044158935546875, 0.05133056640625, 0.058502197265625, 0.065673828125, 0.072845458984375, 0.08001708984375, 0.087188720703125, 0.0943603515625, 0.101531982421875, 0.10870361328125, 0.115875244140625, 0.123046875, 0.130218505859375, 0.13739013671875, 0.144561767578125, 0.1517333984375, 0.158905029296875, 0.16607666015625, 0.173248291015625, 0.180419921875, 0.187591552734375, 0.19476318359375, 0.201934814453125, 0.2091064453125, 0.216278076171875, 0.22344970703125, 0.230621337890625, 0.23779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 9.0, 8.0, 19.0, 12.0, 13.0, 20.0, 27.0, 54.0, 56.0, 99.0, 125.0, 163.0, 225.0, 330.0, 411.0, 556.0, 502.0, 448.0, 259.0, 188.0, 139.0, 106.0, 66.0, 57.0, 35.0, 35.0, 24.0, 19.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1240234375, -0.11973190307617188, -0.11544036865234375, -0.11114883422851562, -0.1068572998046875, -0.10256576538085938, -0.09827423095703125, -0.09398269653320312, -0.089691162109375, -0.08539962768554688, -0.08110809326171875, -0.07681655883789062, -0.0725250244140625, -0.06823348999023438, -0.06394195556640625, -0.059650421142578125, -0.05535888671875, -0.051067352294921875, -0.04677581787109375, -0.042484283447265625, -0.0381927490234375, -0.033901214599609375, -0.02960968017578125, -0.025318145751953125, -0.021026611328125, -0.016735076904296875, -0.01244354248046875, -0.008152008056640625, -0.0038604736328125, 0.000431060791015625, 0.00472259521484375, 0.009014129638671875, 0.0133056640625, 0.017597198486328125, 0.02188873291015625, 0.026180267333984375, 0.0304718017578125, 0.034763336181640625, 0.03905487060546875, 0.043346405029296875, 0.047637939453125, 0.051929473876953125, 0.05622100830078125, 0.060512542724609375, 0.0648040771484375, 0.06909561157226562, 0.07338714599609375, 0.07767868041992188, 0.08197021484375, 0.08626174926757812, 0.09055328369140625, 0.09484481811523438, 0.0991363525390625, 0.10342788696289062, 0.10771942138671875, 0.11201095581054688, 0.116302490234375, 0.12059402465820312, 0.12488555908203125, 0.12917709350585938, 0.1334686279296875, 0.13776016235351562, 0.14205169677734375, 0.14634323120117188, 0.150634765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 31.0, 104.0, 282.0, 334.0, 193.0, 42.0, 11.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2407147884368896, -1.1728157997131348, -1.1049169301986694, -1.037018060684204, -0.9691190719604492, -0.9012201428413391, -0.833321213722229, -0.7654222846031189, -0.6975233554840088, -0.6296244263648987, -0.5617254972457886, -0.49382656812667847, -0.42592763900756836, -0.35802870988845825, -0.29012978076934814, -0.22223085165023804, -0.15433192253112793, -0.08643299341201782, -0.018534064292907715, 0.04936486482620239, 0.1172637939453125, 0.1851627230644226, 0.2530616521835327, 0.3209605813026428, 0.38885951042175293, 0.45675843954086304, 0.5246573686599731, 0.5925562977790833, 0.6604552268981934, 0.7283541560173035, 0.7962530851364136, 0.8641520142555237, 0.9320511817932129, 0.999950110912323, 1.067849040031433, 1.1357479095458984, 1.2036468982696533, 1.2715458869934082, 1.3394447565078735, 1.4073436260223389, 1.4752426147460938, 1.5431416034698486, 1.611040472984314, 1.6789393424987793, 1.7468383312225342, 1.814737319946289, 1.8826361894607544, 1.9505350589752197, 2.0184340476989746, 2.0863330364227295, 2.1542320251464844, 2.22213077545166, 2.290029764175415, 2.35792875289917, 2.4258275032043457, 2.4937264919281006, 2.5616254806518555, 2.6295244693756104, 2.6974234580993652, 2.765322208404541, 2.833221197128296, 2.901120185852051, 2.9690189361572266, 3.0369179248809814, 3.1048169136047363]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 11.0, 11.0, 15.0, 16.0, 28.0, 37.0, 32.0, 38.0, 44.0, 54.0, 60.0, 57.0, 71.0, 67.0, 66.0, 53.0, 45.0, 56.0, 37.0, 48.0, 37.0, 26.0, 19.0, 20.0, 13.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7587069272994995, -0.7395540475845337, -0.7204012274742126, -0.7012483477592468, -0.682095468044281, -0.66294264793396, -0.6437897682189941, -0.6246368885040283, -0.6054840087890625, -0.5863311290740967, -0.5671783089637756, -0.5480254292488098, -0.528872549533844, -0.509719729423523, -0.49056684970855713, -0.4714139699935913, -0.45226114988327026, -0.43310829997062683, -0.413955420255661, -0.3948025703430176, -0.37564969062805176, -0.3564968407154083, -0.3373439908027649, -0.3181911110877991, -0.29903826117515564, -0.2798854112625122, -0.2607325315475464, -0.24157968163490295, -0.22242681682109833, -0.2032739520072937, -0.18412110209465027, -0.16496823728084564, -0.14581537246704102, -0.1266625076532364, -0.10750965029001236, -0.08835679292678833, -0.0692039281129837, -0.05005106329917908, -0.030898205935955048, -0.011745348572731018, 0.007407516241073608, 0.026560377329587936, 0.045713238418102264, 0.0648660957813263, 0.08401896059513092, 0.10317182540893555, 0.12232468277215958, 0.1414775401353836, 0.16063040494918823, 0.17978326976299286, 0.19893613457679749, 0.21808898448944092, 0.23724184930324554, 0.25639471411705017, 0.2755475640296936, 0.2947004437446594, 0.31385329365730286, 0.3330061435699463, 0.3521590232849121, 0.37131187319755554, 0.390464723110199, 0.4096176028251648, 0.4287704527378082, 0.44792330265045166, 0.4670761823654175]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 13.0, 9.0, 19.0, 26.0, 23.0, 51.0, 93.0, 88.0, 152.0, 221.0, 286.0, 500.0, 716.0, 1257.0, 1960.0, 3418.0, 5987.0, 10750.0, 20136.0, 38136.0, 73759.0, 136714.0, 215200.0, 223009.0, 145562.0, 79634.0, 41543.0, 21818.0, 11810.0, 6366.0, 3629.0, 2064.0, 1231.0, 796.0, 506.0, 330.0, 209.0, 150.0, 119.0, 81.0, 54.0, 29.0, 33.0, 17.0, 11.0, 7.0, 11.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.129638671875, -0.1255950927734375, -0.121551513671875, -0.1175079345703125, -0.11346435546875, -0.1094207763671875, -0.105377197265625, -0.1013336181640625, -0.0972900390625, -0.0932464599609375, -0.089202880859375, -0.0851593017578125, -0.08111572265625, -0.0770721435546875, -0.073028564453125, -0.0689849853515625, -0.06494140625, -0.0608978271484375, -0.056854248046875, -0.0528106689453125, -0.04876708984375, -0.0447235107421875, -0.040679931640625, -0.0366363525390625, -0.0325927734375, -0.0285491943359375, -0.024505615234375, -0.0204620361328125, -0.01641845703125, -0.0123748779296875, -0.008331298828125, -0.0042877197265625, -0.000244140625, 0.0037994384765625, 0.007843017578125, 0.0118865966796875, 0.01593017578125, 0.0199737548828125, 0.024017333984375, 0.0280609130859375, 0.0321044921875, 0.0361480712890625, 0.040191650390625, 0.0442352294921875, 0.04827880859375, 0.0523223876953125, 0.056365966796875, 0.0604095458984375, 0.064453125, 0.0684967041015625, 0.072540283203125, 0.0765838623046875, 0.08062744140625, 0.0846710205078125, 0.088714599609375, 0.0927581787109375, 0.0968017578125, 0.1008453369140625, 0.104888916015625, 0.1089324951171875, 0.11297607421875, 0.1170196533203125, 0.121063232421875, 0.1251068115234375, 0.129150390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 3.0, 8.0, 12.0, 7.0, 14.0, 14.0, 16.0, 16.0, 17.0, 26.0, 29.0, 30.0, 37.0, 34.0, 48.0, 52.0, 59.0, 43.0, 59.0, 46.0, 42.0, 51.0, 44.0, 37.0, 27.0, 36.0, 17.0, 34.0, 20.0, 28.0, 15.0, 9.0, 19.0, 12.0, 8.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11053466796875, -0.10743141174316406, -0.10432815551757812, -0.10122489929199219, -0.09812164306640625, -0.09501838684082031, -0.09191513061523438, -0.08881187438964844, -0.0857086181640625, -0.08260536193847656, -0.07950210571289062, -0.07639884948730469, -0.07329559326171875, -0.07019233703613281, -0.06708908081054688, -0.06398582458496094, -0.060882568359375, -0.05777931213378906, -0.054676055908203125, -0.05157279968261719, -0.04846954345703125, -0.04536628723144531, -0.042263031005859375, -0.03915977478027344, -0.0360565185546875, -0.03295326232910156, -0.029850006103515625, -0.026746749877929688, -0.02364349365234375, -0.020540237426757812, -0.017436981201171875, -0.014333724975585938, -0.01123046875, -0.008127212524414062, -0.005023956298828125, -0.0019207000732421875, 0.00118255615234375, 0.0042858123779296875, 0.007389068603515625, 0.010492324829101562, 0.0135955810546875, 0.016698837280273438, 0.019802093505859375, 0.022905349731445312, 0.02600860595703125, 0.029111862182617188, 0.032215118408203125, 0.03531837463378906, 0.038421630859375, 0.04152488708496094, 0.044628143310546875, 0.04773139953613281, 0.05083465576171875, 0.05393791198730469, 0.057041168212890625, 0.06014442443847656, 0.0632476806640625, 0.06635093688964844, 0.06945419311523438, 0.07255744934082031, 0.07566070556640625, 0.07876396179199219, 0.08186721801757812, 0.08497047424316406, 0.08807373046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 5.0, 14.0, 11.0, 15.0, 13.0, 14.0, 17.0, 31.0, 20.0, 26.0, 30.0, 40.0, 33.0, 60.0, 102.0, 238.0, 1388.0, 29281.0, 805770.0, 205488.0, 4899.0, 481.0, 164.0, 67.0, 55.0, 38.0, 29.0, 35.0, 19.0, 34.0, 24.0, 15.0, 10.0, 18.0, 13.0, 13.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.89453125, -0.8672103881835938, -0.8398895263671875, -0.8125686645507812, -0.785247802734375, -0.7579269409179688, -0.7306060791015625, -0.7032852172851562, -0.67596435546875, -0.6486434936523438, -0.6213226318359375, -0.5940017700195312, -0.566680908203125, -0.5393600463867188, -0.5120391845703125, -0.48471832275390625, -0.4573974609375, -0.43007659912109375, -0.4027557373046875, -0.37543487548828125, -0.348114013671875, -0.32079315185546875, -0.2934722900390625, -0.26615142822265625, -0.23883056640625, -0.21150970458984375, -0.1841888427734375, -0.15686798095703125, -0.129547119140625, -0.10222625732421875, -0.0749053955078125, -0.04758453369140625, -0.020263671875, 0.00705718994140625, 0.0343780517578125, 0.06169891357421875, 0.089019775390625, 0.11634063720703125, 0.1436614990234375, 0.17098236083984375, 0.19830322265625, 0.22562408447265625, 0.2529449462890625, 0.28026580810546875, 0.307586669921875, 0.33490753173828125, 0.3622283935546875, 0.38954925537109375, 0.4168701171875, 0.44419097900390625, 0.4715118408203125, 0.49883270263671875, 0.526153564453125, 0.5534744262695312, 0.5807952880859375, 0.6081161499023438, 0.63543701171875, 0.6627578735351562, 0.6900787353515625, 0.7173995971679688, 0.744720458984375, 0.7720413208007812, 0.7993621826171875, 0.8266830444335938, 0.85400390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 11.0, 15.0, 12.0, 11.0, 12.0, 16.0, 19.0, 29.0, 28.0, 15.0, 35.0, 33.0, 27.0, 33.0, 35.0, 33.0, 42.0, 42.0, 42.0, 45.0, 42.0, 38.0, 35.0, 37.0, 39.0, 28.0, 27.0, 32.0, 22.0, 28.0, 23.0, 12.0, 16.0, 18.0, 9.0, 14.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17555809020996094, -0.16996383666992188, -0.1643695831298828, -0.15877532958984375, -0.1531810760498047, -0.14758682250976562, -0.14199256896972656, -0.1363983154296875, -0.13080406188964844, -0.12520980834960938, -0.11961555480957031, -0.11402130126953125, -0.10842704772949219, -0.10283279418945312, -0.09723854064941406, -0.091644287109375, -0.08605003356933594, -0.08045578002929688, -0.07486152648925781, -0.06926727294921875, -0.06367301940917969, -0.058078765869140625, -0.05248451232910156, -0.0468902587890625, -0.04129600524902344, -0.035701751708984375, -0.030107498168945312, -0.02451324462890625, -0.018918991088867188, -0.013324737548828125, -0.0077304840087890625, -0.00213623046875, 0.0034580230712890625, 0.009052276611328125, 0.014646530151367188, 0.02024078369140625, 0.025835037231445312, 0.031429290771484375, 0.03702354431152344, 0.0426177978515625, 0.04821205139160156, 0.053806304931640625, 0.05940055847167969, 0.06499481201171875, 0.07058906555175781, 0.07618331909179688, 0.08177757263183594, 0.087371826171875, 0.09296607971191406, 0.09856033325195312, 0.10415458679199219, 0.10974884033203125, 0.11534309387207031, 0.12093734741210938, 0.12653160095214844, 0.1321258544921875, 0.13772010803222656, 0.14331436157226562, 0.1489086151123047, 0.15450286865234375, 0.1600971221923828, 0.16569137573242188, 0.17128562927246094, 0.1768798828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 6.0, 11.0, 10.0, 29.0, 37.0, 54.0, 76.0, 150.0, 183.0, 380.0, 556.0, 955.0, 1878.0, 3761.0, 8098.0, 19227.0, 48571.0, 133762.0, 306426.0, 306381.0, 133612.0, 49124.0, 18878.0, 8236.0, 3786.0, 1922.0, 1028.0, 574.0, 301.0, 177.0, 104.0, 75.0, 45.0, 29.0, 21.0, 9.0, 14.0, 11.0, 11.0, 2.0, 5.0, 14.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09747314453125, -0.09442710876464844, -0.09138107299804688, -0.08833503723144531, -0.08528900146484375, -0.08224296569824219, -0.07919692993164062, -0.07615089416503906, -0.0731048583984375, -0.07005882263183594, -0.06701278686523438, -0.06396675109863281, -0.06092071533203125, -0.05787467956542969, -0.054828643798828125, -0.05178260803222656, -0.048736572265625, -0.04569053649902344, -0.042644500732421875, -0.03959846496582031, -0.03655242919921875, -0.03350639343261719, -0.030460357666015625, -0.027414321899414062, -0.0243682861328125, -0.021322250366210938, -0.018276214599609375, -0.015230178833007812, -0.01218414306640625, -0.009138107299804688, -0.006092071533203125, -0.0030460357666015625, 0.0, 0.0030460357666015625, 0.006092071533203125, 0.009138107299804688, 0.01218414306640625, 0.015230178833007812, 0.018276214599609375, 0.021322250366210938, 0.0243682861328125, 0.027414321899414062, 0.030460357666015625, 0.03350639343261719, 0.03655242919921875, 0.03959846496582031, 0.042644500732421875, 0.04569053649902344, 0.048736572265625, 0.05178260803222656, 0.054828643798828125, 0.05787467956542969, 0.06092071533203125, 0.06396675109863281, 0.06701278686523438, 0.07005882263183594, 0.0731048583984375, 0.07615089416503906, 0.07919692993164062, 0.08224296569824219, 0.08528900146484375, 0.08833503723144531, 0.09138107299804688, 0.09442710876464844, 0.09747314453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 5.0, 6.0, 7.0, 14.0, 19.0, 26.0, 67.0, 94.0, 123.0, 177.0, 146.0, 104.0, 86.0, 38.0, 33.0, 17.0, 12.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.562999725341797e-05, -2.49519944190979e-05, -2.4273991584777832e-05, -2.3595988750457764e-05, -2.2917985916137695e-05, -2.2239983081817627e-05, -2.156198024749756e-05, -2.088397741317749e-05, -2.0205974578857422e-05, -1.9527971744537354e-05, -1.8849968910217285e-05, -1.8171966075897217e-05, -1.749396324157715e-05, -1.681596040725708e-05, -1.6137957572937012e-05, -1.5459954738616943e-05, -1.4781951904296875e-05, -1.4103949069976807e-05, -1.3425946235656738e-05, -1.274794340133667e-05, -1.2069940567016602e-05, -1.1391937732696533e-05, -1.0713934898376465e-05, -1.0035932064056396e-05, -9.357929229736328e-06, -8.67992639541626e-06, -8.001923561096191e-06, -7.323920726776123e-06, -6.645917892456055e-06, -5.967915058135986e-06, -5.289912223815918e-06, -4.61190938949585e-06, -3.933906555175781e-06, -3.255903720855713e-06, -2.5779008865356445e-06, -1.8998980522155762e-06, -1.2218952178955078e-06, -5.438923835754395e-07, 1.341104507446289e-07, 8.121132850646973e-07, 1.4901161193847656e-06, 2.168118953704834e-06, 2.8461217880249023e-06, 3.5241246223449707e-06, 4.202127456665039e-06, 4.880130290985107e-06, 5.558133125305176e-06, 6.236135959625244e-06, 6.9141387939453125e-06, 7.592141628265381e-06, 8.27014446258545e-06, 8.948147296905518e-06, 9.626150131225586e-06, 1.0304152965545654e-05, 1.0982155799865723e-05, 1.1660158634185791e-05, 1.233816146850586e-05, 1.3016164302825928e-05, 1.3694167137145996e-05, 1.4372169971466064e-05, 1.5050172805786133e-05, 1.57281756401062e-05, 1.640617847442627e-05, 1.7084181308746338e-05, 1.7762184143066406e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 15.0, 18.0, 14.0, 19.0, 27.0, 20.0, 36.0, 49.0, 82.0, 297.0, 1632.0, 17932.0, 397016.0, 597984.0, 30363.0, 2377.0, 326.0, 108.0, 46.0, 45.0, 34.0, 20.0, 14.0, 9.0, 17.0, 8.0, 10.0, 5.0, 7.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27587890625, -0.2680168151855469, -0.26015472412109375, -0.2522926330566406, -0.2444305419921875, -0.23656845092773438, -0.22870635986328125, -0.22084426879882812, -0.212982177734375, -0.20512008666992188, -0.19725799560546875, -0.18939590454101562, -0.1815338134765625, -0.17367172241210938, -0.16580963134765625, -0.15794754028320312, -0.15008544921875, -0.14222335815429688, -0.13436126708984375, -0.12649917602539062, -0.1186370849609375, -0.11077499389648438, -0.10291290283203125, -0.09505081176757812, -0.087188720703125, -0.07932662963867188, -0.07146453857421875, -0.06360244750976562, -0.0557403564453125, -0.047878265380859375, -0.04001617431640625, -0.032154083251953125, -0.0242919921875, -0.016429901123046875, -0.00856781005859375, -0.000705718994140625, 0.0071563720703125, 0.015018463134765625, 0.02288055419921875, 0.030742645263671875, 0.038604736328125, 0.046466827392578125, 0.05432891845703125, 0.062191009521484375, 0.0700531005859375, 0.07791519165039062, 0.08577728271484375, 0.09363937377929688, 0.10150146484375, 0.10936355590820312, 0.11722564697265625, 0.12508773803710938, 0.1329498291015625, 0.14081192016601562, 0.14867401123046875, 0.15653610229492188, 0.164398193359375, 0.17226028442382812, 0.18012237548828125, 0.18798446655273438, 0.1958465576171875, 0.20370864868164062, 0.21157073974609375, 0.21943283081054688, 0.227294921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 12.0, 19.0, 19.0, 19.0, 21.0, 27.0, 36.0, 30.0, 54.0, 77.0, 62.0, 70.0, 55.0, 56.0, 67.0, 72.0, 53.0, 45.0, 41.0, 31.0, 32.0, 23.0, 10.0, 13.0, 9.0, 9.0, 10.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.055938720703125, -0.05433177947998047, -0.05272483825683594, -0.051117897033691406, -0.049510955810546875, -0.047904014587402344, -0.04629707336425781, -0.04469013214111328, -0.04308319091796875, -0.04147624969482422, -0.03986930847167969, -0.038262367248535156, -0.036655426025390625, -0.035048484802246094, -0.03344154357910156, -0.03183460235595703, -0.0302276611328125, -0.02862071990966797, -0.027013778686523438, -0.025406837463378906, -0.023799896240234375, -0.022192955017089844, -0.020586013793945312, -0.01897907257080078, -0.01737213134765625, -0.01576519012451172, -0.014158248901367188, -0.012551307678222656, -0.010944366455078125, -0.009337425231933594, -0.0077304840087890625, -0.006123542785644531, -0.0045166015625, -0.0029096603393554688, -0.0013027191162109375, 0.00030422210693359375, 0.001911163330078125, 0.0035181045532226562, 0.0051250457763671875, 0.006731986999511719, 0.00833892822265625, 0.009945869445800781, 0.011552810668945312, 0.013159751892089844, 0.014766693115234375, 0.016373634338378906, 0.017980575561523438, 0.01958751678466797, 0.0211944580078125, 0.02280139923095703, 0.024408340454101562, 0.026015281677246094, 0.027622222900390625, 0.029229164123535156, 0.030836105346679688, 0.03244304656982422, 0.03404998779296875, 0.03565692901611328, 0.03726387023925781, 0.038870811462402344, 0.040477752685546875, 0.042084693908691406, 0.04369163513183594, 0.04529857635498047, 0.046905517578125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 102.0, 909.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.018878936767578, -19.663183212280273, -19.30748748779297, -18.95178985595703, -18.596094131469727, -18.240398406982422, -17.884702682495117, -17.529006958007812, -17.173309326171875, -16.81761360168457, -16.461917877197266, -16.106220245361328, -15.750524520874023, -15.394828796386719, -15.039133071899414, -14.68343734741211, -14.327741622924805, -13.9720458984375, -13.616349220275879, -13.260653495788574, -12.904956817626953, -12.549261093139648, -12.193565368652344, -11.837869644165039, -11.482172966003418, -11.126477241516113, -10.770780563354492, -10.415084838867188, -10.059389114379883, -9.703692436218262, -9.347996711730957, -8.992300033569336, -8.636603355407715, -8.28090763092041, -7.925210952758789, -7.569515228271484, -7.2138190269470215, -6.858122825622559, -6.502427101135254, -6.146730899810791, -5.791034698486328, -5.435338497161865, -5.079642295837402, -4.723946571350098, -4.368250370025635, -4.012554168701172, -3.656858205795288, -3.3011622428894043, -2.9454660415649414, -2.5897698402404785, -2.2340738773345947, -1.8783777952194214, -1.522681713104248, -1.1669856309890747, -0.8112895488739014, -0.4555935859680176, -0.09989738464355469, 0.25579869747161865, 0.611494779586792, 0.9671908617019653, 1.3228869438171387, 1.678583025932312, 2.0342791080474854, 2.389975070953369, 2.745671272277832]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 1.0, 9.0, 9.0, 4.0, 10.0, 12.0, 15.0, 14.0, 18.0, 18.0, 21.0, 22.0, 26.0, 27.0, 39.0, 35.0, 34.0, 47.0, 48.0, 36.0, 38.0, 35.0, 36.0, 50.0, 38.0, 35.0, 42.0, 35.0, 29.0, 24.0, 26.0, 17.0, 22.0, 26.0, 15.0, 6.0, 13.0, 17.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.5929688811302185, -0.5729495882987976, -0.5529302954673767, -0.5329110026359558, -0.5128917098045349, -0.492872416973114, -0.4728530943393707, -0.45283380150794983, -0.43281450867652893, -0.41279521584510803, -0.39277592301368713, -0.37275663018226624, -0.35273730754852295, -0.33271801471710205, -0.31269872188568115, -0.29267942905426025, -0.27266013622283936, -0.25264084339141846, -0.23262155055999756, -0.21260224282741547, -0.19258294999599457, -0.17256365716457367, -0.15254434943199158, -0.13252505660057068, -0.11250576376914978, -0.09248647093772888, -0.07246717065572739, -0.05244787409901619, -0.03242857754230499, -0.012409284710884094, 0.007610015571117401, 0.027629315853118896, 0.047648608684539795, 0.0676679015159607, 0.08768720179796219, 0.10770650207996368, 0.12772579491138458, 0.14774508774280548, 0.16776439547538757, 0.18778368830680847, 0.20780298113822937, 0.22782227396965027, 0.24784156680107117, 0.26786085963249207, 0.28788018226623535, 0.30789947509765625, 0.32791876792907715, 0.34793806076049805, 0.36795735359191895, 0.38797664642333984, 0.40799593925476074, 0.42801523208618164, 0.44803452491760254, 0.46805381774902344, 0.4880731403827667, 0.5080924034118652, 0.5281116962432861, 0.548130989074707, 0.5681502819061279, 0.5881695747375488, 0.6081888675689697, 0.6282081604003906, 0.6482274532318115, 0.6682467460632324, 0.6882660984992981]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 23.0, 33.0, 42.0, 60.0, 72.0, 147.0, 202.0, 315.0, 556.0, 1085.0, 1887.0, 3770.0, 7954.0, 19459.0, 53327.0, 182091.0, 953310.0, 2328324.0, 470356.0, 108651.0, 35790.0, 14024.0, 6213.0, 2975.0, 1525.0, 802.0, 462.0, 277.0, 175.0, 117.0, 54.0, 43.0, 33.0, 32.0, 15.0, 17.0, 13.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2340087890625, -0.2271881103515625, -0.220367431640625, -0.2135467529296875, -0.20672607421875, -0.1999053955078125, -0.193084716796875, -0.1862640380859375, -0.179443359375, -0.1726226806640625, -0.165802001953125, -0.1589813232421875, -0.15216064453125, -0.1453399658203125, -0.138519287109375, -0.1316986083984375, -0.1248779296875, -0.1180572509765625, -0.111236572265625, -0.1044158935546875, -0.09759521484375, -0.0907745361328125, -0.083953857421875, -0.0771331787109375, -0.0703125, -0.0634918212890625, -0.056671142578125, -0.0498504638671875, -0.04302978515625, -0.0362091064453125, -0.029388427734375, -0.0225677490234375, -0.0157470703125, -0.0089263916015625, -0.002105712890625, 0.0047149658203125, 0.01153564453125, 0.0183563232421875, 0.025177001953125, 0.0319976806640625, 0.038818359375, 0.0456390380859375, 0.052459716796875, 0.0592803955078125, 0.06610107421875, 0.0729217529296875, 0.079742431640625, 0.0865631103515625, 0.0933837890625, 0.1002044677734375, 0.107025146484375, 0.1138458251953125, 0.12066650390625, 0.1274871826171875, 0.134307861328125, 0.1411285400390625, 0.14794921875, 0.1547698974609375, 0.161590576171875, 0.1684112548828125, 0.17523193359375, 0.1820526123046875, 0.188873291015625, 0.1956939697265625, 0.2025146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 0.0, 2.0, 4.0, 6.0, 9.0, 6.0, 11.0, 7.0, 7.0, 11.0, 8.0, 21.0, 26.0, 17.0, 30.0, 37.0, 54.0, 40.0, 44.0, 49.0, 46.0, 67.0, 61.0, 54.0, 51.0, 40.0, 30.0, 29.0, 38.0, 20.0, 32.0, 22.0, 23.0, 24.0, 13.0, 14.0, 10.0, 8.0, 7.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10345458984375, -0.1002349853515625, -0.097015380859375, -0.0937957763671875, -0.090576171875, -0.0873565673828125, -0.084136962890625, -0.0809173583984375, -0.07769775390625, -0.0744781494140625, -0.071258544921875, -0.0680389404296875, -0.0648193359375, -0.0615997314453125, -0.058380126953125, -0.0551605224609375, -0.05194091796875, -0.0487213134765625, -0.045501708984375, -0.0422821044921875, -0.0390625, -0.0358428955078125, -0.032623291015625, -0.0294036865234375, -0.02618408203125, -0.0229644775390625, -0.019744873046875, -0.0165252685546875, -0.0133056640625, -0.0100860595703125, -0.006866455078125, -0.0036468505859375, -0.00042724609375, 0.0027923583984375, 0.006011962890625, 0.0092315673828125, 0.012451171875, 0.0156707763671875, 0.018890380859375, 0.0221099853515625, 0.02532958984375, 0.0285491943359375, 0.031768798828125, 0.0349884033203125, 0.0382080078125, 0.0414276123046875, 0.044647216796875, 0.0478668212890625, 0.05108642578125, 0.0543060302734375, 0.057525634765625, 0.0607452392578125, 0.06396484375, 0.0671844482421875, 0.070404052734375, 0.0736236572265625, 0.07684326171875, 0.0800628662109375, 0.083282470703125, 0.0865020751953125, 0.0897216796875, 0.0929412841796875, 0.096160888671875, 0.0993804931640625, 0.10260009765625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 16.0, 11.0, 27.0, 51.0, 56.0, 85.0, 173.0, 310.0, 681.0, 1789.0, 6219.0, 25620.0, 129082.0, 779006.0, 2508130.0, 610643.0, 103384.0, 20975.0, 5082.0, 1607.0, 606.0, 296.0, 163.0, 89.0, 67.0, 31.0, 23.0, 9.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.44482421875, -0.43325042724609375, -0.4216766357421875, -0.41010284423828125, -0.398529052734375, -0.38695526123046875, -0.3753814697265625, -0.36380767822265625, -0.35223388671875, -0.34066009521484375, -0.3290863037109375, -0.31751251220703125, -0.305938720703125, -0.29436492919921875, -0.2827911376953125, -0.27121734619140625, -0.2596435546875, -0.24806976318359375, -0.2364959716796875, -0.22492218017578125, -0.213348388671875, -0.20177459716796875, -0.1902008056640625, -0.17862701416015625, -0.16705322265625, -0.15547943115234375, -0.1439056396484375, -0.13233184814453125, -0.120758056640625, -0.10918426513671875, -0.0976104736328125, -0.08603668212890625, -0.074462890625, -0.06288909912109375, -0.0513153076171875, -0.03974151611328125, -0.028167724609375, -0.01659393310546875, -0.0050201416015625, 0.00655364990234375, 0.01812744140625, 0.02970123291015625, 0.0412750244140625, 0.05284881591796875, 0.064422607421875, 0.07599639892578125, 0.0875701904296875, 0.09914398193359375, 0.1107177734375, 0.12229156494140625, 0.1338653564453125, 0.14543914794921875, 0.157012939453125, 0.16858673095703125, 0.1801605224609375, 0.19173431396484375, 0.20330810546875, 0.21488189697265625, 0.2264556884765625, 0.23802947998046875, 0.249603271484375, 0.26117706298828125, 0.2727508544921875, 0.28432464599609375, 0.2958984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 7.0, 7.0, 10.0, 11.0, 20.0, 24.0, 30.0, 37.0, 47.0, 76.0, 100.0, 117.0, 166.0, 196.0, 299.0, 415.0, 499.0, 535.0, 353.0, 283.0, 203.0, 159.0, 107.0, 83.0, 69.0, 55.0, 38.0, 38.0, 27.0, 12.0, 10.0, 11.0, 8.0, 2.0, 5.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.18555831909179688, -0.18007659912109375, -0.17459487915039062, -0.1691131591796875, -0.16363143920898438, -0.15814971923828125, -0.15266799926757812, -0.147186279296875, -0.14170455932617188, -0.13622283935546875, -0.13074111938476562, -0.1252593994140625, -0.11977767944335938, -0.11429595947265625, -0.10881423950195312, -0.10333251953125, -0.09785079956054688, -0.09236907958984375, -0.08688735961914062, -0.0814056396484375, -0.07592391967773438, -0.07044219970703125, -0.06496047973632812, -0.059478759765625, -0.053997039794921875, -0.04851531982421875, -0.043033599853515625, -0.0375518798828125, -0.032070159912109375, -0.02658843994140625, -0.021106719970703125, -0.015625, -0.010143280029296875, -0.00466156005859375, 0.000820159912109375, 0.0063018798828125, 0.011783599853515625, 0.01726531982421875, 0.022747039794921875, 0.028228759765625, 0.033710479736328125, 0.03919219970703125, 0.044673919677734375, 0.0501556396484375, 0.055637359619140625, 0.06111907958984375, 0.06660079956054688, 0.07208251953125, 0.07756423950195312, 0.08304595947265625, 0.08852767944335938, 0.0940093994140625, 0.09949111938476562, 0.10497283935546875, 0.11045455932617188, 0.115936279296875, 0.12141799926757812, 0.12689971923828125, 0.13238143920898438, 0.1378631591796875, 0.14334487915039062, 0.14882659912109375, 0.15430831909179688, 0.1597900390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 52.0, 148.0, 315.0, 301.0, 144.0, 24.0, 14.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9909214973449707, -0.914333701133728, -0.8377459645271301, -0.7611581683158875, -0.6845704317092896, -0.6079826354980469, -0.5313948392868042, -0.4548071026802063, -0.3782193064689636, -0.30163154006004333, -0.22504375874996185, -0.14845597743988037, -0.07186821103096008, 0.004719555377960205, 0.08130735158920288, 0.15789508819580078, 0.23448288440704346, 0.31107065081596375, 0.38765841722488403, 0.4642462134361267, 0.5408339500427246, 0.6174217462539673, 0.69400954246521, 0.7705972790718079, 0.8471850752830505, 0.9237728714942932, 1.0003606081008911, 1.0769484043121338, 1.1535362005233765, 1.2301239967346191, 1.3067116737365723, 1.383299469947815, 1.4598872661590576, 1.5364750623703003, 1.613062858581543, 1.689650535583496, 1.7662383317947388, 1.8428261280059814, 1.9194139242172241, 1.9960017204284668, 2.07258939743042, 2.149177074432373, 2.2257649898529053, 2.3023526668548584, 2.3789405822753906, 2.4555282592773438, 2.532115936279297, 2.608703851699829, 2.6852917671203613, 2.7618794441223145, 2.8384673595428467, 2.9150550365448, 2.991642951965332, 3.068230628967285, 3.1448183059692383, 3.2214062213897705, 3.2979938983917236, 3.3745815753936768, 3.451169490814209, 3.527757167816162, 3.6043450832366943, 3.6809327602386475, 3.7575206756591797, 3.834108352661133, 3.910696029663086]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 5.0, 9.0, 9.0, 14.0, 14.0, 15.0, 28.0, 29.0, 29.0, 37.0, 30.0, 35.0, 32.0, 34.0, 32.0, 32.0, 38.0, 36.0, 40.0, 45.0, 51.0, 33.0, 41.0, 27.0, 38.0, 33.0, 25.0, 26.0, 22.0, 22.0, 24.0, 20.0, 16.0, 16.0, 14.0, 10.0, 4.0, 12.0, 3.0, 4.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4834466576576233, -0.46743080019950867, -0.45141494274139404, -0.4353991150856018, -0.4193832576274872, -0.40336740016937256, -0.3873515725135803, -0.3713357150554657, -0.3553198575973511, -0.33930400013923645, -0.3232881426811218, -0.3072723150253296, -0.29125645756721497, -0.27524060010910034, -0.2592247724533081, -0.24320891499519348, -0.22719305753707886, -0.21117720007896423, -0.1951613575220108, -0.17914551496505737, -0.16312965750694275, -0.14711380004882812, -0.1310979574918747, -0.11508210748434067, -0.09906625747680664, -0.08305040746927261, -0.06703455746173859, -0.05101870745420456, -0.03500285744667053, -0.018987007439136505, -0.002971157431602478, 0.013044692575931549, 0.02906060218811035, 0.04507645219564438, 0.061092302203178406, 0.07710815221071243, 0.09312400221824646, 0.10913985222578049, 0.12515570223331451, 0.14117154479026794, 0.15718740224838257, 0.1732032597064972, 0.18921910226345062, 0.20523494482040405, 0.22125080227851868, 0.2372666597366333, 0.25328248739242554, 0.26929834485054016, 0.2853142023086548, 0.3013300597667694, 0.31734591722488403, 0.33336174488067627, 0.3493776023387909, 0.3653934597969055, 0.38140928745269775, 0.3974251449108124, 0.413441002368927, 0.4294568598270416, 0.44547271728515625, 0.4614885449409485, 0.4775044023990631, 0.49352025985717773, 0.50953608751297, 0.525551974773407, 0.5415678024291992]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 18.0, 38.0, 36.0, 82.0, 135.0, 248.0, 435.0, 741.0, 1388.0, 2505.0, 4747.0, 9559.0, 22604.0, 62877.0, 184845.0, 361945.0, 249845.0, 90438.0, 30919.0, 12503.0, 5679.0, 3194.0, 1656.0, 912.0, 536.0, 304.0, 137.0, 82.0, 48.0, 34.0, 20.0, 11.0, 12.0, 8.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.2540016174316406, -0.24481964111328125, -0.23563766479492188, -0.2264556884765625, -0.21727371215820312, -0.20809173583984375, -0.19890975952148438, -0.189727783203125, -0.18054580688476562, -0.17136383056640625, -0.16218185424804688, -0.1529998779296875, -0.14381790161132812, -0.13463592529296875, -0.12545394897460938, -0.11627197265625, -0.10708999633789062, -0.09790802001953125, -0.08872604370117188, -0.0795440673828125, -0.07036209106445312, -0.06118011474609375, -0.051998138427734375, -0.042816162109375, -0.033634185791015625, -0.02445220947265625, -0.015270233154296875, -0.0060882568359375, 0.003093719482421875, 0.01227569580078125, 0.021457672119140625, 0.0306396484375, 0.039821624755859375, 0.04900360107421875, 0.058185577392578125, 0.0673675537109375, 0.07654953002929688, 0.08573150634765625, 0.09491348266601562, 0.104095458984375, 0.11327743530273438, 0.12245941162109375, 0.13164138793945312, 0.1408233642578125, 0.15000534057617188, 0.15918731689453125, 0.16836929321289062, 0.17755126953125, 0.18673324584960938, 0.19591522216796875, 0.20509719848632812, 0.2142791748046875, 0.22346115112304688, 0.23264312744140625, 0.24182510375976562, 0.251007080078125, 0.2601890563964844, 0.26937103271484375, 0.2785530090332031, 0.2877349853515625, 0.2969169616699219, 0.30609893798828125, 0.3152809143066406, 0.324462890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 10.0, 10.0, 12.0, 23.0, 28.0, 26.0, 26.0, 32.0, 50.0, 30.0, 38.0, 55.0, 59.0, 44.0, 56.0, 74.0, 44.0, 35.0, 39.0, 23.0, 28.0, 41.0, 25.0, 27.0, 26.0, 30.0, 12.0, 12.0, 15.0, 16.0, 7.0, 11.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1156005859375, -0.11262226104736328, -0.10964393615722656, -0.10666561126708984, -0.10368728637695312, -0.1007089614868164, -0.09773063659667969, -0.09475231170654297, -0.09177398681640625, -0.08879566192626953, -0.08581733703613281, -0.0828390121459961, -0.07986068725585938, -0.07688236236572266, -0.07390403747558594, -0.07092571258544922, -0.0679473876953125, -0.06496906280517578, -0.06199073791503906, -0.059012413024902344, -0.056034088134765625, -0.053055763244628906, -0.05007743835449219, -0.04709911346435547, -0.04412078857421875, -0.04114246368408203, -0.03816413879394531, -0.035185813903808594, -0.032207489013671875, -0.029229164123535156, -0.026250839233398438, -0.02327251434326172, -0.020294189453125, -0.01731586456298828, -0.014337539672851562, -0.011359214782714844, -0.008380889892578125, -0.005402565002441406, -0.0024242401123046875, 0.0005540847778320312, 0.00353240966796875, 0.006510734558105469, 0.009489059448242188, 0.012467384338378906, 0.015445709228515625, 0.018424034118652344, 0.021402359008789062, 0.02438068389892578, 0.0273590087890625, 0.03033733367919922, 0.03331565856933594, 0.036293983459472656, 0.039272308349609375, 0.042250633239746094, 0.04522895812988281, 0.04820728302001953, 0.05118560791015625, 0.05416393280029297, 0.05714225769042969, 0.060120582580566406, 0.06309890747070312, 0.06607723236083984, 0.06905555725097656, 0.07203388214111328, 0.07501220703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 4.0, 7.0, 13.0, 14.0, 29.0, 37.0, 29.0, 54.0, 76.0, 143.0, 252.0, 516.0, 1258.0, 3194.0, 8202.0, 26637.0, 113239.0, 435504.0, 349711.0, 78389.0, 20012.0, 6618.0, 2514.0, 985.0, 461.0, 252.0, 140.0, 72.0, 52.0, 36.0, 34.0, 18.0, 13.0, 8.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.38525390625, -0.37277984619140625, -0.3603057861328125, -0.34783172607421875, -0.335357666015625, -0.32288360595703125, -0.3104095458984375, -0.29793548583984375, -0.28546142578125, -0.27298736572265625, -0.2605133056640625, -0.24803924560546875, -0.235565185546875, -0.22309112548828125, -0.2106170654296875, -0.19814300537109375, -0.1856689453125, -0.17319488525390625, -0.1607208251953125, -0.14824676513671875, -0.135772705078125, -0.12329864501953125, -0.1108245849609375, -0.09835052490234375, -0.08587646484375, -0.07340240478515625, -0.0609283447265625, -0.04845428466796875, -0.035980224609375, -0.02350616455078125, -0.0110321044921875, 0.00144195556640625, 0.013916015625, 0.02639007568359375, 0.0388641357421875, 0.05133819580078125, 0.063812255859375, 0.07628631591796875, 0.0887603759765625, 0.10123443603515625, 0.11370849609375, 0.12618255615234375, 0.1386566162109375, 0.15113067626953125, 0.163604736328125, 0.17607879638671875, 0.1885528564453125, 0.20102691650390625, 0.2135009765625, 0.22597503662109375, 0.2384490966796875, 0.25092315673828125, 0.263397216796875, 0.27587127685546875, 0.2883453369140625, 0.30081939697265625, 0.31329345703125, 0.32576751708984375, 0.3382415771484375, 0.35071563720703125, 0.363189697265625, 0.37566375732421875, 0.3881378173828125, 0.40061187744140625, 0.4130859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 8.0, 13.0, 13.0, 20.0, 23.0, 25.0, 30.0, 28.0, 41.0, 47.0, 49.0, 62.0, 64.0, 72.0, 55.0, 45.0, 46.0, 46.0, 50.0, 32.0, 32.0, 42.0, 25.0, 24.0, 12.0, 13.0, 19.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2354736328125, -0.22832489013671875, -0.2211761474609375, -0.21402740478515625, -0.206878662109375, -0.19972991943359375, -0.1925811767578125, -0.18543243408203125, -0.17828369140625, -0.17113494873046875, -0.1639862060546875, -0.15683746337890625, -0.149688720703125, -0.14253997802734375, -0.1353912353515625, -0.12824249267578125, -0.12109375, -0.11394500732421875, -0.1067962646484375, -0.09964752197265625, -0.092498779296875, -0.08535003662109375, -0.0782012939453125, -0.07105255126953125, -0.06390380859375, -0.05675506591796875, -0.0496063232421875, -0.04245758056640625, -0.035308837890625, -0.02816009521484375, -0.0210113525390625, -0.01386260986328125, -0.0067138671875, 0.00043487548828125, 0.0075836181640625, 0.01473236083984375, 0.021881103515625, 0.02902984619140625, 0.0361785888671875, 0.04332733154296875, 0.05047607421875, 0.05762481689453125, 0.0647735595703125, 0.07192230224609375, 0.079071044921875, 0.08621978759765625, 0.0933685302734375, 0.10051727294921875, 0.107666015625, 0.11481475830078125, 0.1219635009765625, 0.12911224365234375, 0.136260986328125, 0.14340972900390625, 0.1505584716796875, 0.15770721435546875, 0.16485595703125, 0.17200469970703125, 0.1791534423828125, 0.18630218505859375, 0.193450927734375, 0.20059967041015625, 0.2077484130859375, 0.21489715576171875, 0.2220458984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 12.0, 21.0, 22.0, 41.0, 40.0, 62.0, 88.0, 120.0, 166.0, 215.0, 284.0, 435.0, 577.0, 908.0, 1350.0, 2583.0, 5808.0, 17227.0, 78576.0, 503944.0, 360855.0, 51431.0, 12879.0, 4698.0, 2132.0, 1241.0, 757.0, 570.0, 376.0, 299.0, 208.0, 161.0, 139.0, 82.0, 59.0, 52.0, 35.0, 28.0, 20.0, 14.0, 9.0, 9.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24500083923339844, -0.23731613159179688, -0.2296314239501953, -0.22194671630859375, -0.2142620086669922, -0.20657730102539062, -0.19889259338378906, -0.1912078857421875, -0.18352317810058594, -0.17583847045898438, -0.1681537628173828, -0.16046905517578125, -0.1527843475341797, -0.14509963989257812, -0.13741493225097656, -0.129730224609375, -0.12204551696777344, -0.11436080932617188, -0.10667610168457031, -0.09899139404296875, -0.09130668640136719, -0.08362197875976562, -0.07593727111816406, -0.0682525634765625, -0.06056785583496094, -0.052883148193359375, -0.04519844055175781, -0.03751373291015625, -0.029829025268554688, -0.022144317626953125, -0.014459609985351562, -0.00677490234375, 0.0009098052978515625, 0.008594512939453125, 0.016279220581054688, 0.02396392822265625, 0.03164863586425781, 0.039333343505859375, 0.04701805114746094, 0.0547027587890625, 0.06238746643066406, 0.07007217407226562, 0.07775688171386719, 0.08544158935546875, 0.09312629699707031, 0.10081100463867188, 0.10849571228027344, 0.116180419921875, 0.12386512756347656, 0.13154983520507812, 0.1392345428466797, 0.14691925048828125, 0.1546039581298828, 0.16228866577148438, 0.16997337341308594, 0.1776580810546875, 0.18534278869628906, 0.19302749633789062, 0.2007122039794922, 0.20839691162109375, 0.2160816192626953, 0.22376632690429688, 0.23145103454589844, 0.2391357421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 13.0, 19.0, 88.0, 533.0, 286.0, 30.0, 13.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001354217529296875, -0.0001321788877248764, -0.0001289360225200653, -0.0001256931573152542, -0.00012245029211044312, -0.00011920742690563202, -0.00011596456170082092, -0.00011272169649600983, -0.00010947883129119873, -0.00010623596608638763, -0.00010299310088157654, -9.975023567676544e-05, -9.650737047195435e-05, -9.326450526714325e-05, -9.002164006233215e-05, -8.677877485752106e-05, -8.353590965270996e-05, -8.029304444789886e-05, -7.705017924308777e-05, -7.380731403827667e-05, -7.056444883346558e-05, -6.732158362865448e-05, -6.407871842384338e-05, -6.083585321903229e-05, -5.759298801422119e-05, -5.4350122809410095e-05, -5.1107257604599e-05, -4.78643923997879e-05, -4.462152719497681e-05, -4.137866199016571e-05, -3.8135796785354614e-05, -3.489293158054352e-05, -3.165006637573242e-05, -2.8407201170921326e-05, -2.516433596611023e-05, -2.1921470761299133e-05, -1.8678605556488037e-05, -1.543574035167694e-05, -1.2192875146865845e-05, -8.950009942054749e-06, -5.707144737243652e-06, -2.464279532432556e-06, 7.7858567237854e-07, 4.021450877189636e-06, 7.264316082000732e-06, 1.0507181286811829e-05, 1.3750046491622925e-05, 1.699291169643402e-05, 2.0235776901245117e-05, 2.3478642106056213e-05, 2.672150731086731e-05, 2.9964372515678406e-05, 3.32072377204895e-05, 3.64501029253006e-05, 3.9692968130111694e-05, 4.293583333492279e-05, 4.617869853973389e-05, 4.942156374454498e-05, 5.266442894935608e-05, 5.5907294154167175e-05, 5.915015935897827e-05, 6.239302456378937e-05, 6.563588976860046e-05, 6.887875497341156e-05, 7.212162017822266e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 22.0, 17.0, 30.0, 35.0, 64.0, 83.0, 176.0, 264.0, 430.0, 829.0, 1464.0, 2846.0, 5930.0, 12780.0, 30100.0, 82637.0, 217039.0, 338680.0, 217554.0, 82227.0, 30033.0, 12878.0, 6119.0, 2896.0, 1473.0, 807.0, 436.0, 253.0, 129.0, 102.0, 62.0, 43.0, 25.0, 20.0, 11.0, 16.0, 4.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.1217041015625, -0.11817646026611328, -0.11464881896972656, -0.11112117767333984, -0.10759353637695312, -0.1040658950805664, -0.10053825378417969, -0.09701061248779297, -0.09348297119140625, -0.08995532989501953, -0.08642768859863281, -0.0829000473022461, -0.07937240600585938, -0.07584476470947266, -0.07231712341308594, -0.06878948211669922, -0.0652618408203125, -0.06173419952392578, -0.05820655822753906, -0.054678916931152344, -0.051151275634765625, -0.047623634338378906, -0.04409599304199219, -0.04056835174560547, -0.03704071044921875, -0.03351306915283203, -0.029985427856445312, -0.026457786560058594, -0.022930145263671875, -0.019402503967285156, -0.015874862670898438, -0.012347221374511719, -0.008819580078125, -0.005291938781738281, -0.0017642974853515625, 0.0017633438110351562, 0.005290985107421875, 0.008818626403808594, 0.012346267700195312, 0.01587390899658203, 0.01940155029296875, 0.02292919158935547, 0.026456832885742188, 0.029984474182128906, 0.033512115478515625, 0.037039756774902344, 0.04056739807128906, 0.04409503936767578, 0.0476226806640625, 0.05115032196044922, 0.05467796325683594, 0.058205604553222656, 0.061733245849609375, 0.0652608871459961, 0.06878852844238281, 0.07231616973876953, 0.07584381103515625, 0.07937145233154297, 0.08289909362792969, 0.0864267349243164, 0.08995437622070312, 0.09348201751708984, 0.09700965881347656, 0.10053730010986328, 0.10406494140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 7.0, 16.0, 4.0, 12.0, 22.0, 26.0, 22.0, 44.0, 38.0, 64.0, 64.0, 67.0, 68.0, 54.0, 70.0, 64.0, 72.0, 52.0, 56.0, 28.0, 32.0, 23.0, 18.0, 19.0, 7.0, 9.0, 6.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07073974609375, -0.0687251091003418, -0.0667104721069336, -0.06469583511352539, -0.06268119812011719, -0.060666561126708984, -0.05865192413330078, -0.05663728713989258, -0.054622650146484375, -0.05260801315307617, -0.05059337615966797, -0.048578739166259766, -0.04656410217285156, -0.04454946517944336, -0.042534828186035156, -0.04052019119262695, -0.03850555419921875, -0.03649091720581055, -0.034476280212402344, -0.03246164321899414, -0.030447006225585938, -0.028432369232177734, -0.02641773223876953, -0.024403095245361328, -0.022388458251953125, -0.020373821258544922, -0.01835918426513672, -0.016344547271728516, -0.014329910278320312, -0.01231527328491211, -0.010300636291503906, -0.008285999298095703, -0.0062713623046875, -0.004256725311279297, -0.0022420883178710938, -0.00022745132446289062, 0.0017871856689453125, 0.0038018226623535156, 0.005816459655761719, 0.007831096649169922, 0.009845733642578125, 0.011860370635986328, 0.013875007629394531, 0.015889644622802734, 0.017904281616210938, 0.01991891860961914, 0.021933555603027344, 0.023948192596435547, 0.02596282958984375, 0.027977466583251953, 0.029992103576660156, 0.03200674057006836, 0.03402137756347656, 0.036036014556884766, 0.03805065155029297, 0.04006528854370117, 0.042079925537109375, 0.04409456253051758, 0.04610919952392578, 0.048123836517333984, 0.05013847351074219, 0.05215311050415039, 0.054167747497558594, 0.0561823844909668, 0.058197021484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 20.0, 46.0, 114.0, 240.0, 329.0, 175.0, 56.0, 17.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6358119249343872, -0.5733609199523926, -0.510909914970398, -0.4484589695930481, -0.38600796461105347, -0.32355695962905884, -0.2611059844493866, -0.19865500926971436, -0.13620400428771973, -0.07375301420688629, -0.011302024126052856, 0.05114896595478058, 0.11359995603561401, 0.17605096101760864, 0.23850193619728088, 0.3009529113769531, 0.36340391635894775, 0.4258549213409424, 0.4883058965206146, 0.5507568717002869, 0.6132078766822815, 0.6756588816642761, 0.738109827041626, 0.8005608320236206, 0.8630118370056152, 0.9254628419876099, 0.9879138469696045, 1.0503648519515991, 1.1128158569335938, 1.1752667427062988, 1.2377177476882935, 1.300168752670288, 1.3626198768615723, 1.425070881843567, 1.4875218868255615, 1.5499728918075562, 1.6124238967895508, 1.6748747825622559, 1.7373257875442505, 1.7997767925262451, 1.8622277975082397, 1.9246788024902344, 1.987129807472229, 2.0495808124542236, 2.1120316982269287, 2.174482822418213, 2.236933708190918, 2.299384593963623, 2.3618357181549072, 2.4242866039276123, 2.4867377281188965, 2.5491886138916016, 2.6116397380828857, 2.674090623855591, 2.736541748046875, 2.79899263381958, 2.861443519592285, 2.9238944053649902, 2.9863455295562744, 3.0487964153289795, 3.1112475395202637, 3.1736984252929688, 3.236149549484253, 3.298600435256958, 3.361051559448242]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 18.0, 12.0, 11.0, 14.0, 17.0, 11.0, 22.0, 32.0, 31.0, 34.0, 31.0, 50.0, 42.0, 45.0, 50.0, 47.0, 34.0, 35.0, 40.0, 43.0, 50.0, 37.0, 39.0, 33.0, 36.0, 19.0, 15.0, 28.0, 18.0, 16.0, 14.0, 11.0, 15.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5538691282272339, -0.5373659133911133, -0.5208627581596375, -0.5043595433235168, -0.48785635828971863, -0.4713531732559204, -0.4548499584197998, -0.4383467733860016, -0.42184358835220337, -0.40534040331840515, -0.38883718848228455, -0.37233400344848633, -0.3558308184146881, -0.3393276333808899, -0.3228244185447693, -0.30632123351097107, -0.28981801867485046, -0.27331483364105225, -0.25681161880493164, -0.24030843377113342, -0.2238052487373352, -0.2073020488023758, -0.19079884886741638, -0.17429566383361816, -0.15779246389865875, -0.14128926396369934, -0.12478607892990112, -0.10828287899494171, -0.0917796865105629, -0.07527649402618408, -0.05877329409122467, -0.042270101606845856, -0.02576690912246704, -0.009263714775443077, 0.007239479571580887, 0.02374267578125, 0.040245868265628815, 0.05674906075000763, 0.07325226068496704, 0.08975545316934586, 0.10625864565372467, 0.12276183813810349, 0.1392650306224823, 0.1557682305574417, 0.17227143049240112, 0.18877461552619934, 0.20527781546115875, 0.22178101539611816, 0.23828420042991638, 0.2547873854637146, 0.2712906002998352, 0.2877937853336334, 0.30429697036743164, 0.32080018520355225, 0.33730337023735046, 0.3538065552711487, 0.3703097701072693, 0.3868129551410675, 0.4033161699771881, 0.41981935501098633, 0.43632254004478455, 0.45282572507858276, 0.46932893991470337, 0.4858321249485016, 0.5023353099822998]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 12.0, 12.0, 13.0, 16.0, 31.0, 37.0, 42.0, 72.0, 105.0, 176.0, 292.0, 570.0, 982.0, 1963.0, 4019.0, 9414.0, 24315.0, 71845.0, 254559.0, 1104378.0, 1869029.0, 627949.0, 149625.0, 46022.0, 16165.0, 6660.0, 2852.0, 1424.0, 735.0, 380.0, 231.0, 115.0, 79.0, 65.0, 35.0, 28.0, 12.0, 10.0, 10.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1956787109375, -0.19028854370117188, -0.18489837646484375, -0.17950820922851562, -0.1741180419921875, -0.16872787475585938, -0.16333770751953125, -0.15794754028320312, -0.152557373046875, -0.14716720581054688, -0.14177703857421875, -0.13638687133789062, -0.1309967041015625, -0.12560653686523438, -0.12021636962890625, -0.11482620239257812, -0.10943603515625, -0.10404586791992188, -0.09865570068359375, -0.09326553344726562, -0.0878753662109375, -0.08248519897460938, -0.07709503173828125, -0.07170486450195312, -0.066314697265625, -0.060924530029296875, -0.05553436279296875, -0.050144195556640625, -0.0447540283203125, -0.039363861083984375, -0.03397369384765625, -0.028583526611328125, -0.023193359375, -0.017803192138671875, -0.01241302490234375, -0.007022857666015625, -0.0016326904296875, 0.003757476806640625, 0.00914764404296875, 0.014537811279296875, 0.019927978515625, 0.025318145751953125, 0.03070831298828125, 0.036098480224609375, 0.0414886474609375, 0.046878814697265625, 0.05226898193359375, 0.057659149169921875, 0.06304931640625, 0.06843948364257812, 0.07382965087890625, 0.07921981811523438, 0.0846099853515625, 0.09000015258789062, 0.09539031982421875, 0.10078048706054688, 0.106170654296875, 0.11156082153320312, 0.11695098876953125, 0.12234115600585938, 0.1277313232421875, 0.13312149047851562, 0.13851165771484375, 0.14390182495117188, 0.1492919921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 8.0, 8.0, 15.0, 17.0, 18.0, 25.0, 27.0, 30.0, 40.0, 42.0, 45.0, 40.0, 58.0, 43.0, 48.0, 56.0, 50.0, 42.0, 44.0, 50.0, 50.0, 23.0, 33.0, 31.0, 28.0, 22.0, 26.0, 15.0, 12.0, 5.0, 8.0, 2.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.12646484375, -0.12323760986328125, -0.1200103759765625, -0.11678314208984375, -0.113555908203125, -0.11032867431640625, -0.1071014404296875, -0.10387420654296875, -0.10064697265625, -0.09741973876953125, -0.0941925048828125, -0.09096527099609375, -0.087738037109375, -0.08451080322265625, -0.0812835693359375, -0.07805633544921875, -0.0748291015625, -0.07160186767578125, -0.0683746337890625, -0.06514739990234375, -0.061920166015625, -0.05869293212890625, -0.0554656982421875, -0.05223846435546875, -0.04901123046875, -0.04578399658203125, -0.0425567626953125, -0.03932952880859375, -0.036102294921875, -0.03287506103515625, -0.0296478271484375, -0.02642059326171875, -0.023193359375, -0.01996612548828125, -0.0167388916015625, -0.01351165771484375, -0.010284423828125, -0.00705718994140625, -0.0038299560546875, -0.00060272216796875, 0.00262451171875, 0.00585174560546875, 0.0090789794921875, 0.01230621337890625, 0.015533447265625, 0.01876068115234375, 0.0219879150390625, 0.02521514892578125, 0.0284423828125, 0.03166961669921875, 0.0348968505859375, 0.03812408447265625, 0.041351318359375, 0.04457855224609375, 0.0478057861328125, 0.05103302001953125, 0.05426025390625, 0.05748748779296875, 0.0607147216796875, 0.06394195556640625, 0.067169189453125, 0.07039642333984375, 0.0736236572265625, 0.07685089111328125, 0.080078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 6.0, 9.0, 10.0, 12.0, 25.0, 27.0, 48.0, 52.0, 64.0, 94.0, 169.0, 255.0, 452.0, 976.0, 2240.0, 5796.0, 18042.0, 62432.0, 231853.0, 850937.0, 1801944.0, 882783.0, 242035.0, 65099.0, 18627.0, 5951.0, 2185.0, 946.0, 439.0, 258.0, 148.0, 94.0, 59.0, 53.0, 43.0, 26.0, 16.0, 23.0, 15.0, 7.0, 6.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.22607421875, -0.2189006805419922, -0.21172714233398438, -0.20455360412597656, -0.19738006591796875, -0.19020652770996094, -0.18303298950195312, -0.1758594512939453, -0.1686859130859375, -0.1615123748779297, -0.15433883666992188, -0.14716529846191406, -0.13999176025390625, -0.13281822204589844, -0.12564468383789062, -0.11847114562988281, -0.111297607421875, -0.10412406921386719, -0.09695053100585938, -0.08977699279785156, -0.08260345458984375, -0.07542991638183594, -0.06825637817382812, -0.06108283996582031, -0.0539093017578125, -0.04673576354980469, -0.039562225341796875, -0.03238868713378906, -0.02521514892578125, -0.018041610717773438, -0.010868072509765625, -0.0036945343017578125, 0.00347900390625, 0.010652542114257812, 0.017826080322265625, 0.024999618530273438, 0.03217315673828125, 0.03934669494628906, 0.046520233154296875, 0.05369377136230469, 0.0608673095703125, 0.06804084777832031, 0.07521438598632812, 0.08238792419433594, 0.08956146240234375, 0.09673500061035156, 0.10390853881835938, 0.11108207702636719, 0.118255615234375, 0.1254291534423828, 0.13260269165039062, 0.13977622985839844, 0.14694976806640625, 0.15412330627441406, 0.16129684448242188, 0.1684703826904297, 0.1756439208984375, 0.1828174591064453, 0.18999099731445312, 0.19716453552246094, 0.20433807373046875, 0.21151161193847656, 0.21868515014648438, 0.2258586883544922, 0.2330322265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 10.0, 4.0, 7.0, 10.0, 10.0, 16.0, 15.0, 17.0, 24.0, 31.0, 46.0, 60.0, 62.0, 73.0, 98.0, 118.0, 162.0, 187.0, 216.0, 264.0, 299.0, 279.0, 317.0, 286.0, 264.0, 211.0, 172.0, 157.0, 123.0, 101.0, 88.0, 77.0, 52.0, 44.0, 42.0, 34.0, 25.0, 13.0, 19.0, 10.0, 5.0, 2.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.17578125, -0.17107009887695312, -0.16635894775390625, -0.16164779663085938, -0.1569366455078125, -0.15222549438476562, -0.14751434326171875, -0.14280319213867188, -0.138092041015625, -0.13338088989257812, -0.12866973876953125, -0.12395858764648438, -0.1192474365234375, -0.11453628540039062, -0.10982513427734375, -0.10511398315429688, -0.10040283203125, -0.09569168090820312, -0.09098052978515625, -0.08626937866210938, -0.0815582275390625, -0.07684707641601562, -0.07213592529296875, -0.06742477416992188, -0.062713623046875, -0.058002471923828125, -0.05329132080078125, -0.048580169677734375, -0.0438690185546875, -0.039157867431640625, -0.03444671630859375, -0.029735565185546875, -0.0250244140625, -0.020313262939453125, -0.01560211181640625, -0.010890960693359375, -0.0061798095703125, -0.001468658447265625, 0.00324249267578125, 0.007953643798828125, 0.012664794921875, 0.017375946044921875, 0.02208709716796875, 0.026798248291015625, 0.0315093994140625, 0.036220550537109375, 0.04093170166015625, 0.045642852783203125, 0.05035400390625, 0.055065155029296875, 0.05977630615234375, 0.06448745727539062, 0.0691986083984375, 0.07390975952148438, 0.07862091064453125, 0.08333206176757812, 0.088043212890625, 0.09275436401367188, 0.09746551513671875, 0.10217666625976562, 0.1068878173828125, 0.11159896850585938, 0.11631011962890625, 0.12102127075195312, 0.125732421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 14.0, 35.0, 48.0, 86.0, 164.0, 178.0, 204.0, 131.0, 75.0, 33.0, 19.0, 11.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.523817539215088, -1.4673365354537964, -1.4108556509017944, -1.354374647140503, -1.297893762588501, -1.2414127588272095, -1.184931755065918, -1.128450870513916, -1.071969985961914, -1.0154889822006226, -0.9590080976486206, -0.9025270938873291, -0.8460462093353271, -0.7895652055740356, -0.7330842614173889, -0.6766033172607422, -0.6201223134994507, -0.563641369342804, -0.5071604251861572, -0.4506794512271881, -0.3941985070705414, -0.33771756291389465, -0.28123658895492554, -0.2247556447982788, -0.16827470064163208, -0.11179374903440475, -0.05531279742717743, 0.0011681616306304932, 0.05764910578727722, 0.11413004994392395, 0.17061102390289307, 0.2270919680595398, 0.2835729122161865, 0.34005385637283325, 0.39653480052948, 0.4530157744884491, 0.5094966888427734, 0.5659776926040649, 0.6224586367607117, 0.6789395809173584, 0.7354205250740051, 0.7919014692306519, 0.8483824133872986, 0.9048633575439453, 0.9613443613052368, 1.0178252458572388, 1.0743062496185303, 1.1307871341705322, 1.1872681379318237, 1.2437491416931152, 1.3002300262451172, 1.3567110300064087, 1.4131919145584106, 1.4696729183197021, 1.526153802871704, 1.5826348066329956, 1.639115810394287, 1.6955968141555786, 1.7520776987075806, 1.808558702468872, 1.865039587020874, 1.9215205907821655, 1.978001594543457, 2.034482479095459, 2.090963363647461]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 12.0, 8.0, 11.0, 11.0, 13.0, 19.0, 27.0, 23.0, 28.0, 37.0, 33.0, 24.0, 43.0, 29.0, 45.0, 37.0, 29.0, 39.0, 40.0, 50.0, 41.0, 52.0, 30.0, 36.0, 35.0, 28.0, 23.0, 23.0, 21.0, 22.0, 12.0, 22.0, 21.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.695074737071991, -0.6724916100502014, -0.6499085426330566, -0.6273254156112671, -0.6047423481941223, -0.5821592211723328, -0.559576153755188, -0.5369930267333984, -0.5144098997116089, -0.4918268024921417, -0.46924370527267456, -0.446660578250885, -0.42407748103141785, -0.4014943838119507, -0.3789112865924835, -0.35632818937301636, -0.3337450921535492, -0.31116199493408203, -0.28857889771461487, -0.2659958004951477, -0.24341267347335815, -0.220829576253891, -0.19824647903442383, -0.17566336691379547, -0.1530802696943283, -0.13049717247486115, -0.10791406035423279, -0.08533096313476562, -0.06274785846471786, -0.040164753794670105, -0.017581656575202942, 0.005001455545425415, 0.027584552764892578, 0.05016765743494034, 0.0727507621049881, 0.09533385932445526, 0.11791696399450302, 0.14050006866455078, 0.16308316588401794, 0.1856662780046463, 0.20824937522411346, 0.23083247244358063, 0.253415584564209, 0.27599868178367615, 0.2985817790031433, 0.32116490602493286, 0.34374797344207764, 0.3663311004638672, 0.38891419768333435, 0.4114972949028015, 0.4340803921222687, 0.45666348934173584, 0.4792466163635254, 0.5018297433853149, 0.5244128108024597, 0.5469959378242493, 0.569579005241394, 0.5921621322631836, 0.6147451996803284, 0.6373283267021179, 0.6599113941192627, 0.6824945211410522, 0.7050776481628418, 0.7276607155799866, 0.7502438426017761]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 15.0, 18.0, 31.0, 51.0, 65.0, 107.0, 137.0, 305.0, 460.0, 891.0, 1584.0, 3183.0, 6110.0, 11627.0, 22612.0, 43356.0, 79786.0, 137362.0, 197771.0, 204773.0, 148467.0, 88430.0, 48365.0, 25408.0, 13147.0, 6704.0, 3608.0, 1804.0, 1000.0, 528.0, 310.0, 185.0, 110.0, 69.0, 49.0, 33.0, 24.0, 12.0, 10.0, 13.0, 3.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1893310546875, -0.1832408905029297, -0.17715072631835938, -0.17106056213378906, -0.16497039794921875, -0.15888023376464844, -0.15279006958007812, -0.1466999053955078, -0.1406097412109375, -0.1345195770263672, -0.12842941284179688, -0.12233924865722656, -0.11624908447265625, -0.11015892028808594, -0.10406875610351562, -0.09797859191894531, -0.091888427734375, -0.08579826354980469, -0.07970809936523438, -0.07361793518066406, -0.06752777099609375, -0.06143760681152344, -0.055347442626953125, -0.04925727844238281, -0.0431671142578125, -0.03707695007324219, -0.030986785888671875, -0.024896621704101562, -0.01880645751953125, -0.012716293334960938, -0.006626129150390625, -0.0005359649658203125, 0.00555419921875, 0.011644363403320312, 0.017734527587890625, 0.023824691772460938, 0.02991485595703125, 0.03600502014160156, 0.042095184326171875, 0.04818534851074219, 0.0542755126953125, 0.06036567687988281, 0.06645584106445312, 0.07254600524902344, 0.07863616943359375, 0.08472633361816406, 0.09081649780273438, 0.09690666198730469, 0.102996826171875, 0.10908699035644531, 0.11517715454101562, 0.12126731872558594, 0.12735748291015625, 0.13344764709472656, 0.13953781127929688, 0.1456279754638672, 0.1517181396484375, 0.1578083038330078, 0.16389846801757812, 0.16998863220214844, 0.17607879638671875, 0.18216896057128906, 0.18825912475585938, 0.1943492889404297, 0.200439453125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 11.0, 11.0, 11.0, 16.0, 20.0, 21.0, 36.0, 26.0, 39.0, 32.0, 45.0, 55.0, 47.0, 55.0, 65.0, 65.0, 51.0, 55.0, 44.0, 37.0, 35.0, 36.0, 33.0, 33.0, 31.0, 20.0, 13.0, 11.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1312255859375, -0.1279439926147461, -0.12466239929199219, -0.12138080596923828, -0.11809921264648438, -0.11481761932373047, -0.11153602600097656, -0.10825443267822266, -0.10497283935546875, -0.10169124603271484, -0.09840965270996094, -0.09512805938720703, -0.09184646606445312, -0.08856487274169922, -0.08528327941894531, -0.0820016860961914, -0.0787200927734375, -0.0754384994506836, -0.07215690612792969, -0.06887531280517578, -0.06559371948242188, -0.06231212615966797, -0.05903053283691406, -0.055748939514160156, -0.05246734619140625, -0.049185752868652344, -0.04590415954589844, -0.04262256622314453, -0.039340972900390625, -0.03605937957763672, -0.03277778625488281, -0.029496192932128906, -0.026214599609375, -0.022933006286621094, -0.019651412963867188, -0.01636981964111328, -0.013088226318359375, -0.009806632995605469, -0.0065250396728515625, -0.0032434463500976562, 3.814697265625e-05, 0.0033197402954101562, 0.0066013336181640625, 0.009882926940917969, 0.013164520263671875, 0.01644611358642578, 0.019727706909179688, 0.023009300231933594, 0.0262908935546875, 0.029572486877441406, 0.03285408020019531, 0.03613567352294922, 0.039417266845703125, 0.04269886016845703, 0.04598045349121094, 0.049262046813964844, 0.05254364013671875, 0.055825233459472656, 0.05910682678222656, 0.06238842010498047, 0.06567001342773438, 0.06895160675048828, 0.07223320007324219, 0.0755147933959961, 0.07879638671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 12.0, 27.0, 25.0, 38.0, 72.0, 74.0, 110.0, 158.0, 276.0, 400.0, 618.0, 959.0, 1677.0, 3017.0, 5428.0, 9451.0, 17431.0, 32669.0, 59130.0, 101178.0, 160085.0, 202781.0, 178547.0, 118694.0, 69085.0, 38832.0, 21293.0, 11756.0, 6279.0, 3379.0, 1979.0, 1105.0, 658.0, 416.0, 288.0, 158.0, 153.0, 88.0, 52.0, 35.0, 35.0, 21.0, 18.0, 7.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.2147216796875, -0.2081470489501953, -0.20157241821289062, -0.19499778747558594, -0.18842315673828125, -0.18184852600097656, -0.17527389526367188, -0.1686992645263672, -0.1621246337890625, -0.1555500030517578, -0.14897537231445312, -0.14240074157714844, -0.13582611083984375, -0.12925148010253906, -0.12267684936523438, -0.11610221862792969, -0.109527587890625, -0.10295295715332031, -0.09637832641601562, -0.08980369567871094, -0.08322906494140625, -0.07665443420410156, -0.07007980346679688, -0.06350517272949219, -0.0569305419921875, -0.05035591125488281, -0.043781280517578125, -0.03720664978027344, -0.03063201904296875, -0.024057388305664062, -0.017482757568359375, -0.010908126831054688, -0.00433349609375, 0.0022411346435546875, 0.008815765380859375, 0.015390396118164062, 0.02196502685546875, 0.028539657592773438, 0.035114288330078125, 0.04168891906738281, 0.0482635498046875, 0.05483818054199219, 0.061412811279296875, 0.06798744201660156, 0.07456207275390625, 0.08113670349121094, 0.08771133422851562, 0.09428596496582031, 0.100860595703125, 0.10743522644042969, 0.11400985717773438, 0.12058448791503906, 0.12715911865234375, 0.13373374938964844, 0.14030838012695312, 0.1468830108642578, 0.1534576416015625, 0.1600322723388672, 0.16660690307617188, 0.17318153381347656, 0.17975616455078125, 0.18633079528808594, 0.19290542602539062, 0.1994800567626953, 0.2060546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 11.0, 7.0, 8.0, 11.0, 12.0, 15.0, 20.0, 20.0, 23.0, 27.0, 28.0, 35.0, 27.0, 35.0, 34.0, 35.0, 47.0, 52.0, 46.0, 38.0, 49.0, 41.0, 41.0, 48.0, 34.0, 37.0, 29.0, 22.0, 23.0, 24.0, 17.0, 13.0, 15.0, 20.0, 13.0, 12.0, 3.0, 5.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.27685546875, -0.26931190490722656, -0.2617683410644531, -0.2542247772216797, -0.24668121337890625, -0.2391376495361328, -0.23159408569335938, -0.22405052185058594, -0.2165069580078125, -0.20896339416503906, -0.20141983032226562, -0.1938762664794922, -0.18633270263671875, -0.1787891387939453, -0.17124557495117188, -0.16370201110839844, -0.156158447265625, -0.14861488342285156, -0.14107131958007812, -0.1335277557373047, -0.12598419189453125, -0.11844062805175781, -0.11089706420898438, -0.10335350036621094, -0.0958099365234375, -0.08826637268066406, -0.08072280883789062, -0.07317924499511719, -0.06563568115234375, -0.05809211730957031, -0.050548553466796875, -0.04300498962402344, -0.03546142578125, -0.027917861938476562, -0.020374298095703125, -0.012830734252929688, -0.00528717041015625, 0.0022563934326171875, 0.009799957275390625, 0.017343521118164062, 0.0248870849609375, 0.03243064880371094, 0.039974212646484375, 0.04751777648925781, 0.05506134033203125, 0.06260490417480469, 0.07014846801757812, 0.07769203186035156, 0.085235595703125, 0.09277915954589844, 0.10032272338867188, 0.10786628723144531, 0.11540985107421875, 0.12295341491699219, 0.13049697875976562, 0.13804054260253906, 0.1455841064453125, 0.15312767028808594, 0.16067123413085938, 0.1682147979736328, 0.17575836181640625, 0.1833019256591797, 0.19084548950195312, 0.19838905334472656, 0.2059326171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 1.0, 8.0, 13.0, 17.0, 33.0, 54.0, 61.0, 91.0, 149.0, 243.0, 412.0, 743.0, 1494.0, 3306.0, 9560.0, 850603.0, 171118.0, 5603.0, 2433.0, 1104.0, 609.0, 323.0, 222.0, 105.0, 73.0, 42.0, 46.0, 24.0, 19.0, 10.0, 11.0, 10.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80810546875, -0.7826995849609375, -0.757293701171875, -0.7318878173828125, -0.70648193359375, -0.6810760498046875, -0.655670166015625, -0.6302642822265625, -0.6048583984375, -0.5794525146484375, -0.554046630859375, -0.5286407470703125, -0.50323486328125, -0.4778289794921875, -0.452423095703125, -0.4270172119140625, -0.401611328125, -0.3762054443359375, -0.350799560546875, -0.3253936767578125, -0.29998779296875, -0.2745819091796875, -0.249176025390625, -0.2237701416015625, -0.1983642578125, -0.1729583740234375, -0.147552490234375, -0.1221466064453125, -0.09674072265625, -0.0713348388671875, -0.045928955078125, -0.0205230712890625, 0.0048828125, 0.0302886962890625, 0.055694580078125, 0.0811004638671875, 0.10650634765625, 0.1319122314453125, 0.157318115234375, 0.1827239990234375, 0.2081298828125, 0.2335357666015625, 0.258941650390625, 0.2843475341796875, 0.30975341796875, 0.3351593017578125, 0.360565185546875, 0.3859710693359375, 0.411376953125, 0.4367828369140625, 0.462188720703125, 0.4875946044921875, 0.51300048828125, 0.5384063720703125, 0.563812255859375, 0.5892181396484375, 0.6146240234375, 0.6400299072265625, 0.665435791015625, 0.6908416748046875, 0.71624755859375, 0.7416534423828125, 0.767059326171875, 0.7924652099609375, 0.81787109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 55.0, 132.0, 330.0, 278.0, 115.0, 44.0, 16.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012314319610595703, -0.00012033339589834213, -0.00011752359569072723, -0.00011471379548311234, -0.00011190399527549744, -0.00010909419506788254, -0.00010628439486026764, -0.00010347459465265274, -0.00010066479444503784, -9.785499423742294e-05, -9.504519402980804e-05, -9.223539382219315e-05, -8.942559361457825e-05, -8.661579340696335e-05, -8.380599319934845e-05, -8.099619299173355e-05, -7.818639278411865e-05, -7.537659257650375e-05, -7.256679236888885e-05, -6.975699216127396e-05, -6.694719195365906e-05, -6.413739174604416e-05, -6.132759153842926e-05, -5.851779133081436e-05, -5.570799112319946e-05, -5.2898190915584564e-05, -5.0088390707969666e-05, -4.727859050035477e-05, -4.446879029273987e-05, -4.165899008512497e-05, -3.884918987751007e-05, -3.603938966989517e-05, -3.3229589462280273e-05, -3.0419789254665375e-05, -2.7609989047050476e-05, -2.4800188839435577e-05, -2.199038863182068e-05, -1.918058842420578e-05, -1.637078821659088e-05, -1.3560988008975983e-05, -1.0751187801361084e-05, -7.941387593746185e-06, -5.131587386131287e-06, -2.321787178516388e-06, 4.880130290985107e-07, 3.2978132367134094e-06, 6.107613444328308e-06, 8.917413651943207e-06, 1.1727213859558105e-05, 1.4537014067173004e-05, 1.7346814274787903e-05, 2.01566144824028e-05, 2.29664146900177e-05, 2.57762148976326e-05, 2.8586015105247498e-05, 3.1395815312862396e-05, 3.4205615520477295e-05, 3.7015415728092194e-05, 3.982521593570709e-05, 4.263501614332199e-05, 4.544481635093689e-05, 4.825461655855179e-05, 5.106441676616669e-05, 5.3874216973781586e-05, 5.6684017181396484e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 15.0, 21.0, 23.0, 45.0, 65.0, 81.0, 113.0, 182.0, 315.0, 480.0, 766.0, 1209.0, 2097.0, 3644.0, 6689.0, 12123.0, 22341.0, 39211.0, 67703.0, 108774.0, 152512.0, 174890.0, 160545.0, 117711.0, 75613.0, 44665.0, 24933.0, 13940.0, 7681.0, 4178.0, 2402.0, 1402.0, 788.0, 457.0, 302.0, 215.0, 130.0, 84.0, 64.0, 46.0, 24.0, 21.0, 11.0, 13.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.06219482421875, -0.06034421920776367, -0.058493614196777344, -0.056643009185791016, -0.05479240417480469, -0.05294179916381836, -0.05109119415283203, -0.0492405891418457, -0.047389984130859375, -0.04553937911987305, -0.04368877410888672, -0.04183816909790039, -0.03998756408691406, -0.038136959075927734, -0.036286354064941406, -0.03443574905395508, -0.03258514404296875, -0.030734539031982422, -0.028883934020996094, -0.027033329010009766, -0.025182723999023438, -0.02333211898803711, -0.02148151397705078, -0.019630908966064453, -0.017780303955078125, -0.015929698944091797, -0.014079093933105469, -0.01222848892211914, -0.010377883911132812, -0.008527278900146484, -0.006676673889160156, -0.004826068878173828, -0.0029754638671875, -0.0011248588562011719, 0.0007257461547851562, 0.0025763511657714844, 0.0044269561767578125, 0.006277561187744141, 0.008128166198730469, 0.009978771209716797, 0.011829376220703125, 0.013679981231689453, 0.015530586242675781, 0.01738119125366211, 0.019231796264648438, 0.021082401275634766, 0.022933006286621094, 0.024783611297607422, 0.02663421630859375, 0.028484821319580078, 0.030335426330566406, 0.032186031341552734, 0.03403663635253906, 0.03588724136352539, 0.03773784637451172, 0.03958845138549805, 0.041439056396484375, 0.0432896614074707, 0.04514026641845703, 0.04699087142944336, 0.04884147644042969, 0.050692081451416016, 0.052542686462402344, 0.05439329147338867, 0.056243896484375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 12.0, 16.0, 9.0, 20.0, 17.0, 36.0, 31.0, 25.0, 30.0, 31.0, 45.0, 47.0, 63.0, 41.0, 51.0, 65.0, 46.0, 47.0, 52.0, 49.0, 38.0, 27.0, 24.0, 33.0, 26.0, 26.0, 20.0, 16.0, 9.0, 14.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06103515625, -0.05908393859863281, -0.057132720947265625, -0.05518150329589844, -0.05323028564453125, -0.05127906799316406, -0.049327850341796875, -0.04737663269042969, -0.0454254150390625, -0.04347419738769531, -0.041522979736328125, -0.03957176208496094, -0.03762054443359375, -0.03566932678222656, -0.033718109130859375, -0.03176689147949219, -0.029815673828125, -0.027864456176757812, -0.025913238525390625, -0.023962020874023438, -0.02201080322265625, -0.020059585571289062, -0.018108367919921875, -0.016157150268554688, -0.0142059326171875, -0.012254714965820312, -0.010303497314453125, -0.008352279663085938, -0.00640106201171875, -0.0044498443603515625, -0.002498626708984375, -0.0005474090576171875, 0.00140380859375, 0.0033550262451171875, 0.005306243896484375, 0.0072574615478515625, 0.00920867919921875, 0.011159896850585938, 0.013111114501953125, 0.015062332153320312, 0.0170135498046875, 0.018964767456054688, 0.020915985107421875, 0.022867202758789062, 0.02481842041015625, 0.026769638061523438, 0.028720855712890625, 0.030672073364257812, 0.032623291015625, 0.03457450866699219, 0.036525726318359375, 0.03847694396972656, 0.04042816162109375, 0.04237937927246094, 0.044330596923828125, 0.04628181457519531, 0.0482330322265625, 0.05018424987792969, 0.052135467529296875, 0.05408668518066406, 0.05603790283203125, 0.05798912048339844, 0.059940338134765625, 0.06189155578613281, 0.0638427734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 12.0, 14.0, 45.0, 87.0, 150.0, 175.0, 199.0, 149.0, 95.0, 42.0, 19.0, 11.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8242602348327637, -1.7692161798477173, -1.7141720056533813, -1.659127950668335, -1.604083776473999, -1.5490397214889526, -1.4939955472946167, -1.4389514923095703, -1.3839073181152344, -1.328863263130188, -1.273819088935852, -1.2187750339508057, -1.1637308597564697, -1.1086868047714233, -1.0536426305770874, -0.998598575592041, -0.9435544610023499, -0.8885103464126587, -0.8334662318229675, -0.7784221172332764, -0.7233780026435852, -0.668333888053894, -0.6132898330688477, -0.5582456588745117, -0.5032016038894653, -0.44815748929977417, -0.393113374710083, -0.33806926012039185, -0.2830251455307007, -0.2279810607433319, -0.17293694615364075, -0.11789283156394958, -0.06284868717193604, -0.0078045763075351715, 0.04723953455686569, 0.10228364169597626, 0.15732775628566742, 0.2123718559741974, 0.26741597056388855, 0.3224600851535797, 0.3775041997432709, 0.43254831433296204, 0.4875924289226532, 0.542636513710022, 0.5976806282997131, 0.6527247428894043, 0.7077688574790955, 0.7628129720687866, 0.8178570866584778, 0.872901201248169, 0.9279453158378601, 0.9829894304275513, 1.0380334854125977, 1.0930776596069336, 1.14812171459198, 1.203165888786316, 1.2582099437713623, 1.3132539987564087, 1.3682981729507446, 1.423342227935791, 1.478386402130127, 1.5334304571151733, 1.5884746313095093, 1.6435186862945557, 1.6985628604888916]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 8.0, 2.0, 8.0, 10.0, 15.0, 18.0, 18.0, 22.0, 37.0, 22.0, 37.0, 40.0, 57.0, 59.0, 49.0, 59.0, 63.0, 50.0, 60.0, 70.0, 57.0, 36.0, 37.0, 29.0, 17.0, 32.0, 23.0, 17.0, 15.0, 14.0, 7.0, 4.0, 7.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.872351348400116, -0.8431990146636963, -0.8140467405319214, -0.7848944067955017, -0.7557421326637268, -0.7265897989273071, -0.6974375247955322, -0.6682851910591125, -0.6391328573226929, -0.6099805235862732, -0.5808282494544983, -0.5516759157180786, -0.5225236415863037, -0.49337130784988403, -0.46421900391578674, -0.43506669998168945, -0.40591442584991455, -0.37676212191581726, -0.34760981798171997, -0.3184574842453003, -0.2893052101135254, -0.2601528763771057, -0.23100057244300842, -0.20184826850891113, -0.17269596457481384, -0.14354366064071655, -0.11439134925603867, -0.08523903787136078, -0.05608673393726349, -0.0269344300031662, 0.002217888832092285, 0.031370192766189575, 0.060522496700286865, 0.08967480063438416, 0.11882711201906204, 0.14797942340373993, 0.17713172733783722, 0.2062840312719345, 0.235436350107193, 0.2645886540412903, 0.2937409579753876, 0.32289326190948486, 0.35204556584358215, 0.38119786977767944, 0.4103502035140991, 0.439502477645874, 0.4686548113822937, 0.497807115316391, 0.5269594192504883, 0.556111752986908, 0.5852640271186829, 0.6144163608551025, 0.6435686349868774, 0.6727209687232971, 0.7018733024597168, 0.7310255765914917, 0.7601778507232666, 0.7893301844596863, 0.8184824585914612, 0.8476347923278809, 0.8767870664596558, 0.9059394001960754, 0.9350917339324951, 0.96424400806427, 0.9933963418006897]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 18.0, 18.0, 14.0, 40.0, 54.0, 97.0, 125.0, 233.0, 508.0, 953.0, 2250.0, 5856.0, 18324.0, 70909.0, 413593.0, 2204838.0, 1246676.0, 174411.0, 37523.0, 10823.0, 3833.0, 1607.0, 641.0, 393.0, 216.0, 111.0, 59.0, 45.0, 30.0, 16.0, 18.0, 13.0, 5.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.21021080017089844, -0.20338058471679688, -0.1965503692626953, -0.18972015380859375, -0.1828899383544922, -0.17605972290039062, -0.16922950744628906, -0.1623992919921875, -0.15556907653808594, -0.14873886108398438, -0.1419086456298828, -0.13507843017578125, -0.1282482147216797, -0.12141799926757812, -0.11458778381347656, -0.107757568359375, -0.10092735290527344, -0.09409713745117188, -0.08726692199707031, -0.08043670654296875, -0.07360649108886719, -0.06677627563476562, -0.05994606018066406, -0.0531158447265625, -0.04628562927246094, -0.039455413818359375, -0.03262519836425781, -0.02579498291015625, -0.018964767456054688, -0.012134552001953125, -0.0053043365478515625, 0.00152587890625, 0.008356094360351562, 0.015186309814453125, 0.022016525268554688, 0.02884674072265625, 0.03567695617675781, 0.042507171630859375, 0.04933738708496094, 0.0561676025390625, 0.06299781799316406, 0.06982803344726562, 0.07665824890136719, 0.08348846435546875, 0.09031867980957031, 0.09714889526367188, 0.10397911071777344, 0.110809326171875, 0.11763954162597656, 0.12446975708007812, 0.1312999725341797, 0.13813018798828125, 0.1449604034423828, 0.15179061889648438, 0.15862083435058594, 0.1654510498046875, 0.17228126525878906, 0.17911148071289062, 0.1859416961669922, 0.19277191162109375, 0.1996021270751953, 0.20643234252929688, 0.21326255798339844, 0.2200927734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 16.0, 19.0, 22.0, 18.0, 28.0, 39.0, 34.0, 46.0, 56.0, 58.0, 61.0, 52.0, 60.0, 69.0, 47.0, 48.0, 45.0, 44.0, 34.0, 30.0, 23.0, 35.0, 18.0, 23.0, 16.0, 6.0, 9.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1263427734375, -0.12254047393798828, -0.11873817443847656, -0.11493587493896484, -0.11113357543945312, -0.1073312759399414, -0.10352897644042969, -0.09972667694091797, -0.09592437744140625, -0.09212207794189453, -0.08831977844238281, -0.0845174789428711, -0.08071517944335938, -0.07691287994384766, -0.07311058044433594, -0.06930828094482422, -0.0655059814453125, -0.06170368194580078, -0.05790138244628906, -0.054099082946777344, -0.050296783447265625, -0.046494483947753906, -0.04269218444824219, -0.03888988494873047, -0.03508758544921875, -0.03128528594970703, -0.027482986450195312, -0.023680686950683594, -0.019878387451171875, -0.016076087951660156, -0.012273788452148438, -0.008471488952636719, -0.004669189453125, -0.0008668899536132812, 0.0029354095458984375, 0.006737709045410156, 0.010540008544921875, 0.014342308044433594, 0.018144607543945312, 0.02194690704345703, 0.02574920654296875, 0.02955150604248047, 0.03335380554199219, 0.037156105041503906, 0.040958404541015625, 0.044760704040527344, 0.04856300354003906, 0.05236530303955078, 0.0561676025390625, 0.05996990203857422, 0.06377220153808594, 0.06757450103759766, 0.07137680053710938, 0.0751791000366211, 0.07898139953613281, 0.08278369903564453, 0.08658599853515625, 0.09038829803466797, 0.09419059753417969, 0.0979928970336914, 0.10179519653320312, 0.10559749603271484, 0.10939979553222656, 0.11320209503173828, 0.11700439453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 11.0, 10.0, 21.0, 36.0, 55.0, 69.0, 117.0, 209.0, 389.0, 1156.0, 4028.0, 18431.0, 105960.0, 687084.0, 2429976.0, 796690.0, 122236.0, 20994.0, 4542.0, 1270.0, 446.0, 212.0, 120.0, 80.0, 50.0, 31.0, 20.0, 7.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.365234375, -0.35599708557128906, -0.3467597961425781, -0.3375225067138672, -0.32828521728515625, -0.3190479278564453, -0.3098106384277344, -0.30057334899902344, -0.2913360595703125, -0.28209877014160156, -0.2728614807128906, -0.2636241912841797, -0.25438690185546875, -0.2451496124267578, -0.23591232299804688, -0.22667503356933594, -0.217437744140625, -0.20820045471191406, -0.19896316528320312, -0.1897258758544922, -0.18048858642578125, -0.1712512969970703, -0.16201400756835938, -0.15277671813964844, -0.1435394287109375, -0.13430213928222656, -0.12506484985351562, -0.11582756042480469, -0.10659027099609375, -0.09735298156738281, -0.08811569213867188, -0.07887840270996094, -0.06964111328125, -0.06040382385253906, -0.051166534423828125, -0.04192924499511719, -0.03269195556640625, -0.023454666137695312, -0.014217376708984375, -0.0049800872802734375, 0.0042572021484375, 0.013494491577148438, 0.022731781005859375, 0.03196907043457031, 0.04120635986328125, 0.05044364929199219, 0.059680938720703125, 0.06891822814941406, 0.078155517578125, 0.08739280700683594, 0.09663009643554688, 0.10586738586425781, 0.11510467529296875, 0.12434196472167969, 0.13357925415039062, 0.14281654357910156, 0.1520538330078125, 0.16129112243652344, 0.17052841186523438, 0.1797657012939453, 0.18900299072265625, 0.1982402801513672, 0.20747756958007812, 0.21671485900878906, 0.2259521484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 14.0, 23.0, 25.0, 26.0, 42.0, 54.0, 54.0, 75.0, 92.0, 122.0, 130.0, 196.0, 246.0, 294.0, 337.0, 361.0, 351.0, 292.0, 253.0, 209.0, 169.0, 132.0, 138.0, 80.0, 78.0, 56.0, 46.0, 34.0, 34.0, 23.0, 17.0, 10.0, 8.0, 11.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1461181640625, -0.1413555145263672, -0.13659286499023438, -0.13183021545410156, -0.12706756591796875, -0.12230491638183594, -0.11754226684570312, -0.11277961730957031, -0.1080169677734375, -0.10325431823730469, -0.09849166870117188, -0.09372901916503906, -0.08896636962890625, -0.08420372009277344, -0.07944107055664062, -0.07467842102050781, -0.069915771484375, -0.06515312194824219, -0.060390472412109375, -0.05562782287597656, -0.05086517333984375, -0.04610252380371094, -0.041339874267578125, -0.03657722473144531, -0.0318145751953125, -0.027051925659179688, -0.022289276123046875, -0.017526626586914062, -0.01276397705078125, -0.008001327514648438, -0.003238677978515625, 0.0015239715576171875, 0.00628662109375, 0.011049270629882812, 0.015811920166015625, 0.020574569702148438, 0.02533721923828125, 0.030099868774414062, 0.034862518310546875, 0.03962516784667969, 0.0443878173828125, 0.04915046691894531, 0.053913116455078125, 0.05867576599121094, 0.06343841552734375, 0.06820106506347656, 0.07296371459960938, 0.07772636413574219, 0.082489013671875, 0.08725166320800781, 0.09201431274414062, 0.09677696228027344, 0.10153961181640625, 0.10630226135253906, 0.11106491088867188, 0.11582756042480469, 0.1205902099609375, 0.1253528594970703, 0.13011550903320312, 0.13487815856933594, 0.13964080810546875, 0.14440345764160156, 0.14916610717773438, 0.1539287567138672, 0.15869140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 9.0, 14.0, 26.0, 38.0, 47.0, 66.0, 69.0, 66.0, 95.0, 66.0, 89.0, 74.0, 76.0, 57.0, 44.0, 42.0, 11.0, 20.0, 31.0, 13.0, 8.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7011125087738037, -0.6788405179977417, -0.6565684676170349, -0.6342964768409729, -0.6120244264602661, -0.5897524356842041, -0.5674804449081421, -0.5452084541320801, -0.5229364037513733, -0.5006644129753113, -0.4783923625946045, -0.4561203718185425, -0.4338483512401581, -0.4115763306617737, -0.38930433988571167, -0.36703231930732727, -0.34476029872894287, -0.32248827815055847, -0.3002162575721741, -0.27794426679611206, -0.25567224621772766, -0.23340022563934326, -0.21112821996212006, -0.18885621428489685, -0.16658419370651245, -0.14431217312812805, -0.12204016745090485, -0.09976815432310104, -0.07749614119529724, -0.05522412806749344, -0.032952114939689636, -0.01068010926246643, 0.011591911315917969, 0.03386392444372177, 0.056135937571525574, 0.07840795069932938, 0.10067996382713318, 0.12295197695493698, 0.14522399008274078, 0.167495995759964, 0.1897680163383484, 0.2120400369167328, 0.234312042593956, 0.2565840482711792, 0.2788560688495636, 0.301128089427948, 0.32340008020401, 0.3456721007823944, 0.3679441213607788, 0.3902161419391632, 0.4124881625175476, 0.4347601532936096, 0.457032173871994, 0.4793041944503784, 0.5015761852264404, 0.5238481760025024, 0.5461202263832092, 0.5683922171592712, 0.590664267539978, 0.61293625831604, 0.635208249092102, 0.6574802994728088, 0.6797522902488708, 0.7020243406295776, 0.7242963314056396]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 10.0, 10.0, 8.0, 16.0, 13.0, 18.0, 22.0, 28.0, 18.0, 30.0, 26.0, 32.0, 29.0, 30.0, 47.0, 34.0, 32.0, 44.0, 42.0, 36.0, 38.0, 41.0, 30.0, 40.0, 29.0, 35.0, 17.0, 28.0, 27.0, 20.0, 40.0, 21.0, 13.0, 17.0, 9.0, 10.0, 10.0, 7.0, 9.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5093606114387512, -0.49331536889076233, -0.47727009654045105, -0.46122485399246216, -0.4451795816421509, -0.429134339094162, -0.4130890965461731, -0.3970438241958618, -0.3809985816478729, -0.36495333909988403, -0.34890806674957275, -0.33286282420158386, -0.31681758165359497, -0.3007723093032837, -0.2847270667552948, -0.2686818242073059, -0.25263655185699463, -0.23659129440784454, -0.22054603695869446, -0.20450079441070557, -0.18845553696155548, -0.1724102795124054, -0.1563650369644165, -0.14031977951526642, -0.12427452206611633, -0.10822926461696625, -0.09218401461839676, -0.07613876461982727, -0.060093507170677185, -0.0440482497215271, -0.02800299972295761, -0.011957749724388123, 0.004087507724761963, 0.02013276144862175, 0.03617801517248154, 0.052223268896341324, 0.06826852262020111, 0.0843137800693512, 0.10035903006792068, 0.11640428006649017, 0.13244953751564026, 0.14849479496479034, 0.16454005241394043, 0.18058529496192932, 0.1966305524110794, 0.2126758098602295, 0.22872105240821838, 0.24476630985736847, 0.26081156730651855, 0.27685680985450745, 0.2929020822048187, 0.3089473247528076, 0.3249925971031189, 0.3410378396511078, 0.3570830821990967, 0.37312835454940796, 0.38917359709739685, 0.40521883964538574, 0.421264111995697, 0.4373093545436859, 0.4533545970916748, 0.4693998694419861, 0.485445111989975, 0.5014903545379639, 0.5175356268882751]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 9.0, 14.0, 24.0, 34.0, 34.0, 47.0, 65.0, 147.0, 296.0, 438.0, 811.0, 1600.0, 2880.0, 5545.0, 10803.0, 21478.0, 42861.0, 86249.0, 159114.0, 226860.0, 212335.0, 135383.0, 70395.0, 35000.0, 17357.0, 8979.0, 4450.0, 2366.0, 1291.0, 703.0, 404.0, 236.0, 140.0, 79.0, 41.0, 25.0, 18.0, 11.0, 8.0, 4.0, 4.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.218017578125, -0.21071434020996094, -0.20341110229492188, -0.1961078643798828, -0.18880462646484375, -0.1815013885498047, -0.17419815063476562, -0.16689491271972656, -0.1595916748046875, -0.15228843688964844, -0.14498519897460938, -0.1376819610595703, -0.13037872314453125, -0.12307548522949219, -0.11577224731445312, -0.10846900939941406, -0.101165771484375, -0.09386253356933594, -0.08655929565429688, -0.07925605773925781, -0.07195281982421875, -0.06464958190917969, -0.057346343994140625, -0.05004310607910156, -0.0427398681640625, -0.03543663024902344, -0.028133392333984375, -0.020830154418945312, -0.01352691650390625, -0.0062236785888671875, 0.001079559326171875, 0.008382797241210938, 0.01568603515625, 0.022989273071289062, 0.030292510986328125, 0.03759574890136719, 0.04489898681640625, 0.05220222473144531, 0.059505462646484375, 0.06680870056152344, 0.0741119384765625, 0.08141517639160156, 0.08871841430664062, 0.09602165222167969, 0.10332489013671875, 0.11062812805175781, 0.11793136596679688, 0.12523460388183594, 0.132537841796875, 0.13984107971191406, 0.14714431762695312, 0.1544475555419922, 0.16175079345703125, 0.1690540313720703, 0.17635726928710938, 0.18366050720214844, 0.1909637451171875, 0.19826698303222656, 0.20557022094726562, 0.2128734588623047, 0.22017669677734375, 0.2274799346923828, 0.23478317260742188, 0.24208641052246094, 0.2493896484375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 11.0, 10.0, 11.0, 6.0, 17.0, 20.0, 27.0, 40.0, 37.0, 42.0, 53.0, 70.0, 55.0, 54.0, 57.0, 62.0, 63.0, 66.0, 45.0, 41.0, 37.0, 33.0, 34.0, 27.0, 23.0, 21.0, 13.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.13524341583251953, -0.13144874572753906, -0.1276540756225586, -0.12385940551757812, -0.12006473541259766, -0.11627006530761719, -0.11247539520263672, -0.10868072509765625, -0.10488605499267578, -0.10109138488769531, -0.09729671478271484, -0.09350204467773438, -0.0897073745727539, -0.08591270446777344, -0.08211803436279297, -0.0783233642578125, -0.07452869415283203, -0.07073402404785156, -0.0669393539428711, -0.06314468383789062, -0.059350013732910156, -0.05555534362792969, -0.05176067352294922, -0.04796600341796875, -0.04417133331298828, -0.04037666320800781, -0.036581993103027344, -0.032787322998046875, -0.028992652893066406, -0.025197982788085938, -0.02140331268310547, -0.017608642578125, -0.013813972473144531, -0.010019302368164062, -0.006224632263183594, -0.002429962158203125, 0.0013647079467773438, 0.0051593780517578125, 0.008954048156738281, 0.01274871826171875, 0.01654338836669922, 0.020338058471679688, 0.024132728576660156, 0.027927398681640625, 0.031722068786621094, 0.03551673889160156, 0.03931140899658203, 0.0431060791015625, 0.04690074920654297, 0.05069541931152344, 0.054490089416503906, 0.058284759521484375, 0.062079429626464844, 0.06587409973144531, 0.06966876983642578, 0.07346343994140625, 0.07725811004638672, 0.08105278015136719, 0.08484745025634766, 0.08864212036132812, 0.0924367904663086, 0.09623146057128906, 0.10002613067626953, 0.10382080078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 15.0, 16.0, 23.0, 64.0, 58.0, 83.0, 106.0, 156.0, 261.0, 399.0, 650.0, 1143.0, 2197.0, 4363.0, 9099.0, 19435.0, 41104.0, 84359.0, 152733.0, 219157.0, 214973.0, 145535.0, 78701.0, 38564.0, 17791.0, 8497.0, 4082.0, 2087.0, 1134.0, 600.0, 356.0, 231.0, 181.0, 109.0, 79.0, 61.0, 43.0, 26.0, 18.0, 18.0, 11.0, 9.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2178955078125, -0.21085548400878906, -0.20381546020507812, -0.1967754364013672, -0.18973541259765625, -0.1826953887939453, -0.17565536499023438, -0.16861534118652344, -0.1615753173828125, -0.15453529357910156, -0.14749526977539062, -0.1404552459716797, -0.13341522216796875, -0.1263751983642578, -0.11933517456054688, -0.11229515075683594, -0.105255126953125, -0.09821510314941406, -0.09117507934570312, -0.08413505554199219, -0.07709503173828125, -0.07005500793457031, -0.06301498413085938, -0.05597496032714844, -0.0489349365234375, -0.04189491271972656, -0.034854888916015625, -0.027814865112304688, -0.02077484130859375, -0.013734817504882812, -0.006694793701171875, 0.0003452301025390625, 0.00738525390625, 0.014425277709960938, 0.021465301513671875, 0.028505325317382812, 0.03554534912109375, 0.04258537292480469, 0.049625396728515625, 0.05666542053222656, 0.0637054443359375, 0.07074546813964844, 0.07778549194335938, 0.08482551574707031, 0.09186553955078125, 0.09890556335449219, 0.10594558715820312, 0.11298561096191406, 0.120025634765625, 0.12706565856933594, 0.13410568237304688, 0.1411457061767578, 0.14818572998046875, 0.1552257537841797, 0.16226577758789062, 0.16930580139160156, 0.1763458251953125, 0.18338584899902344, 0.19042587280273438, 0.1974658966064453, 0.20450592041015625, 0.2115459442138672, 0.21858596801757812, 0.22562599182128906, 0.232666015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 5.0, 10.0, 14.0, 7.0, 8.0, 26.0, 13.0, 22.0, 25.0, 28.0, 22.0, 26.0, 27.0, 40.0, 28.0, 24.0, 46.0, 38.0, 39.0, 36.0, 36.0, 39.0, 56.0, 36.0, 31.0, 43.0, 41.0, 30.0, 32.0, 19.0, 19.0, 23.0, 10.0, 13.0, 10.0, 16.0, 10.0, 9.0, 14.0, 5.0, 1.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.21048736572265625, -0.2033233642578125, -0.19615936279296875, -0.188995361328125, -0.18183135986328125, -0.1746673583984375, -0.16750335693359375, -0.16033935546875, -0.15317535400390625, -0.1460113525390625, -0.13884735107421875, -0.131683349609375, -0.12451934814453125, -0.1173553466796875, -0.11019134521484375, -0.10302734375, -0.09586334228515625, -0.0886993408203125, -0.08153533935546875, -0.074371337890625, -0.06720733642578125, -0.0600433349609375, -0.05287933349609375, -0.04571533203125, -0.03855133056640625, -0.0313873291015625, -0.02422332763671875, -0.017059326171875, -0.00989532470703125, -0.0027313232421875, 0.00443267822265625, 0.0115966796875, 0.01876068115234375, 0.0259246826171875, 0.03308868408203125, 0.040252685546875, 0.04741668701171875, 0.0545806884765625, 0.06174468994140625, 0.06890869140625, 0.07607269287109375, 0.0832366943359375, 0.09040069580078125, 0.097564697265625, 0.10472869873046875, 0.1118927001953125, 0.11905670166015625, 0.126220703125, 0.13338470458984375, 0.1405487060546875, 0.14771270751953125, 0.154876708984375, 0.16204071044921875, 0.1692047119140625, 0.17636871337890625, 0.18353271484375, 0.19069671630859375, 0.1978607177734375, 0.20502471923828125, 0.212188720703125, 0.21935272216796875, 0.2265167236328125, 0.23368072509765625, 0.2408447265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 9.0, 21.0, 33.0, 73.0, 144.0, 472.0, 1819.0, 9435.0, 71095.0, 461240.0, 430736.0, 62457.0, 8602.0, 1675.0, 439.0, 161.0, 57.0, 34.0, 22.0, 13.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2364501953125, -0.23038291931152344, -0.22431564331054688, -0.2182483673095703, -0.21218109130859375, -0.2061138153076172, -0.20004653930664062, -0.19397926330566406, -0.1879119873046875, -0.18184471130371094, -0.17577743530273438, -0.1697101593017578, -0.16364288330078125, -0.1575756072998047, -0.15150833129882812, -0.14544105529785156, -0.139373779296875, -0.13330650329589844, -0.12723922729492188, -0.12117195129394531, -0.11510467529296875, -0.10903739929199219, -0.10297012329101562, -0.09690284729003906, -0.0908355712890625, -0.08476829528808594, -0.07870101928710938, -0.07263374328613281, -0.06656646728515625, -0.06049919128417969, -0.054431915283203125, -0.04836463928222656, -0.04229736328125, -0.03623008728027344, -0.030162811279296875, -0.024095535278320312, -0.01802825927734375, -0.011960983276367188, -0.005893707275390625, 0.0001735687255859375, 0.0062408447265625, 0.012308120727539062, 0.018375396728515625, 0.024442672729492188, 0.03050994873046875, 0.03657722473144531, 0.042644500732421875, 0.04871177673339844, 0.054779052734375, 0.06084632873535156, 0.06691360473632812, 0.07298088073730469, 0.07904815673828125, 0.08511543273925781, 0.09118270874023438, 0.09724998474121094, 0.1033172607421875, 0.10938453674316406, 0.11545181274414062, 0.12151908874511719, 0.12758636474609375, 0.1336536407470703, 0.13972091674804688, 0.14578819274902344, 0.15185546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 5.0, 7.0, 13.0, 14.0, 21.0, 17.0, 28.0, 34.0, 36.0, 54.0, 54.0, 79.0, 84.0, 76.0, 83.0, 57.0, 59.0, 54.0, 41.0, 40.0, 34.0, 25.0, 21.0, 14.0, 9.0, 9.0, 2.0, 5.0, 5.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6987323760986328e-05, -1.644343137741089e-05, -1.589953899383545e-05, -1.535564661026001e-05, -1.481175422668457e-05, -1.4267861843109131e-05, -1.3723969459533691e-05, -1.3180077075958252e-05, -1.2636184692382812e-05, -1.2092292308807373e-05, -1.1548399925231934e-05, -1.1004507541656494e-05, -1.0460615158081055e-05, -9.916722774505615e-06, -9.372830390930176e-06, -8.828938007354736e-06, -8.285045623779297e-06, -7.741153240203857e-06, -7.197260856628418e-06, -6.6533684730529785e-06, -6.109476089477539e-06, -5.5655837059021e-06, -5.02169132232666e-06, -4.477798938751221e-06, -3.933906555175781e-06, -3.390014171600342e-06, -2.8461217880249023e-06, -2.302229404449463e-06, -1.7583370208740234e-06, -1.214444637298584e-06, -6.705522537231445e-07, -1.2665987014770508e-07, 4.172325134277344e-07, 9.611248970031738e-07, 1.5050172805786133e-06, 2.0489096641540527e-06, 2.592802047729492e-06, 3.1366944313049316e-06, 3.680586814880371e-06, 4.2244791984558105e-06, 4.76837158203125e-06, 5.3122639656066895e-06, 5.856156349182129e-06, 6.400048732757568e-06, 6.943941116333008e-06, 7.487833499908447e-06, 8.031725883483887e-06, 8.575618267059326e-06, 9.119510650634766e-06, 9.663403034210205e-06, 1.0207295417785645e-05, 1.0751187801361084e-05, 1.1295080184936523e-05, 1.1838972568511963e-05, 1.2382864952087402e-05, 1.2926757335662842e-05, 1.3470649719238281e-05, 1.401454210281372e-05, 1.455843448638916e-05, 1.51023268699646e-05, 1.564621925354004e-05, 1.619011163711548e-05, 1.6734004020690918e-05, 1.7277896404266357e-05, 1.7821788787841797e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 8.0, 9.0, 8.0, 18.0, 24.0, 34.0, 47.0, 84.0, 112.0, 204.0, 339.0, 701.0, 1642.0, 4509.0, 13865.0, 48107.0, 170640.0, 383303.0, 290514.0, 94619.0, 26658.0, 8056.0, 2769.0, 1096.0, 499.0, 277.0, 150.0, 84.0, 68.0, 25.0, 23.0, 19.0, 16.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10357666015625, -0.0999755859375, -0.09637451171875, -0.0927734375, -0.08917236328125, -0.0855712890625, -0.08197021484375, -0.078369140625, -0.07476806640625, -0.0711669921875, -0.06756591796875, -0.06396484375, -0.06036376953125, -0.0567626953125, -0.05316162109375, -0.049560546875, -0.04595947265625, -0.0423583984375, -0.03875732421875, -0.03515625, -0.03155517578125, -0.0279541015625, -0.02435302734375, -0.020751953125, -0.01715087890625, -0.0135498046875, -0.00994873046875, -0.00634765625, -0.00274658203125, 0.0008544921875, 0.00445556640625, 0.008056640625, 0.01165771484375, 0.0152587890625, 0.01885986328125, 0.0224609375, 0.02606201171875, 0.0296630859375, 0.03326416015625, 0.036865234375, 0.04046630859375, 0.0440673828125, 0.04766845703125, 0.05126953125, 0.05487060546875, 0.0584716796875, 0.06207275390625, 0.065673828125, 0.06927490234375, 0.0728759765625, 0.07647705078125, 0.080078125, 0.08367919921875, 0.0872802734375, 0.09088134765625, 0.094482421875, 0.09808349609375, 0.1016845703125, 0.10528564453125, 0.10888671875, 0.11248779296875, 0.1160888671875, 0.11968994140625, 0.123291015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 6.0, 8.0, 8.0, 17.0, 24.0, 24.0, 40.0, 38.0, 46.0, 73.0, 99.0, 102.0, 96.0, 97.0, 73.0, 72.0, 47.0, 42.0, 31.0, 27.0, 8.0, 11.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0], "bins": [-0.142822265625, -0.13979053497314453, -0.13675880432128906, -0.1337270736694336, -0.13069534301757812, -0.12766361236572266, -0.12463188171386719, -0.12160015106201172, -0.11856842041015625, -0.11553668975830078, -0.11250495910644531, -0.10947322845458984, -0.10644149780273438, -0.1034097671508789, -0.10037803649902344, -0.09734630584716797, -0.0943145751953125, -0.09128284454345703, -0.08825111389160156, -0.0852193832397461, -0.08218765258789062, -0.07915592193603516, -0.07612419128417969, -0.07309246063232422, -0.07006072998046875, -0.06702899932861328, -0.06399726867675781, -0.060965538024902344, -0.057933807373046875, -0.054902076721191406, -0.05187034606933594, -0.04883861541748047, -0.045806884765625, -0.04277515411376953, -0.03974342346191406, -0.036711692810058594, -0.033679962158203125, -0.030648231506347656, -0.027616500854492188, -0.02458477020263672, -0.02155303955078125, -0.01852130889892578, -0.015489578247070312, -0.012457847595214844, -0.009426116943359375, -0.006394386291503906, -0.0033626556396484375, -0.00033092498779296875, 0.0027008056640625, 0.005732536315917969, 0.008764266967773438, 0.011795997619628906, 0.014827728271484375, 0.017859458923339844, 0.020891189575195312, 0.02392292022705078, 0.02695465087890625, 0.02998638153076172, 0.03301811218261719, 0.036049842834472656, 0.039081573486328125, 0.042113304138183594, 0.04514503479003906, 0.04817676544189453, 0.05120849609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 6.0, 19.0, 50.0, 106.0, 209.0, 254.0, 199.0, 89.0, 44.0, 19.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.942764401435852, -1.871865153312683, -1.8009659051895142, -1.7300666570663452, -1.6591674089431763, -1.5882681608200073, -1.5173687934875488, -1.4464695453643799, -1.375570297241211, -1.304671049118042, -1.233771800994873, -1.162872552871704, -1.0919733047485352, -1.0210740566253662, -0.9501747488975525, -0.8792755007743835, -0.8083763122558594, -0.7374770641326904, -0.6665778160095215, -0.5956785678863525, -0.5247793197631836, -0.45388004183769226, -0.3829807639122009, -0.312081515789032, -0.24118226766586304, -0.1702830195426941, -0.09938375651836395, -0.028484493494033813, 0.04241475462913513, 0.11331400275230408, 0.1842132806777954, 0.25511252880096436, 0.32601189613342285, 0.3969111442565918, 0.46781039237976074, 0.5387096405029297, 0.6096088886260986, 0.6805081367492676, 0.7514074444770813, 0.8223066926002502, 0.8932059407234192, 0.9641051888465881, 1.0350044965744019, 1.1059037446975708, 1.1768029928207397, 1.2477022409439087, 1.3186014890670776, 1.3895007371902466, 1.4603999853134155, 1.5312992334365845, 1.6021984815597534, 1.6730977296829224, 1.7439969778060913, 1.8148962259292603, 1.8857955932617188, 1.9566948413848877, 2.0275940895080566, 2.0984933376312256, 2.1693925857543945, 2.2402918338775635, 2.3111910820007324, 2.3820903301239014, 2.4529895782470703, 2.5238888263702393, 2.594788074493408]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 15.0, 19.0, 18.0, 25.0, 20.0, 27.0, 21.0, 25.0, 37.0, 39.0, 41.0, 54.0, 43.0, 30.0, 40.0, 56.0, 37.0, 38.0, 45.0, 37.0, 43.0, 49.0, 36.0, 26.0, 28.0, 21.0, 23.0, 26.0, 22.0, 8.0, 10.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.915500819683075, -0.891193151473999, -0.8668854236602783, -0.8425776958465576, -0.8182700276374817, -0.7939623594284058, -0.7696546316146851, -0.7453469038009644, -0.7210392355918884, -0.6967315673828125, -0.6724238395690918, -0.6481161117553711, -0.6238084435462952, -0.5995007753372192, -0.5751930475234985, -0.5508853197097778, -0.5265776515007019, -0.502269983291626, -0.4779622554779053, -0.45365455746650696, -0.42934685945510864, -0.4050391614437103, -0.380731463432312, -0.3564237654209137, -0.3321160674095154, -0.30780836939811707, -0.28350067138671875, -0.25919297337532043, -0.23488527536392212, -0.2105775773525238, -0.1862698793411255, -0.16196218132972717, -0.13765442371368408, -0.11334672570228577, -0.08903902769088745, -0.06473132967948914, -0.04042363166809082, -0.016115933656692505, 0.00819176435470581, 0.032499462366104126, 0.05680716037750244, 0.08111485838890076, 0.10542255640029907, 0.1297302544116974, 0.1540379524230957, 0.17834565043449402, 0.20265334844589233, 0.22696104645729065, 0.25126874446868896, 0.2755764424800873, 0.2998841404914856, 0.3241918385028839, 0.3484995365142822, 0.37280723452568054, 0.39711493253707886, 0.4214226305484772, 0.4457303285598755, 0.4700380265712738, 0.4943457245826721, 0.518653392791748, 0.5429611206054688, 0.5672688484191895, 0.5915765166282654, 0.6158841848373413, 0.640191912651062]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 14.0, 13.0, 17.0, 33.0, 60.0, 132.0, 224.0, 387.0, 682.0, 1366.0, 2786.0, 5960.0, 13984.0, 35361.0, 104623.0, 413836.0, 1643286.0, 1481357.0, 344960.0, 90955.0, 31392.0, 12409.0, 5436.0, 2463.0, 1201.0, 620.0, 351.0, 161.0, 92.0, 49.0, 36.0, 14.0, 5.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.2193603515625, -0.21413040161132812, -0.20890045166015625, -0.20367050170898438, -0.1984405517578125, -0.19321060180664062, -0.18798065185546875, -0.18275070190429688, -0.177520751953125, -0.17229080200195312, -0.16706085205078125, -0.16183090209960938, -0.1566009521484375, -0.15137100219726562, -0.14614105224609375, -0.14091110229492188, -0.13568115234375, -0.13045120239257812, -0.12522125244140625, -0.11999130249023438, -0.1147613525390625, -0.10953140258789062, -0.10430145263671875, -0.09907150268554688, -0.093841552734375, -0.08861160278320312, -0.08338165283203125, -0.07815170288085938, -0.0729217529296875, -0.06769180297851562, -0.06246185302734375, -0.057231903076171875, -0.052001953125, -0.046772003173828125, -0.04154205322265625, -0.036312103271484375, -0.0310821533203125, -0.025852203369140625, -0.02062225341796875, -0.015392303466796875, -0.010162353515625, -0.004932403564453125, 0.00029754638671875, 0.005527496337890625, 0.0107574462890625, 0.015987396240234375, 0.02121734619140625, 0.026447296142578125, 0.03167724609375, 0.036907196044921875, 0.04213714599609375, 0.047367095947265625, 0.0525970458984375, 0.057826995849609375, 0.06305694580078125, 0.06828689575195312, 0.073516845703125, 0.07874679565429688, 0.08397674560546875, 0.08920669555664062, 0.0944366455078125, 0.09966659545898438, 0.10489654541015625, 0.11012649536132812, 0.1153564453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 6.0, 6.0, 16.0, 14.0, 12.0, 29.0, 26.0, 21.0, 31.0, 33.0, 33.0, 61.0, 48.0, 61.0, 53.0, 53.0, 55.0, 52.0, 45.0, 37.0, 44.0, 39.0, 41.0, 36.0, 23.0, 26.0, 23.0, 16.0, 19.0, 11.0, 13.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1240234375, -0.1205759048461914, -0.11712837219238281, -0.11368083953857422, -0.11023330688476562, -0.10678577423095703, -0.10333824157714844, -0.09989070892333984, -0.09644317626953125, -0.09299564361572266, -0.08954811096191406, -0.08610057830810547, -0.08265304565429688, -0.07920551300048828, -0.07575798034667969, -0.0723104476928711, -0.0688629150390625, -0.0654153823852539, -0.06196784973144531, -0.05852031707763672, -0.055072784423828125, -0.05162525177001953, -0.04817771911621094, -0.044730186462402344, -0.04128265380859375, -0.037835121154785156, -0.03438758850097656, -0.03094005584716797, -0.027492523193359375, -0.02404499053955078, -0.020597457885742188, -0.017149925231933594, -0.013702392578125, -0.010254859924316406, -0.0068073272705078125, -0.0033597946166992188, 8.7738037109375e-05, 0.0035352706909179688, 0.0069828033447265625, 0.010430335998535156, 0.01387786865234375, 0.017325401306152344, 0.020772933959960938, 0.02422046661376953, 0.027667999267578125, 0.03111553192138672, 0.03456306457519531, 0.038010597229003906, 0.0414581298828125, 0.044905662536621094, 0.04835319519042969, 0.05180072784423828, 0.055248260498046875, 0.05869579315185547, 0.06214332580566406, 0.06559085845947266, 0.06903839111328125, 0.07248592376708984, 0.07593345642089844, 0.07938098907470703, 0.08282852172851562, 0.08627605438232422, 0.08972358703613281, 0.0931711196899414, 0.09661865234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 9.0, 24.0, 24.0, 33.0, 43.0, 77.0, 100.0, 201.0, 376.0, 703.0, 2066.0, 7689.0, 36873.0, 213361.0, 1387394.0, 2100129.0, 367493.0, 60491.0, 12071.0, 3032.0, 1001.0, 447.0, 225.0, 145.0, 87.0, 62.0, 28.0, 28.0, 19.0, 18.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.3007621765136719, -0.29195404052734375, -0.2831459045410156, -0.2743377685546875, -0.2655296325683594, -0.25672149658203125, -0.24791336059570312, -0.239105224609375, -0.23029708862304688, -0.22148895263671875, -0.21268081665039062, -0.2038726806640625, -0.19506454467773438, -0.18625640869140625, -0.17744827270507812, -0.16864013671875, -0.15983200073242188, -0.15102386474609375, -0.14221572875976562, -0.1334075927734375, -0.12459945678710938, -0.11579132080078125, -0.10698318481445312, -0.098175048828125, -0.08936691284179688, -0.08055877685546875, -0.07175064086914062, -0.0629425048828125, -0.054134368896484375, -0.04532623291015625, -0.036518096923828125, -0.0277099609375, -0.018901824951171875, -0.01009368896484375, -0.001285552978515625, 0.0075225830078125, 0.016330718994140625, 0.02513885498046875, 0.033946990966796875, 0.042755126953125, 0.051563262939453125, 0.06037139892578125, 0.06917953491210938, 0.0779876708984375, 0.08679580688476562, 0.09560394287109375, 0.10441207885742188, 0.11322021484375, 0.12202835083007812, 0.13083648681640625, 0.13964462280273438, 0.1484527587890625, 0.15726089477539062, 0.16606903076171875, 0.17487716674804688, 0.183685302734375, 0.19249343872070312, 0.20130157470703125, 0.21010971069335938, 0.2189178466796875, 0.22772598266601562, 0.23653411865234375, 0.24534225463867188, 0.254150390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 15.0, 10.0, 15.0, 23.0, 29.0, 40.0, 50.0, 64.0, 80.0, 128.0, 152.0, 210.0, 293.0, 353.0, 485.0, 432.0, 410.0, 326.0, 242.0, 177.0, 142.0, 98.0, 88.0, 49.0, 40.0, 34.0, 21.0, 11.0, 9.0, 15.0, 8.0, 1.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.17004013061523438, -0.16442108154296875, -0.15880203247070312, -0.1531829833984375, -0.14756393432617188, -0.14194488525390625, -0.13632583618164062, -0.130706787109375, -0.12508773803710938, -0.11946868896484375, -0.11384963989257812, -0.1082305908203125, -0.10261154174804688, -0.09699249267578125, -0.09137344360351562, -0.08575439453125, -0.08013534545898438, -0.07451629638671875, -0.06889724731445312, -0.0632781982421875, -0.057659149169921875, -0.05204010009765625, -0.046421051025390625, -0.040802001953125, -0.035182952880859375, -0.02956390380859375, -0.023944854736328125, -0.0183258056640625, -0.012706756591796875, -0.00708770751953125, -0.001468658447265625, 0.004150390625, 0.009769439697265625, 0.01538848876953125, 0.021007537841796875, 0.0266265869140625, 0.032245635986328125, 0.03786468505859375, 0.043483734130859375, 0.049102783203125, 0.054721832275390625, 0.06034088134765625, 0.06595993041992188, 0.0715789794921875, 0.07719802856445312, 0.08281707763671875, 0.08843612670898438, 0.09405517578125, 0.09967422485351562, 0.10529327392578125, 0.11091232299804688, 0.1165313720703125, 0.12215042114257812, 0.12776947021484375, 0.13338851928710938, 0.139007568359375, 0.14462661743164062, 0.15024566650390625, 0.15586471557617188, 0.1614837646484375, 0.16710281372070312, 0.17272186279296875, 0.17834091186523438, 0.1839599609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 16.0, 27.0, 36.0, 72.0, 114.0, 160.0, 188.0, 167.0, 106.0, 61.0, 30.0, 16.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0630645751953125, -1.0114120244979858, -0.959759533405304, -0.9081069827079773, -0.8564544916152954, -0.8048019409179688, -0.7531493902206421, -0.7014968395233154, -0.6498443484306335, -0.5981917977333069, -0.546539306640625, -0.49488675594329834, -0.44323423504829407, -0.3915817141532898, -0.33992916345596313, -0.28827664256095886, -0.2366241216659546, -0.18497160077095032, -0.13331906497478485, -0.08166652917861938, -0.030014008283615112, 0.02163851261138916, 0.07329106330871582, 0.12494358420372009, 0.17659610509872437, 0.22824862599372864, 0.2799011468887329, 0.33155369758605957, 0.38320621848106384, 0.4348587393760681, 0.4865112900733948, 0.5381637811660767, 0.5898163318634033, 0.64146888256073, 0.6931213736534119, 0.7447739243507385, 0.7964264154434204, 0.8480789661407471, 0.8997315168380737, 0.9513840675354004, 1.0030364990234375, 1.0546890497207642, 1.1063416004180908, 1.157994031906128, 1.2096465826034546, 1.2612991333007812, 1.312951683998108, 1.3646042346954346, 1.4162567853927612, 1.467909336090088, 1.5195618867874146, 1.5712144374847412, 1.6228668689727783, 1.674519419670105, 1.7261719703674316, 1.7778245210647583, 1.829477071762085, 1.8811296224594116, 1.9327821731567383, 1.9844346046447754, 2.0360872745513916, 2.0877397060394287, 2.139392375946045, 2.191044807434082, 2.242697238922119]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 6.0, 5.0, 5.0, 7.0, 4.0, 8.0, 5.0, 13.0, 14.0, 14.0, 13.0, 24.0, 23.0, 20.0, 16.0, 23.0, 25.0, 34.0, 39.0, 41.0, 42.0, 39.0, 32.0, 39.0, 31.0, 39.0, 47.0, 38.0, 32.0, 37.0, 34.0, 36.0, 25.0, 26.0, 30.0, 13.0, 13.0, 23.0, 13.0, 18.0, 11.0, 8.0, 10.0, 12.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4638877511024475, -0.4488920271396637, -0.4338963031768799, -0.4189005494117737, -0.40390482544898987, -0.38890910148620605, -0.37391337752342224, -0.3589176535606384, -0.3439219295978546, -0.3289262056350708, -0.313930481672287, -0.2989347577095032, -0.283939003944397, -0.26894327998161316, -0.25394755601882935, -0.23895183205604553, -0.22395609319210052, -0.2089603692293167, -0.1939646303653717, -0.1789689064025879, -0.16397318243980408, -0.14897745847702026, -0.13398171961307526, -0.11898599565029144, -0.10399026423692703, -0.08899453282356262, -0.07399880886077881, -0.0590030774474144, -0.044007349759340286, -0.029011622071266174, -0.014015890657901764, 0.0009798333048820496, 0.01597556471824646, 0.030971292406320572, 0.045967020094394684, 0.060962751507759094, 0.07595847547054291, 0.09095420688390732, 0.10594993829727173, 0.12094566226005554, 0.13594138622283936, 0.15093711018562317, 0.16593284904956818, 0.180928573012352, 0.1959242969751358, 0.2109200358390808, 0.22591575980186462, 0.24091148376464844, 0.25590723752975464, 0.27090296149253845, 0.28589868545532227, 0.30089443922042847, 0.3158901631832123, 0.3308858871459961, 0.3458816111087799, 0.3608773350715637, 0.37587305903434753, 0.39086878299713135, 0.40586450695991516, 0.420860230922699, 0.4358559846878052, 0.450851708650589, 0.4658474326133728, 0.4808431565761566, 0.49583888053894043]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 16.0, 28.0, 36.0, 45.0, 82.0, 121.0, 247.0, 401.0, 681.0, 1339.0, 2449.0, 4766.0, 9416.0, 18121.0, 34616.0, 66075.0, 116828.0, 182318.0, 212761.0, 171028.0, 105770.0, 58158.0, 30354.0, 15658.0, 7987.0, 4246.0, 2215.0, 1178.0, 664.0, 355.0, 198.0, 145.0, 89.0, 55.0, 31.0, 30.0, 13.0, 9.0, 5.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20361328125, -0.19751739501953125, -0.1914215087890625, -0.18532562255859375, -0.179229736328125, -0.17313385009765625, -0.1670379638671875, -0.16094207763671875, -0.15484619140625, -0.14875030517578125, -0.1426544189453125, -0.13655853271484375, -0.130462646484375, -0.12436676025390625, -0.1182708740234375, -0.11217498779296875, -0.1060791015625, -0.09998321533203125, -0.0938873291015625, -0.08779144287109375, -0.081695556640625, -0.07559967041015625, -0.0695037841796875, -0.06340789794921875, -0.05731201171875, -0.05121612548828125, -0.0451202392578125, -0.03902435302734375, -0.032928466796875, -0.02683258056640625, -0.0207366943359375, -0.01464080810546875, -0.008544921875, -0.00244903564453125, 0.0036468505859375, 0.00974273681640625, 0.015838623046875, 0.02193450927734375, 0.0280303955078125, 0.03412628173828125, 0.04022216796875, 0.04631805419921875, 0.0524139404296875, 0.05850982666015625, 0.064605712890625, 0.07070159912109375, 0.0767974853515625, 0.08289337158203125, 0.0889892578125, 0.09508514404296875, 0.1011810302734375, 0.10727691650390625, 0.113372802734375, 0.11946868896484375, 0.1255645751953125, 0.13166046142578125, 0.13775634765625, 0.14385223388671875, 0.1499481201171875, 0.15604400634765625, 0.162139892578125, 0.16823577880859375, 0.1743316650390625, 0.18042755126953125, 0.1865234375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 3.0, 2.0, 10.0, 14.0, 18.0, 28.0, 23.0, 24.0, 31.0, 43.0, 45.0, 49.0, 45.0, 79.0, 64.0, 71.0, 52.0, 44.0, 65.0, 51.0, 43.0, 44.0, 32.0, 34.0, 25.0, 16.0, 14.0, 15.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.1260843276977539, -0.12228584289550781, -0.11848735809326172, -0.11468887329101562, -0.11089038848876953, -0.10709190368652344, -0.10329341888427734, -0.09949493408203125, -0.09569644927978516, -0.09189796447753906, -0.08809947967529297, -0.08430099487304688, -0.08050251007080078, -0.07670402526855469, -0.0729055404663086, -0.0691070556640625, -0.0653085708618164, -0.06151008605957031, -0.05771160125732422, -0.053913116455078125, -0.05011463165283203, -0.04631614685058594, -0.042517662048339844, -0.03871917724609375, -0.034920692443847656, -0.031122207641601562, -0.02732372283935547, -0.023525238037109375, -0.01972675323486328, -0.015928268432617188, -0.012129783630371094, -0.008331298828125, -0.004532814025878906, -0.0007343292236328125, 0.0030641555786132812, 0.006862640380859375, 0.010661125183105469, 0.014459609985351562, 0.018258094787597656, 0.02205657958984375, 0.025855064392089844, 0.029653549194335938, 0.03345203399658203, 0.037250518798828125, 0.04104900360107422, 0.04484748840332031, 0.048645973205566406, 0.0524444580078125, 0.056242942810058594, 0.06004142761230469, 0.06383991241455078, 0.06763839721679688, 0.07143688201904297, 0.07523536682128906, 0.07903385162353516, 0.08283233642578125, 0.08663082122802734, 0.09042930603027344, 0.09422779083251953, 0.09802627563476562, 0.10182476043701172, 0.10562324523925781, 0.1094217300415039, 0.11322021484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 7.0, 16.0, 29.0, 36.0, 43.0, 80.0, 116.0, 235.0, 447.0, 916.0, 1990.0, 4473.0, 10212.0, 21544.0, 46547.0, 92688.0, 164315.0, 228789.0, 208875.0, 132530.0, 70803.0, 34390.0, 16086.0, 7090.0, 3271.0, 1492.0, 716.0, 340.0, 147.0, 92.0, 67.0, 40.0, 27.0, 18.0, 17.0, 7.0, 13.0, 8.0, 3.0, 8.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.214111328125, -0.20715904235839844, -0.20020675659179688, -0.1932544708251953, -0.18630218505859375, -0.1793498992919922, -0.17239761352539062, -0.16544532775878906, -0.1584930419921875, -0.15154075622558594, -0.14458847045898438, -0.1376361846923828, -0.13068389892578125, -0.12373161315917969, -0.11677932739257812, -0.10982704162597656, -0.102874755859375, -0.09592247009277344, -0.08897018432617188, -0.08201789855957031, -0.07506561279296875, -0.06811332702636719, -0.061161041259765625, -0.05420875549316406, -0.0472564697265625, -0.04030418395996094, -0.033351898193359375, -0.026399612426757812, -0.01944732666015625, -0.012495040893554688, -0.005542755126953125, 0.0014095306396484375, 0.00836181640625, 0.015314102172851562, 0.022266387939453125, 0.029218673706054688, 0.03617095947265625, 0.04312324523925781, 0.050075531005859375, 0.05702781677246094, 0.0639801025390625, 0.07093238830566406, 0.07788467407226562, 0.08483695983886719, 0.09178924560546875, 0.09874153137207031, 0.10569381713867188, 0.11264610290527344, 0.119598388671875, 0.12655067443847656, 0.13350296020507812, 0.1404552459716797, 0.14740753173828125, 0.1543598175048828, 0.16131210327148438, 0.16826438903808594, 0.1752166748046875, 0.18216896057128906, 0.18912124633789062, 0.1960735321044922, 0.20302581787109375, 0.2099781036376953, 0.21693038940429688, 0.22388267517089844, 0.2308349609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 15.0, 13.0, 17.0, 21.0, 27.0, 19.0, 26.0, 30.0, 27.0, 25.0, 38.0, 41.0, 50.0, 41.0, 52.0, 51.0, 46.0, 32.0, 38.0, 24.0, 38.0, 27.0, 37.0, 39.0, 26.0, 31.0, 23.0, 28.0, 22.0, 18.0, 10.0, 12.0, 9.0, 7.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.234619140625, -0.22724342346191406, -0.21986770629882812, -0.2124919891357422, -0.20511627197265625, -0.1977405548095703, -0.19036483764648438, -0.18298912048339844, -0.1756134033203125, -0.16823768615722656, -0.16086196899414062, -0.1534862518310547, -0.14611053466796875, -0.1387348175048828, -0.13135910034179688, -0.12398338317871094, -0.116607666015625, -0.10923194885253906, -0.10185623168945312, -0.09448051452636719, -0.08710479736328125, -0.07972908020019531, -0.07235336303710938, -0.06497764587402344, -0.0576019287109375, -0.05022621154785156, -0.042850494384765625, -0.03547477722167969, -0.02809906005859375, -0.020723342895507812, -0.013347625732421875, -0.0059719085693359375, 0.00140380859375, 0.008779525756835938, 0.016155242919921875, 0.023530960083007812, 0.03090667724609375, 0.03828239440917969, 0.045658111572265625, 0.05303382873535156, 0.0604095458984375, 0.06778526306152344, 0.07516098022460938, 0.08253669738769531, 0.08991241455078125, 0.09728813171386719, 0.10466384887695312, 0.11203956604003906, 0.119415283203125, 0.12679100036621094, 0.13416671752929688, 0.1415424346923828, 0.14891815185546875, 0.1562938690185547, 0.16366958618164062, 0.17104530334472656, 0.1784210205078125, 0.18579673767089844, 0.19317245483398438, 0.2005481719970703, 0.20792388916015625, 0.2152996063232422, 0.22267532348632812, 0.23005104064941406, 0.2374267578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 19.0, 26.0, 64.0, 78.0, 144.0, 191.0, 376.0, 704.0, 1202.0, 2236.0, 4428.0, 9151.0, 19062.0, 39210.0, 77238.0, 136834.0, 196541.0, 207808.0, 159341.0, 95966.0, 50175.0, 24299.0, 11618.0, 5589.0, 2797.0, 1451.0, 826.0, 433.0, 290.0, 170.0, 75.0, 50.0, 39.0, 22.0, 17.0, 17.0, 13.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.06292724609375, -0.06108570098876953, -0.05924415588378906, -0.057402610778808594, -0.055561065673828125, -0.053719520568847656, -0.05187797546386719, -0.05003643035888672, -0.04819488525390625, -0.04635334014892578, -0.04451179504394531, -0.042670249938964844, -0.040828704833984375, -0.038987159729003906, -0.03714561462402344, -0.03530406951904297, -0.0334625244140625, -0.03162097930908203, -0.029779434204101562, -0.027937889099121094, -0.026096343994140625, -0.024254798889160156, -0.022413253784179688, -0.02057170867919922, -0.01873016357421875, -0.01688861846923828, -0.015047073364257812, -0.013205528259277344, -0.011363983154296875, -0.009522438049316406, -0.0076808929443359375, -0.005839347839355469, -0.003997802734375, -0.0021562576293945312, -0.0003147125244140625, 0.0015268325805664062, 0.003368377685546875, 0.005209922790527344, 0.0070514678955078125, 0.008893013000488281, 0.01073455810546875, 0.012576103210449219, 0.014417648315429688, 0.016259193420410156, 0.018100738525390625, 0.019942283630371094, 0.021783828735351562, 0.02362537384033203, 0.0254669189453125, 0.02730846405029297, 0.029150009155273438, 0.030991554260253906, 0.032833099365234375, 0.034674644470214844, 0.03651618957519531, 0.03835773468017578, 0.04019927978515625, 0.04204082489013672, 0.04388236999511719, 0.045723915100097656, 0.047565460205078125, 0.049407005310058594, 0.05124855041503906, 0.05309009552001953, 0.054931640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 4.0, 7.0, 9.0, 22.0, 12.0, 22.0, 27.0, 39.0, 45.0, 46.0, 67.0, 63.0, 90.0, 62.0, 97.0, 76.0, 45.0, 43.0, 37.0, 34.0, 19.0, 16.0, 28.0, 14.0, 14.0, 12.0, 6.0, 6.0, 6.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.0205974578857422e-05, -1.9698403775691986e-05, -1.919083297252655e-05, -1.8683262169361115e-05, -1.817569136619568e-05, -1.7668120563030243e-05, -1.7160549759864807e-05, -1.665297895669937e-05, -1.6145408153533936e-05, -1.56378373503685e-05, -1.5130266547203064e-05, -1.4622695744037628e-05, -1.4115124940872192e-05, -1.3607554137706757e-05, -1.309998333454132e-05, -1.2592412531375885e-05, -1.208484172821045e-05, -1.1577270925045013e-05, -1.1069700121879578e-05, -1.0562129318714142e-05, -1.0054558515548706e-05, -9.54698771238327e-06, -9.039416909217834e-06, -8.531846106052399e-06, -8.024275302886963e-06, -7.516704499721527e-06, -7.009133696556091e-06, -6.5015628933906555e-06, -5.99399209022522e-06, -5.486421287059784e-06, -4.978850483894348e-06, -4.471279680728912e-06, -3.9637088775634766e-06, -3.4561380743980408e-06, -2.948567271232605e-06, -2.440996468067169e-06, -1.9334256649017334e-06, -1.4258548617362976e-06, -9.182840585708618e-07, -4.10713255405426e-07, 9.685754776000977e-08, 6.044283509254456e-07, 1.1119991540908813e-06, 1.6195699572563171e-06, 2.127140760421753e-06, 2.6347115635871887e-06, 3.1422823667526245e-06, 3.6498531699180603e-06, 4.157423973083496e-06, 4.664994776248932e-06, 5.172565579414368e-06, 5.6801363825798035e-06, 6.187707185745239e-06, 6.695277988910675e-06, 7.202848792076111e-06, 7.710419595241547e-06, 8.217990398406982e-06, 8.725561201572418e-06, 9.233132004737854e-06, 9.74070280790329e-06, 1.0248273611068726e-05, 1.0755844414234161e-05, 1.1263415217399597e-05, 1.1770986020565033e-05, 1.2278556823730469e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 8.0, 16.0, 29.0, 54.0, 79.0, 131.0, 211.0, 465.0, 831.0, 1557.0, 3111.0, 6665.0, 13755.0, 29914.0, 62582.0, 117617.0, 185878.0, 217919.0, 181603.0, 112927.0, 59034.0, 28450.0, 13160.0, 6242.0, 2925.0, 1536.0, 782.0, 448.0, 241.0, 143.0, 79.0, 56.0, 29.0, 10.0, 19.0, 15.0, 6.0, 3.0, 2.0, 5.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053802490234375, -0.052092552185058594, -0.05038261413574219, -0.04867267608642578, -0.046962738037109375, -0.04525279998779297, -0.04354286193847656, -0.041832923889160156, -0.04012298583984375, -0.038413047790527344, -0.03670310974121094, -0.03499317169189453, -0.033283233642578125, -0.03157329559326172, -0.029863357543945312, -0.028153419494628906, -0.0264434814453125, -0.024733543395996094, -0.023023605346679688, -0.02131366729736328, -0.019603729248046875, -0.01789379119873047, -0.016183853149414062, -0.014473915100097656, -0.01276397705078125, -0.011054039001464844, -0.009344100952148438, -0.007634162902832031, -0.005924224853515625, -0.004214286804199219, -0.0025043487548828125, -0.0007944107055664062, 0.00091552734375, 0.0026254653930664062, 0.0043354034423828125, 0.006045341491699219, 0.007755279541015625, 0.009465217590332031, 0.011175155639648438, 0.012885093688964844, 0.01459503173828125, 0.016304969787597656, 0.018014907836914062, 0.01972484588623047, 0.021434783935546875, 0.02314472198486328, 0.024854660034179688, 0.026564598083496094, 0.0282745361328125, 0.029984474182128906, 0.03169441223144531, 0.03340435028076172, 0.035114288330078125, 0.03682422637939453, 0.03853416442871094, 0.040244102478027344, 0.04195404052734375, 0.043663978576660156, 0.04537391662597656, 0.04708385467529297, 0.048793792724609375, 0.05050373077392578, 0.05221366882324219, 0.053923606872558594, 0.055633544921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 8.0, 15.0, 12.0, 24.0, 9.0, 23.0, 34.0, 28.0, 26.0, 41.0, 33.0, 53.0, 48.0, 62.0, 52.0, 66.0, 60.0, 47.0, 52.0, 44.0, 47.0, 29.0, 31.0, 19.0, 22.0, 15.0, 14.0, 16.0, 8.0, 12.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04351806640625, -0.042061805725097656, -0.04060554504394531, -0.03914928436279297, -0.037693023681640625, -0.03623676300048828, -0.03478050231933594, -0.033324241638183594, -0.03186798095703125, -0.030411720275878906, -0.028955459594726562, -0.02749919891357422, -0.026042938232421875, -0.02458667755126953, -0.023130416870117188, -0.021674156188964844, -0.0202178955078125, -0.018761634826660156, -0.017305374145507812, -0.01584911346435547, -0.014392852783203125, -0.012936592102050781, -0.011480331420898438, -0.010024070739746094, -0.00856781005859375, -0.007111549377441406, -0.0056552886962890625, -0.004199028015136719, -0.002742767333984375, -0.0012865066528320312, 0.0001697540283203125, 0.0016260147094726562, 0.003082275390625, 0.004538536071777344, 0.0059947967529296875, 0.007451057434082031, 0.008907318115234375, 0.010363578796386719, 0.011819839477539062, 0.013276100158691406, 0.01473236083984375, 0.016188621520996094, 0.017644882202148438, 0.01910114288330078, 0.020557403564453125, 0.02201366424560547, 0.023469924926757812, 0.024926185607910156, 0.0263824462890625, 0.027838706970214844, 0.029294967651367188, 0.03075122833251953, 0.032207489013671875, 0.03366374969482422, 0.03512001037597656, 0.036576271057128906, 0.03803253173828125, 0.039488792419433594, 0.04094505310058594, 0.04240131378173828, 0.043857574462890625, 0.04531383514404297, 0.04677009582519531, 0.048226356506347656, 0.0496826171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 22.0, 38.0, 54.0, 69.0, 122.0, 116.0, 129.0, 132.0, 90.0, 77.0, 64.0, 37.0, 12.0, 13.0, 10.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67084801197052, -0.6326574087142944, -0.5944667458534241, -0.5562760829925537, -0.5180854797363281, -0.47989484667778015, -0.4417042136192322, -0.4035135805606842, -0.36532294750213623, -0.32713231444358826, -0.2889416813850403, -0.2507510483264923, -0.21256041526794434, -0.17436978220939636, -0.1361791491508484, -0.09798851609230042, -0.05979788303375244, -0.021607249975204468, 0.016583383083343506, 0.05477401614189148, 0.09296464920043945, 0.13115528225898743, 0.1693459153175354, 0.20753654837608337, 0.24572718143463135, 0.2839178144931793, 0.3221084475517273, 0.36029908061027527, 0.39848971366882324, 0.4366803467273712, 0.4748709797859192, 0.5130616426467896, 0.5512523651123047, 0.5894429683685303, 0.6276336312294006, 0.665824294090271, 0.7040148973464966, 0.7422055006027222, 0.7803961634635925, 0.8185868263244629, 0.8567774295806885, 0.8949680328369141, 0.9331586956977844, 0.9713493585586548, 1.0095399618148804, 1.047730565071106, 1.085921287536621, 1.1241118907928467, 1.1623024940490723, 1.2004930973052979, 1.2386837005615234, 1.2768744230270386, 1.3150650262832642, 1.3532556295394897, 1.3914463520050049, 1.4296369552612305, 1.467827558517456, 1.5060181617736816, 1.5442087650299072, 1.5823994874954224, 1.620590090751648, 1.6587806940078735, 1.6969714164733887, 1.7351620197296143, 1.7733526229858398]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 10.0, 9.0, 9.0, 8.0, 9.0, 16.0, 20.0, 15.0, 31.0, 21.0, 30.0, 19.0, 34.0, 31.0, 37.0, 29.0, 36.0, 36.0, 39.0, 42.0, 45.0, 53.0, 44.0, 41.0, 37.0, 31.0, 38.0, 32.0, 29.0, 27.0, 21.0, 22.0, 18.0, 18.0, 11.0, 17.0, 11.0, 5.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.7696053981781006, -0.7479040026664734, -0.726202666759491, -0.7045012712478638, -0.6827998757362366, -0.6610984802246094, -0.639397144317627, -0.6176957488059998, -0.5959943532943726, -0.5742929577827454, -0.5525916218757629, -0.5308902263641357, -0.5091888308525085, -0.48748746514320374, -0.4657860994338989, -0.44408470392227173, -0.4223833680152893, -0.4006820023059845, -0.3789806067943573, -0.3572792410850525, -0.3355778455734253, -0.3138764798641205, -0.2921751141548157, -0.2704737186431885, -0.24877235293388367, -0.22707097232341766, -0.20536959171295166, -0.18366822600364685, -0.16196684539318085, -0.14026546478271484, -0.11856409907341003, -0.09686271846294403, -0.0751613974571228, -0.0534600205719471, -0.03175864368677139, -0.010057270526885986, 0.011644110083580017, 0.03334549069404602, 0.05504685640335083, 0.07674823701381683, 0.09844961762428284, 0.12015099823474884, 0.14185237884521484, 0.16355374455451965, 0.18525512516498566, 0.20695650577545166, 0.22865787148475647, 0.2503592371940613, 0.2720606327056885, 0.2937619984149933, 0.3154633939266205, 0.3371647596359253, 0.3588661551475525, 0.3805675208568573, 0.4022688865661621, 0.4239702820777893, 0.4456716477870941, 0.4673730134963989, 0.4890744090080261, 0.5107758045196533, 0.5324771404266357, 0.5541785359382629, 0.5758799314498901, 0.5975812673568726, 0.6192826628684998]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 10.0, 21.0, 33.0, 39.0, 69.0, 101.0, 142.0, 272.0, 611.0, 1305.0, 2952.0, 8157.0, 23798.0, 81032.0, 400450.0, 2070904.0, 1317436.0, 211006.0, 50322.0, 15721.0, 5595.0, 2245.0, 1039.0, 473.0, 248.0, 114.0, 73.0, 28.0, 32.0, 15.0, 12.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.19405364990234375, -0.1875457763671875, -0.18103790283203125, -0.174530029296875, -0.16802215576171875, -0.1615142822265625, -0.15500640869140625, -0.14849853515625, -0.14199066162109375, -0.1354827880859375, -0.12897491455078125, -0.122467041015625, -0.11595916748046875, -0.1094512939453125, -0.10294342041015625, -0.096435546875, -0.08992767333984375, -0.0834197998046875, -0.07691192626953125, -0.070404052734375, -0.06389617919921875, -0.0573883056640625, -0.05088043212890625, -0.04437255859375, -0.03786468505859375, -0.0313568115234375, -0.02484893798828125, -0.018341064453125, -0.01183319091796875, -0.0053253173828125, 0.00118255615234375, 0.0076904296875, 0.01419830322265625, 0.0207061767578125, 0.02721405029296875, 0.033721923828125, 0.04022979736328125, 0.0467376708984375, 0.05324554443359375, 0.05975341796875, 0.06626129150390625, 0.0727691650390625, 0.07927703857421875, 0.085784912109375, 0.09229278564453125, 0.0988006591796875, 0.10530853271484375, 0.11181640625, 0.11832427978515625, 0.1248321533203125, 0.13134002685546875, 0.137847900390625, 0.14435577392578125, 0.1508636474609375, 0.15737152099609375, 0.16387939453125, 0.17038726806640625, 0.1768951416015625, 0.18340301513671875, 0.189910888671875, 0.19641876220703125, 0.2029266357421875, 0.20943450927734375, 0.2159423828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 6.0, 11.0, 14.0, 15.0, 21.0, 21.0, 31.0, 24.0, 34.0, 36.0, 34.0, 43.0, 38.0, 54.0, 57.0, 52.0, 62.0, 44.0, 52.0, 54.0, 36.0, 36.0, 33.0, 35.0, 37.0, 19.0, 17.0, 19.0, 8.0, 15.0, 10.0, 7.0, 3.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.115478515625, -0.11205482482910156, -0.10863113403320312, -0.10520744323730469, -0.10178375244140625, -0.09836006164550781, -0.09493637084960938, -0.09151268005371094, -0.0880889892578125, -0.08466529846191406, -0.08124160766601562, -0.07781791687011719, -0.07439422607421875, -0.07097053527832031, -0.06754684448242188, -0.06412315368652344, -0.060699462890625, -0.05727577209472656, -0.053852081298828125, -0.05042839050292969, -0.04700469970703125, -0.04358100891113281, -0.040157318115234375, -0.03673362731933594, -0.0333099365234375, -0.029886245727539062, -0.026462554931640625, -0.023038864135742188, -0.01961517333984375, -0.016191482543945312, -0.012767791748046875, -0.009344100952148438, -0.00592041015625, -0.0024967193603515625, 0.000926971435546875, 0.0043506622314453125, 0.00777435302734375, 0.011198043823242188, 0.014621734619140625, 0.018045425415039062, 0.0214691162109375, 0.024892807006835938, 0.028316497802734375, 0.03174018859863281, 0.03516387939453125, 0.03858757019042969, 0.042011260986328125, 0.04543495178222656, 0.048858642578125, 0.05228233337402344, 0.055706024169921875, 0.05912971496582031, 0.06255340576171875, 0.06597709655761719, 0.06940078735351562, 0.07282447814941406, 0.0762481689453125, 0.07967185974121094, 0.08309555053710938, 0.08651924133300781, 0.08994293212890625, 0.09336662292480469, 0.09679031372070312, 0.10021400451660156, 0.1036376953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 12.0, 6.0, 11.0, 12.0, 19.0, 24.0, 31.0, 44.0, 58.0, 103.0, 184.0, 361.0, 823.0, 2088.0, 6567.0, 23836.0, 97149.0, 459000.0, 2026533.0, 1252525.0, 248919.0, 55049.0, 13909.0, 4308.0, 1421.0, 569.0, 284.0, 141.0, 88.0, 62.0, 52.0, 35.0, 12.0, 14.0, 10.0, 4.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.220458984375, -0.2133026123046875, -0.206146240234375, -0.1989898681640625, -0.19183349609375, -0.1846771240234375, -0.177520751953125, -0.1703643798828125, -0.1632080078125, -0.1560516357421875, -0.148895263671875, -0.1417388916015625, -0.13458251953125, -0.1274261474609375, -0.120269775390625, -0.1131134033203125, -0.10595703125, -0.0988006591796875, -0.091644287109375, -0.0844879150390625, -0.07733154296875, -0.0701751708984375, -0.063018798828125, -0.0558624267578125, -0.0487060546875, -0.0415496826171875, -0.034393310546875, -0.0272369384765625, -0.02008056640625, -0.0129241943359375, -0.005767822265625, 0.0013885498046875, 0.008544921875, 0.0157012939453125, 0.022857666015625, 0.0300140380859375, 0.03717041015625, 0.0443267822265625, 0.051483154296875, 0.0586395263671875, 0.0657958984375, 0.0729522705078125, 0.080108642578125, 0.0872650146484375, 0.09442138671875, 0.1015777587890625, 0.108734130859375, 0.1158905029296875, 0.123046875, 0.1302032470703125, 0.137359619140625, 0.1445159912109375, 0.15167236328125, 0.1588287353515625, 0.165985107421875, 0.1731414794921875, 0.1802978515625, 0.1874542236328125, 0.194610595703125, 0.2017669677734375, 0.20892333984375, 0.2160797119140625, 0.223236083984375, 0.2303924560546875, 0.237548828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 6.0, 8.0, 8.0, 15.0, 16.0, 13.0, 19.0, 45.0, 62.0, 65.0, 98.0, 116.0, 151.0, 171.0, 249.0, 336.0, 375.0, 449.0, 415.0, 326.0, 276.0, 199.0, 147.0, 124.0, 101.0, 60.0, 52.0, 42.0, 31.0, 22.0, 21.0, 15.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.155029296875, -0.15012359619140625, -0.1452178955078125, -0.14031219482421875, -0.135406494140625, -0.13050079345703125, -0.1255950927734375, -0.12068939208984375, -0.11578369140625, -0.11087799072265625, -0.1059722900390625, -0.10106658935546875, -0.096160888671875, -0.09125518798828125, -0.0863494873046875, -0.08144378662109375, -0.0765380859375, -0.07163238525390625, -0.0667266845703125, -0.06182098388671875, -0.056915283203125, -0.05200958251953125, -0.0471038818359375, -0.04219818115234375, -0.03729248046875, -0.03238677978515625, -0.0274810791015625, -0.02257537841796875, -0.017669677734375, -0.01276397705078125, -0.0078582763671875, -0.00295257568359375, 0.001953125, 0.00685882568359375, 0.0117645263671875, 0.01667022705078125, 0.021575927734375, 0.02648162841796875, 0.0313873291015625, 0.03629302978515625, 0.04119873046875, 0.04610443115234375, 0.0510101318359375, 0.05591583251953125, 0.060821533203125, 0.06572723388671875, 0.0706329345703125, 0.07553863525390625, 0.0804443359375, 0.08535003662109375, 0.0902557373046875, 0.09516143798828125, 0.100067138671875, 0.10497283935546875, 0.1098785400390625, 0.11478424072265625, 0.11968994140625, 0.12459564208984375, 0.1295013427734375, 0.13440704345703125, 0.139312744140625, 0.14421844482421875, 0.1491241455078125, 0.15402984619140625, 0.158935546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 15.0, 22.0, 28.0, 49.0, 62.0, 90.0, 108.0, 80.0, 104.0, 91.0, 89.0, 71.0, 57.0, 45.0, 25.0, 24.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9745577573776245, -0.945487916469574, -0.9164180755615234, -0.8873481750488281, -0.8582783341407776, -0.829208493232727, -0.8001386523246765, -0.771068811416626, -0.7419989109039307, -0.7129290699958801, -0.6838592290878296, -0.6547893285751343, -0.6257194876670837, -0.5966496467590332, -0.5675798058509827, -0.5385099649429321, -0.5094401240348816, -0.48037028312683105, -0.45130041241645813, -0.4222305715084076, -0.39316070079803467, -0.36409085988998413, -0.3350210189819336, -0.30595117807388306, -0.27688130736351013, -0.2478114515542984, -0.21874159574508667, -0.18967175483703613, -0.1606018990278244, -0.13153204321861267, -0.10246220231056213, -0.0733923465013504, -0.04432249069213867, -0.01525263860821724, 0.013817213475704193, 0.04288706183433533, 0.07195691764354706, 0.10102677345275879, 0.13009661436080933, 0.15916647017002106, 0.1882363259792328, 0.21730618178844452, 0.24637603759765625, 0.2754458785057068, 0.3045157194137573, 0.33358559012413025, 0.3626554310321808, 0.3917253017425537, 0.42079514265060425, 0.4498649835586548, 0.4789348542690277, 0.5080046653747559, 0.5370745658874512, 0.5661444067955017, 0.5952142477035522, 0.6242840886116028, 0.6533539295196533, 0.6824237704277039, 0.7114936113357544, 0.7405635118484497, 0.7696333527565002, 0.7987031936645508, 0.8277730345726013, 0.8568428754806519, 0.8859127759933472]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 7.0, 8.0, 8.0, 10.0, 10.0, 14.0, 18.0, 24.0, 24.0, 20.0, 19.0, 30.0, 26.0, 34.0, 33.0, 34.0, 47.0, 47.0, 40.0, 49.0, 30.0, 37.0, 43.0, 36.0, 41.0, 36.0, 26.0, 32.0, 25.0, 24.0, 26.0, 25.0, 21.0, 17.0, 19.0, 10.0, 9.0, 7.0, 7.0, 9.0, 4.0, 7.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4969825744628906, -0.4806017279624939, -0.46422088146209717, -0.44784003496170044, -0.4314591884613037, -0.415078341960907, -0.39869749546051025, -0.3823166489601135, -0.3659358024597168, -0.34955495595932007, -0.33317410945892334, -0.3167932629585266, -0.3004124164581299, -0.28403156995773315, -0.2676507234573364, -0.2512698769569397, -0.23488903045654297, -0.21850818395614624, -0.2021273374557495, -0.18574649095535278, -0.16936564445495605, -0.15298479795455933, -0.1366039514541626, -0.12022310495376587, -0.10384225845336914, -0.08746141195297241, -0.07108056545257568, -0.054699718952178955, -0.03831887245178223, -0.021938025951385498, -0.0055571794509887695, 0.010823667049407959, 0.027204573154449463, 0.04358541965484619, 0.05996626615524292, 0.07634711265563965, 0.09272795915603638, 0.1091088056564331, 0.12548965215682983, 0.14187049865722656, 0.1582513451576233, 0.17463219165802002, 0.19101303815841675, 0.20739388465881348, 0.2237747311592102, 0.24015557765960693, 0.25653642416000366, 0.2729172706604004, 0.2892981171607971, 0.30567896366119385, 0.3220598101615906, 0.3384406566619873, 0.35482150316238403, 0.37120234966278076, 0.3875831961631775, 0.4039640426635742, 0.42034488916397095, 0.4367257356643677, 0.4531065821647644, 0.46948742866516113, 0.48586827516555786, 0.5022491216659546, 0.5186299681663513, 0.535010814666748, 0.5513916611671448]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 6.0, 8.0, 6.0, 16.0, 15.0, 17.0, 38.0, 51.0, 118.0, 190.0, 311.0, 678.0, 1462.0, 2897.0, 6324.0, 13949.0, 32301.0, 73899.0, 154895.0, 247885.0, 242042.0, 147175.0, 69134.0, 30594.0, 13101.0, 5976.0, 2763.0, 1320.0, 645.0, 323.0, 184.0, 94.0, 56.0, 28.0, 17.0, 19.0, 3.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27213287353515625, -0.2620391845703125, -0.25194549560546875, -0.241851806640625, -0.23175811767578125, -0.2216644287109375, -0.21157073974609375, -0.20147705078125, -0.19138336181640625, -0.1812896728515625, -0.17119598388671875, -0.161102294921875, -0.15100860595703125, -0.1409149169921875, -0.13082122802734375, -0.1207275390625, -0.11063385009765625, -0.1005401611328125, -0.09044647216796875, -0.080352783203125, -0.07025909423828125, -0.0601654052734375, -0.05007171630859375, -0.03997802734375, -0.02988433837890625, -0.0197906494140625, -0.00969696044921875, 0.000396728515625, 0.01049041748046875, 0.0205841064453125, 0.03067779541015625, 0.040771484375, 0.05086517333984375, 0.0609588623046875, 0.07105255126953125, 0.081146240234375, 0.09123992919921875, 0.1013336181640625, 0.11142730712890625, 0.12152099609375, 0.13161468505859375, 0.1417083740234375, 0.15180206298828125, 0.161895751953125, 0.17198944091796875, 0.1820831298828125, 0.19217681884765625, 0.2022705078125, 0.21236419677734375, 0.2224578857421875, 0.23255157470703125, 0.242645263671875, 0.25273895263671875, 0.2628326416015625, 0.27292633056640625, 0.28302001953125, 0.29311370849609375, 0.3032073974609375, 0.31330108642578125, 0.323394775390625, 0.33348846435546875, 0.3435821533203125, 0.35367584228515625, 0.36376953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 11.0, 7.0, 6.0, 13.0, 17.0, 19.0, 25.0, 40.0, 36.0, 45.0, 44.0, 53.0, 60.0, 63.0, 69.0, 52.0, 51.0, 64.0, 56.0, 46.0, 32.0, 48.0, 29.0, 28.0, 9.0, 13.0, 17.0, 16.0, 7.0, 3.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117919921875, -0.11431407928466797, -0.11070823669433594, -0.1071023941040039, -0.10349655151367188, -0.09989070892333984, -0.09628486633300781, -0.09267902374267578, -0.08907318115234375, -0.08546733856201172, -0.08186149597167969, -0.07825565338134766, -0.07464981079101562, -0.0710439682006836, -0.06743812561035156, -0.06383228302001953, -0.0602264404296875, -0.05662059783935547, -0.05301475524902344, -0.049408912658691406, -0.045803070068359375, -0.042197227478027344, -0.03859138488769531, -0.03498554229736328, -0.03137969970703125, -0.02777385711669922, -0.024168014526367188, -0.020562171936035156, -0.016956329345703125, -0.013350486755371094, -0.009744644165039062, -0.006138801574707031, -0.002532958984375, 0.0010728836059570312, 0.0046787261962890625, 0.008284568786621094, 0.011890411376953125, 0.015496253967285156, 0.019102096557617188, 0.02270793914794922, 0.02631378173828125, 0.02991962432861328, 0.03352546691894531, 0.037131309509277344, 0.040737152099609375, 0.044342994689941406, 0.04794883728027344, 0.05155467987060547, 0.0551605224609375, 0.05876636505126953, 0.06237220764160156, 0.0659780502319336, 0.06958389282226562, 0.07318973541259766, 0.07679557800292969, 0.08040142059326172, 0.08400726318359375, 0.08761310577392578, 0.09121894836425781, 0.09482479095458984, 0.09843063354492188, 0.1020364761352539, 0.10564231872558594, 0.10924816131591797, 0.11285400390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 24.0, 28.0, 57.0, 55.0, 88.0, 152.0, 252.0, 360.0, 567.0, 917.0, 1504.0, 2554.0, 4494.0, 7745.0, 14491.0, 26272.0, 47291.0, 80291.0, 124569.0, 165878.0, 177194.0, 148162.0, 102002.0, 62698.0, 35610.0, 19895.0, 10982.0, 5887.0, 3411.0, 1961.0, 1181.0, 692.0, 411.0, 277.0, 184.0, 118.0, 71.0, 65.0, 44.0, 34.0, 11.0, 16.0, 6.0, 6.0, 7.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.193115234375, -0.1869373321533203, -0.18075942993164062, -0.17458152770996094, -0.16840362548828125, -0.16222572326660156, -0.15604782104492188, -0.1498699188232422, -0.1436920166015625, -0.1375141143798828, -0.13133621215820312, -0.12515830993652344, -0.11898040771484375, -0.11280250549316406, -0.10662460327148438, -0.10044670104980469, -0.094268798828125, -0.08809089660644531, -0.08191299438476562, -0.07573509216308594, -0.06955718994140625, -0.06337928771972656, -0.057201385498046875, -0.05102348327636719, -0.0448455810546875, -0.03866767883300781, -0.032489776611328125, -0.026311874389648438, -0.02013397216796875, -0.013956069946289062, -0.007778167724609375, -0.0016002655029296875, 0.00457763671875, 0.010755538940429688, 0.016933441162109375, 0.023111343383789062, 0.02928924560546875, 0.03546714782714844, 0.041645050048828125, 0.04782295227050781, 0.0540008544921875, 0.06017875671386719, 0.06635665893554688, 0.07253456115722656, 0.07871246337890625, 0.08489036560058594, 0.09106826782226562, 0.09724617004394531, 0.103424072265625, 0.10960197448730469, 0.11577987670898438, 0.12195777893066406, 0.12813568115234375, 0.13431358337402344, 0.14049148559570312, 0.1466693878173828, 0.1528472900390625, 0.1590251922607422, 0.16520309448242188, 0.17138099670410156, 0.17755889892578125, 0.18373680114746094, 0.18991470336914062, 0.1960926055908203, 0.2022705078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 7.0, 6.0, 5.0, 9.0, 12.0, 14.0, 22.0, 16.0, 24.0, 19.0, 24.0, 28.0, 37.0, 39.0, 45.0, 45.0, 38.0, 36.0, 57.0, 42.0, 38.0, 26.0, 39.0, 45.0, 42.0, 39.0, 34.0, 43.0, 14.0, 23.0, 18.0, 16.0, 11.0, 23.0, 10.0, 5.0, 16.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.277099609375, -0.26943397521972656, -0.2617683410644531, -0.2541027069091797, -0.24643707275390625, -0.2387714385986328, -0.23110580444335938, -0.22344017028808594, -0.2157745361328125, -0.20810890197753906, -0.20044326782226562, -0.1927776336669922, -0.18511199951171875, -0.1774463653564453, -0.16978073120117188, -0.16211509704589844, -0.154449462890625, -0.14678382873535156, -0.13911819458007812, -0.1314525604248047, -0.12378692626953125, -0.11612129211425781, -0.10845565795898438, -0.10079002380371094, -0.0931243896484375, -0.08545875549316406, -0.07779312133789062, -0.07012748718261719, -0.06246185302734375, -0.05479621887207031, -0.047130584716796875, -0.03946495056152344, -0.03179931640625, -0.024133682250976562, -0.016468048095703125, -0.008802413940429688, -0.00113677978515625, 0.0065288543701171875, 0.014194488525390625, 0.021860122680664062, 0.0295257568359375, 0.03719139099121094, 0.044857025146484375, 0.05252265930175781, 0.06018829345703125, 0.06785392761230469, 0.07551956176757812, 0.08318519592285156, 0.090850830078125, 0.09851646423339844, 0.10618209838867188, 0.11384773254394531, 0.12151336669921875, 0.1291790008544922, 0.13684463500976562, 0.14451026916503906, 0.1521759033203125, 0.15984153747558594, 0.16750717163085938, 0.1751728057861328, 0.18283843994140625, 0.1905040740966797, 0.19816970825195312, 0.20583534240722656, 0.2135009765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 2.0, 6.0, 15.0, 21.0, 37.0, 60.0, 82.0, 116.0, 168.0, 264.0, 441.0, 742.0, 1232.0, 2175.0, 3936.0, 7378.0, 15055.0, 31690.0, 70374.0, 149009.0, 244633.0, 242042.0, 147464.0, 69109.0, 31238.0, 14988.0, 7185.0, 3813.0, 2103.0, 1165.0, 704.0, 478.0, 278.0, 188.0, 108.0, 72.0, 51.0, 39.0, 33.0, 15.0, 9.0, 12.0, 10.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0914306640625, -0.08857250213623047, -0.08571434020996094, -0.0828561782836914, -0.07999801635742188, -0.07713985443115234, -0.07428169250488281, -0.07142353057861328, -0.06856536865234375, -0.06570720672607422, -0.06284904479980469, -0.059990882873535156, -0.057132720947265625, -0.054274559020996094, -0.05141639709472656, -0.04855823516845703, -0.0457000732421875, -0.04284191131591797, -0.03998374938964844, -0.037125587463378906, -0.034267425537109375, -0.031409263610839844, -0.028551101684570312, -0.02569293975830078, -0.02283477783203125, -0.01997661590576172, -0.017118453979492188, -0.014260292053222656, -0.011402130126953125, -0.008543968200683594, -0.0056858062744140625, -0.0028276443481445312, 3.0517578125e-05, 0.0028886795043945312, 0.0057468414306640625, 0.008605003356933594, 0.011463165283203125, 0.014321327209472656, 0.017179489135742188, 0.02003765106201172, 0.02289581298828125, 0.02575397491455078, 0.028612136840820312, 0.031470298767089844, 0.034328460693359375, 0.037186622619628906, 0.04004478454589844, 0.04290294647216797, 0.0457611083984375, 0.04861927032470703, 0.05147743225097656, 0.054335594177246094, 0.057193756103515625, 0.060051918029785156, 0.06291007995605469, 0.06576824188232422, 0.06862640380859375, 0.07148456573486328, 0.07434272766113281, 0.07720088958740234, 0.08005905151367188, 0.0829172134399414, 0.08577537536621094, 0.08863353729248047, 0.09149169921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 12.0, 9.0, 20.0, 24.0, 34.0, 32.0, 58.0, 50.0, 89.0, 89.0, 78.0, 73.0, 87.0, 69.0, 39.0, 40.0, 38.0, 31.0, 20.0, 12.0, 18.0, 13.0, 5.0, 6.0, 5.0, 9.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.765655517578125e-05, -2.682860940694809e-05, -2.600066363811493e-05, -2.517271786928177e-05, -2.434477210044861e-05, -2.3516826331615448e-05, -2.2688880562782288e-05, -2.1860934793949127e-05, -2.1032989025115967e-05, -2.0205043256282806e-05, -1.9377097487449646e-05, -1.8549151718616486e-05, -1.7721205949783325e-05, -1.6893260180950165e-05, -1.6065314412117004e-05, -1.5237368643283844e-05, -1.4409422874450684e-05, -1.3581477105617523e-05, -1.2753531336784363e-05, -1.1925585567951202e-05, -1.1097639799118042e-05, -1.0269694030284882e-05, -9.441748261451721e-06, -8.61380249261856e-06, -7.7858567237854e-06, -6.95791095495224e-06, -6.12996518611908e-06, -5.302019417285919e-06, -4.474073648452759e-06, -3.6461278796195984e-06, -2.818182110786438e-06, -1.9902363419532776e-06, -1.1622905731201172e-06, -3.343448042869568e-07, 4.936009645462036e-07, 1.321546733379364e-06, 2.1494925022125244e-06, 2.977438271045685e-06, 3.8053840398788452e-06, 4.633329808712006e-06, 5.461275577545166e-06, 6.289221346378326e-06, 7.117167115211487e-06, 7.945112884044647e-06, 8.773058652877808e-06, 9.601004421710968e-06, 1.0428950190544128e-05, 1.1256895959377289e-05, 1.208484172821045e-05, 1.291278749704361e-05, 1.374073326587677e-05, 1.456867903470993e-05, 1.539662480354309e-05, 1.622457057237625e-05, 1.705251634120941e-05, 1.7880462110042572e-05, 1.8708407878875732e-05, 1.9536353647708893e-05, 2.0364299416542053e-05, 2.1192245185375214e-05, 2.2020190954208374e-05, 2.2848136723041534e-05, 2.3676082491874695e-05, 2.4504028260707855e-05, 2.5331974029541016e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 9.0, 12.0, 21.0, 34.0, 46.0, 51.0, 86.0, 119.0, 156.0, 246.0, 426.0, 649.0, 952.0, 1709.0, 2848.0, 5234.0, 10405.0, 23477.0, 58747.0, 149239.0, 285082.0, 274880.0, 136923.0, 53687.0, 21558.0, 9926.0, 4976.0, 2760.0, 1619.0, 998.0, 588.0, 368.0, 266.0, 145.0, 106.0, 64.0, 42.0, 36.0, 24.0, 14.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.091064453125, -0.08802413940429688, -0.08498382568359375, -0.08194351196289062, -0.0789031982421875, -0.07586288452148438, -0.07282257080078125, -0.06978225708007812, -0.066741943359375, -0.06370162963867188, -0.06066131591796875, -0.057621002197265625, -0.0545806884765625, -0.051540374755859375, -0.04850006103515625, -0.045459747314453125, -0.04241943359375, -0.039379119873046875, -0.03633880615234375, -0.033298492431640625, -0.0302581787109375, -0.027217864990234375, -0.02417755126953125, -0.021137237548828125, -0.018096923828125, -0.015056610107421875, -0.01201629638671875, -0.008975982666015625, -0.0059356689453125, -0.002895355224609375, 0.00014495849609375, 0.003185272216796875, 0.0062255859375, 0.009265899658203125, 0.01230621337890625, 0.015346527099609375, 0.0183868408203125, 0.021427154541015625, 0.02446746826171875, 0.027507781982421875, 0.030548095703125, 0.033588409423828125, 0.03662872314453125, 0.039669036865234375, 0.0427093505859375, 0.045749664306640625, 0.04878997802734375, 0.051830291748046875, 0.05487060546875, 0.057910919189453125, 0.06095123291015625, 0.06399154663085938, 0.0670318603515625, 0.07007217407226562, 0.07311248779296875, 0.07615280151367188, 0.079193115234375, 0.08223342895507812, 0.08527374267578125, 0.08831405639648438, 0.0913543701171875, 0.09439468383789062, 0.09743499755859375, 0.10047531127929688, 0.103515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 21.0, 20.0, 22.0, 29.0, 29.0, 43.0, 54.0, 65.0, 74.0, 77.0, 74.0, 78.0, 69.0, 53.0, 57.0, 33.0, 29.0, 27.0, 26.0, 16.0, 11.0, 12.0, 12.0, 5.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1009521484375, -0.09824275970458984, -0.09553337097167969, -0.09282398223876953, -0.09011459350585938, -0.08740520477294922, -0.08469581604003906, -0.0819864273071289, -0.07927703857421875, -0.0765676498413086, -0.07385826110839844, -0.07114887237548828, -0.06843948364257812, -0.06573009490966797, -0.06302070617675781, -0.060311317443847656, -0.0576019287109375, -0.054892539978027344, -0.05218315124511719, -0.04947376251220703, -0.046764373779296875, -0.04405498504638672, -0.04134559631347656, -0.038636207580566406, -0.03592681884765625, -0.033217430114746094, -0.030508041381835938, -0.02779865264892578, -0.025089263916015625, -0.02237987518310547, -0.019670486450195312, -0.016961097717285156, -0.014251708984375, -0.011542320251464844, -0.008832931518554688, -0.006123542785644531, -0.003414154052734375, -0.0007047653198242188, 0.0020046234130859375, 0.004714012145996094, 0.00742340087890625, 0.010132789611816406, 0.012842178344726562, 0.015551567077636719, 0.018260955810546875, 0.02097034454345703, 0.023679733276367188, 0.026389122009277344, 0.0290985107421875, 0.031807899475097656, 0.03451728820800781, 0.03722667694091797, 0.039936065673828125, 0.04264545440673828, 0.04535484313964844, 0.048064231872558594, 0.05077362060546875, 0.053483009338378906, 0.05619239807128906, 0.05890178680419922, 0.061611175537109375, 0.06432056427001953, 0.06702995300292969, 0.06973934173583984, 0.07244873046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 14.0, 25.0, 37.0, 67.0, 106.0, 141.0, 145.0, 163.0, 114.0, 85.0, 49.0, 25.0, 18.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7828733921051025, -0.7252159118652344, -0.6675584316253662, -0.609900951385498, -0.5522434711456299, -0.4945860207080841, -0.43692854046821594, -0.3792710602283478, -0.3216135799884796, -0.26395609974861145, -0.2062986195087433, -0.14864115417003632, -0.09098367393016815, -0.03332620859146118, 0.024331271648406982, 0.08198875188827515, 0.1396462321281433, 0.19730371236801147, 0.25496119260787964, 0.3126186728477478, 0.37027615308761597, 0.42793360352516174, 0.4855910837650299, 0.5432485342025757, 0.6009060144424438, 0.658563494682312, 0.7162209749221802, 0.7738784551620483, 0.8315359354019165, 0.8891934156417847, 0.9468508958816528, 1.004508376121521, 1.0621658563613892, 1.1198233366012573, 1.1774808168411255, 1.2351382970809937, 1.2927957773208618, 1.35045325756073, 1.4081107378005981, 1.4657682180404663, 1.5234256982803345, 1.5810831785202026, 1.6387406587600708, 1.696398138999939, 1.7540556192398071, 1.8117130994796753, 1.8693705797195435, 1.9270280599594116, 1.9846854209899902, 2.0423429012298584, 2.1000003814697266, 2.1576578617095947, 2.215315341949463, 2.272972822189331, 2.330630302429199, 2.3882877826690674, 2.4459452629089355, 2.5036027431488037, 2.561260223388672, 2.61891770362854, 2.676575183868408, 2.7342326641082764, 2.7918901443481445, 2.8495476245880127, 2.907205104827881]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 8.0, 14.0, 16.0, 20.0, 20.0, 18.0, 27.0, 23.0, 29.0, 27.0, 40.0, 21.0, 30.0, 35.0, 54.0, 38.0, 62.0, 37.0, 31.0, 43.0, 44.0, 38.0, 32.0, 34.0, 41.0, 32.0, 24.0, 25.0, 15.0, 21.0, 22.0, 17.0, 14.0, 4.0, 7.0, 2.0, 4.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7255238890647888, -0.7000626921653748, -0.6746014356613159, -0.6491402387619019, -0.6236790418624878, -0.5982178449630737, -0.5727565884590149, -0.5472953915596008, -0.521834135055542, -0.49637290835380554, -0.4709117114543915, -0.44545048475265503, -0.41998928785324097, -0.3945280611515045, -0.36906683444976807, -0.343605637550354, -0.31814444065093994, -0.2926832139492035, -0.26722201704978943, -0.24176079034805298, -0.21629957854747772, -0.19083836674690247, -0.16537714004516602, -0.13991592824459076, -0.1144547164440155, -0.08899350464344025, -0.0635322853922844, -0.03807106614112854, -0.012609854340553284, 0.012851357460021973, 0.03831258416175842, 0.06377379596233368, 0.08923506736755371, 0.11469627916812897, 0.14015749096870422, 0.16561871767044067, 0.19107992947101593, 0.2165411412715912, 0.24200236797332764, 0.2674635648727417, 0.29292479157447815, 0.3183860182762146, 0.34384721517562866, 0.3693084418773651, 0.39476966857910156, 0.4202308654785156, 0.4456920921802521, 0.4711533188819885, 0.4966145157814026, 0.5220757126808167, 0.5475369691848755, 0.5729981660842896, 0.5984593629837036, 0.6239205598831177, 0.6493818163871765, 0.6748430132865906, 0.7003042697906494, 0.7257654666900635, 0.7512267231941223, 0.7766879200935364, 0.8021491169929504, 0.8276103734970093, 0.8530715703964233, 0.8785327672958374, 0.9039939641952515]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 7.0, 7.0, 7.0, 16.0, 15.0, 36.0, 61.0, 85.0, 127.0, 165.0, 325.0, 478.0, 794.0, 1280.0, 2087.0, 3568.0, 6186.0, 11153.0, 21521.0, 43980.0, 100314.0, 270745.0, 791471.0, 1481206.0, 925992.0, 318682.0, 113179.0, 48430.0, 23477.0, 12254.0, 6651.0, 3875.0, 2318.0, 1365.0, 876.0, 537.0, 377.0, 212.0, 146.0, 87.0, 71.0, 40.0, 32.0, 17.0, 13.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0], "bins": [-0.1451416015625, -0.1411733627319336, -0.1372051239013672, -0.13323688507080078, -0.12926864624023438, -0.12530040740966797, -0.12133216857910156, -0.11736392974853516, -0.11339569091796875, -0.10942745208740234, -0.10545921325683594, -0.10149097442626953, -0.09752273559570312, -0.09355449676513672, -0.08958625793457031, -0.0856180191040039, -0.0816497802734375, -0.0776815414428711, -0.07371330261230469, -0.06974506378173828, -0.06577682495117188, -0.06180858612060547, -0.05784034729003906, -0.053872108459472656, -0.04990386962890625, -0.045935630798339844, -0.04196739196777344, -0.03799915313720703, -0.034030914306640625, -0.03006267547607422, -0.026094436645507812, -0.022126197814941406, -0.018157958984375, -0.014189720153808594, -0.010221481323242188, -0.006253242492675781, -0.002285003662109375, 0.0016832351684570312, 0.0056514739990234375, 0.009619712829589844, 0.01358795166015625, 0.017556190490722656, 0.021524429321289062, 0.02549266815185547, 0.029460906982421875, 0.03342914581298828, 0.03739738464355469, 0.041365623474121094, 0.0453338623046875, 0.049302101135253906, 0.05327033996582031, 0.05723857879638672, 0.061206817626953125, 0.06517505645751953, 0.06914329528808594, 0.07311153411865234, 0.07707977294921875, 0.08104801177978516, 0.08501625061035156, 0.08898448944091797, 0.09295272827148438, 0.09692096710205078, 0.10088920593261719, 0.1048574447631836, 0.10882568359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 8.0, 6.0, 9.0, 13.0, 10.0, 15.0, 20.0, 16.0, 21.0, 21.0, 19.0, 32.0, 39.0, 38.0, 34.0, 34.0, 30.0, 38.0, 51.0, 41.0, 42.0, 44.0, 44.0, 36.0, 26.0, 25.0, 36.0, 31.0, 36.0, 17.0, 28.0, 16.0, 20.0, 12.0, 14.0, 14.0, 9.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.10125732421875, -0.0980844497680664, -0.09491157531738281, -0.09173870086669922, -0.08856582641601562, -0.08539295196533203, -0.08222007751464844, -0.07904720306396484, -0.07587432861328125, -0.07270145416259766, -0.06952857971191406, -0.06635570526123047, -0.06318283081054688, -0.06000995635986328, -0.05683708190917969, -0.053664207458496094, -0.0504913330078125, -0.047318458557128906, -0.04414558410644531, -0.04097270965576172, -0.037799835205078125, -0.03462696075439453, -0.03145408630371094, -0.028281211853027344, -0.02510833740234375, -0.021935462951660156, -0.018762588500976562, -0.015589714050292969, -0.012416839599609375, -0.009243965148925781, -0.0060710906982421875, -0.0028982162475585938, 0.000274658203125, 0.0034475326538085938, 0.0066204071044921875, 0.009793281555175781, 0.012966156005859375, 0.01613903045654297, 0.019311904907226562, 0.022484779357910156, 0.02565765380859375, 0.028830528259277344, 0.03200340270996094, 0.03517627716064453, 0.038349151611328125, 0.04152202606201172, 0.04469490051269531, 0.047867774963378906, 0.0510406494140625, 0.054213523864746094, 0.05738639831542969, 0.06055927276611328, 0.06373214721679688, 0.06690502166748047, 0.07007789611816406, 0.07325077056884766, 0.07642364501953125, 0.07959651947021484, 0.08276939392089844, 0.08594226837158203, 0.08911514282226562, 0.09228801727294922, 0.09546089172363281, 0.0986337661743164, 0.101806640625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 6.0, 5.0, 13.0, 12.0, 17.0, 30.0, 39.0, 53.0, 86.0, 160.0, 238.0, 348.0, 603.0, 1022.0, 1817.0, 3687.0, 7765.0, 18109.0, 46421.0, 128257.0, 383409.0, 1216986.0, 1572201.0, 532797.0, 175316.0, 61496.0, 23905.0, 9950.0, 4381.0, 2140.0, 1207.0, 654.0, 376.0, 266.0, 163.0, 104.0, 70.0, 44.0, 50.0, 26.0, 15.0, 10.0, 6.0, 10.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16357421875, -0.15814781188964844, -0.15272140502929688, -0.1472949981689453, -0.14186859130859375, -0.1364421844482422, -0.13101577758789062, -0.12558937072753906, -0.1201629638671875, -0.11473655700683594, -0.10931015014648438, -0.10388374328613281, -0.09845733642578125, -0.09303092956542969, -0.08760452270507812, -0.08217811584472656, -0.076751708984375, -0.07132530212402344, -0.06589889526367188, -0.06047248840332031, -0.05504608154296875, -0.04961967468261719, -0.044193267822265625, -0.03876686096191406, -0.0333404541015625, -0.027914047241210938, -0.022487640380859375, -0.017061233520507812, -0.01163482666015625, -0.0062084197998046875, -0.000782012939453125, 0.0046443939208984375, 0.01007080078125, 0.015497207641601562, 0.020923614501953125, 0.026350021362304688, 0.03177642822265625, 0.03720283508300781, 0.042629241943359375, 0.04805564880371094, 0.0534820556640625, 0.05890846252441406, 0.06433486938476562, 0.06976127624511719, 0.07518768310546875, 0.08061408996582031, 0.08604049682617188, 0.09146690368652344, 0.096893310546875, 0.10231971740722656, 0.10774612426757812, 0.11317253112792969, 0.11859893798828125, 0.12402534484863281, 0.12945175170898438, 0.13487815856933594, 0.1403045654296875, 0.14573097229003906, 0.15115737915039062, 0.1565837860107422, 0.16201019287109375, 0.1674365997314453, 0.17286300659179688, 0.17828941345214844, 0.1837158203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 13.0, 10.0, 21.0, 21.0, 41.0, 62.0, 63.0, 100.0, 142.0, 216.0, 292.0, 392.0, 553.0, 599.0, 479.0, 297.0, 236.0, 165.0, 106.0, 77.0, 54.0, 33.0, 24.0, 17.0, 13.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208740234375, -0.201568603515625, -0.19439697265625, -0.187225341796875, -0.1800537109375, -0.172882080078125, -0.16571044921875, -0.158538818359375, -0.1513671875, -0.144195556640625, -0.13702392578125, -0.129852294921875, -0.1226806640625, -0.115509033203125, -0.10833740234375, -0.101165771484375, -0.093994140625, -0.086822509765625, -0.07965087890625, -0.072479248046875, -0.0653076171875, -0.058135986328125, -0.05096435546875, -0.043792724609375, -0.03662109375, -0.029449462890625, -0.02227783203125, -0.015106201171875, -0.0079345703125, -0.000762939453125, 0.00640869140625, 0.013580322265625, 0.020751953125, 0.027923583984375, 0.03509521484375, 0.042266845703125, 0.0494384765625, 0.056610107421875, 0.06378173828125, 0.070953369140625, 0.078125, 0.085296630859375, 0.09246826171875, 0.099639892578125, 0.1068115234375, 0.113983154296875, 0.12115478515625, 0.128326416015625, 0.135498046875, 0.142669677734375, 0.14984130859375, 0.157012939453125, 0.1641845703125, 0.171356201171875, 0.17852783203125, 0.185699462890625, 0.19287109375, 0.200042724609375, 0.20721435546875, 0.214385986328125, 0.2215576171875, 0.228729248046875, 0.23590087890625, 0.243072509765625, 0.250244140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 8.0, 14.0, 28.0, 37.0, 51.0, 79.0, 93.0, 96.0, 108.0, 124.0, 111.0, 84.0, 80.0, 27.0, 22.0, 17.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6676549911499023, -1.6285581588745117, -1.589461326599121, -1.55036461353302, -1.5112677812576294, -1.4721709489822388, -1.4330742359161377, -1.393977403640747, -1.3548805713653564, -1.3157837390899658, -1.2766869068145752, -1.2375901937484741, -1.1984933614730835, -1.1593965291976929, -1.1202998161315918, -1.0812029838562012, -1.0421061515808105, -1.00300931930542, -0.9639125466346741, -0.9248157739639282, -0.8857189416885376, -0.846622109413147, -0.8075253367424011, -0.7684285640716553, -0.7293317317962646, -0.690234899520874, -0.6511381268501282, -0.6120413541793823, -0.5729445219039917, -0.5338476896286011, -0.4947509169578552, -0.455654114484787, -0.4165573716163635, -0.3774605691432953, -0.33836376667022705, -0.2992669641971588, -0.2601701617240906, -0.22107335925102234, -0.1819765567779541, -0.14287975430488586, -0.10378295183181763, -0.06468614935874939, -0.025589346885681152, 0.013507455587387085, 0.05260425806045532, 0.09170106053352356, 0.1307978630065918, 0.16989466547966003, 0.20899146795272827, 0.2480882704257965, 0.28718507289886475, 0.326281875371933, 0.3653786778450012, 0.40447548031806946, 0.4435722827911377, 0.48266908526420593, 0.5217658877372742, 0.56086266040802, 0.5999594926834106, 0.6390563249588013, 0.6781530976295471, 0.717249870300293, 0.7563467025756836, 0.7954435348510742, 0.8345403075218201]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 2.0, 7.0, 11.0, 9.0, 5.0, 18.0, 13.0, 16.0, 29.0, 17.0, 26.0, 19.0, 32.0, 35.0, 29.0, 31.0, 49.0, 27.0, 44.0, 44.0, 44.0, 43.0, 40.0, 38.0, 29.0, 40.0, 27.0, 29.0, 36.0, 21.0, 24.0, 27.0, 24.0, 16.0, 17.0, 13.0, 7.0, 13.0, 10.0, 4.0, 5.0, 3.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5224376320838928, -0.5041913390159607, -0.4859449863433838, -0.4676986634731293, -0.44945234060287476, -0.4312060475349426, -0.4129597246646881, -0.3947134017944336, -0.3764670789241791, -0.35822075605392456, -0.33997443318367004, -0.3217281103134155, -0.3034818172454834, -0.2852354645729065, -0.26698917150497437, -0.24874284863471985, -0.23049652576446533, -0.21225020289421082, -0.1940038800239563, -0.17575757205486298, -0.15751124918460846, -0.13926492631435394, -0.12101861089468002, -0.1027722954750061, -0.08452597260475159, -0.06627964973449707, -0.04803333431482315, -0.029787015169858932, -0.011540696024894714, 0.006705626845359802, 0.024951942265033722, 0.04319825768470764, 0.06144458055496216, 0.07969090342521667, 0.0979372188448906, 0.11618353426456451, 0.13442985713481903, 0.15267618000507355, 0.17092248797416687, 0.1891688108444214, 0.2074151337146759, 0.22566145658493042, 0.24390777945518494, 0.26215410232543945, 0.2804003953933716, 0.2986467480659485, 0.3168930411338806, 0.33513936400413513, 0.35338568687438965, 0.37163200974464417, 0.3898783326148987, 0.4081246554851532, 0.4263709783554077, 0.44461727142333984, 0.46286359429359436, 0.4811099171638489, 0.4993562400341034, 0.5176025629043579, 0.53584885597229, 0.5540952086448669, 0.5723415017127991, 0.590587854385376, 0.6088341474533081, 0.6270804405212402, 0.6453267931938171]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 5.0, 6.0, 14.0, 25.0, 50.0, 48.0, 82.0, 110.0, 219.0, 320.0, 632.0, 1142.0, 2062.0, 3993.0, 7419.0, 14202.0, 26008.0, 48730.0, 89184.0, 156166.0, 219852.0, 200051.0, 126229.0, 69933.0, 38064.0, 20605.0, 10869.0, 5723.0, 3089.0, 1551.0, 900.0, 481.0, 291.0, 174.0, 110.0, 64.0, 40.0, 26.0, 21.0, 19.0, 4.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2195606231689453, -0.21219253540039062, -0.20482444763183594, -0.19745635986328125, -0.19008827209472656, -0.18272018432617188, -0.1753520965576172, -0.1679840087890625, -0.1606159210205078, -0.15324783325195312, -0.14587974548339844, -0.13851165771484375, -0.13114356994628906, -0.12377548217773438, -0.11640739440917969, -0.109039306640625, -0.10167121887207031, -0.09430313110351562, -0.08693504333496094, -0.07956695556640625, -0.07219886779785156, -0.06483078002929688, -0.05746269226074219, -0.0500946044921875, -0.04272651672363281, -0.035358428955078125, -0.027990341186523438, -0.02062225341796875, -0.013254165649414062, -0.005886077880859375, 0.0014820098876953125, 0.00885009765625, 0.016218185424804688, 0.023586273193359375, 0.030954360961914062, 0.03832244873046875, 0.04569053649902344, 0.053058624267578125, 0.06042671203613281, 0.0677947998046875, 0.07516288757324219, 0.08253097534179688, 0.08989906311035156, 0.09726715087890625, 0.10463523864746094, 0.11200332641601562, 0.11937141418457031, 0.126739501953125, 0.1341075897216797, 0.14147567749023438, 0.14884376525878906, 0.15621185302734375, 0.16357994079589844, 0.17094802856445312, 0.1783161163330078, 0.1856842041015625, 0.1930522918701172, 0.20042037963867188, 0.20778846740722656, 0.21515655517578125, 0.22252464294433594, 0.22989273071289062, 0.2372608184814453, 0.24462890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 2.0, 3.0, 10.0, 6.0, 10.0, 7.0, 19.0, 16.0, 23.0, 15.0, 24.0, 29.0, 31.0, 38.0, 38.0, 50.0, 37.0, 47.0, 45.0, 42.0, 43.0, 42.0, 45.0, 36.0, 48.0, 40.0, 35.0, 30.0, 19.0, 26.0, 19.0, 27.0, 16.0, 18.0, 13.0, 9.0, 8.0, 10.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08538055419921875, -0.0820159912109375, -0.07865142822265625, -0.075286865234375, -0.07192230224609375, -0.0685577392578125, -0.06519317626953125, -0.06182861328125, -0.05846405029296875, -0.0550994873046875, -0.05173492431640625, -0.048370361328125, -0.04500579833984375, -0.0416412353515625, -0.03827667236328125, -0.034912109375, -0.03154754638671875, -0.0281829833984375, -0.02481842041015625, -0.021453857421875, -0.01808929443359375, -0.0147247314453125, -0.01136016845703125, -0.00799560546875, -0.00463104248046875, -0.0012664794921875, 0.00209808349609375, 0.005462646484375, 0.00882720947265625, 0.0121917724609375, 0.01555633544921875, 0.0189208984375, 0.02228546142578125, 0.0256500244140625, 0.02901458740234375, 0.032379150390625, 0.03574371337890625, 0.0391082763671875, 0.04247283935546875, 0.04583740234375, 0.04920196533203125, 0.0525665283203125, 0.05593109130859375, 0.059295654296875, 0.06266021728515625, 0.0660247802734375, 0.06938934326171875, 0.07275390625, 0.07611846923828125, 0.0794830322265625, 0.08284759521484375, 0.086212158203125, 0.08957672119140625, 0.0929412841796875, 0.09630584716796875, 0.09967041015625, 0.10303497314453125, 0.1063995361328125, 0.10976409912109375, 0.113128662109375, 0.11649322509765625, 0.1198577880859375, 0.12322235107421875, 0.1265869140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 8.0, 11.0, 10.0, 18.0, 30.0, 47.0, 70.0, 122.0, 190.0, 370.0, 797.0, 1752.0, 4449.0, 11932.0, 31874.0, 82702.0, 187318.0, 302215.0, 238022.0, 112471.0, 45493.0, 17393.0, 6605.0, 2420.0, 1040.0, 543.0, 242.0, 133.0, 84.0, 46.0, 42.0, 27.0, 18.0, 9.0, 9.0, 5.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3154296875, -0.30633544921875, -0.2972412109375, -0.28814697265625, -0.279052734375, -0.26995849609375, -0.2608642578125, -0.25177001953125, -0.24267578125, -0.23358154296875, -0.2244873046875, -0.21539306640625, -0.206298828125, -0.19720458984375, -0.1881103515625, -0.17901611328125, -0.169921875, -0.16082763671875, -0.1517333984375, -0.14263916015625, -0.133544921875, -0.12445068359375, -0.1153564453125, -0.10626220703125, -0.09716796875, -0.08807373046875, -0.0789794921875, -0.06988525390625, -0.060791015625, -0.05169677734375, -0.0426025390625, -0.03350830078125, -0.0244140625, -0.01531982421875, -0.0062255859375, 0.00286865234375, 0.011962890625, 0.02105712890625, 0.0301513671875, 0.03924560546875, 0.04833984375, 0.05743408203125, 0.0665283203125, 0.07562255859375, 0.084716796875, 0.09381103515625, 0.1029052734375, 0.11199951171875, 0.12109375, 0.13018798828125, 0.1392822265625, 0.14837646484375, 0.157470703125, 0.16656494140625, 0.1756591796875, 0.18475341796875, 0.19384765625, 0.20294189453125, 0.2120361328125, 0.22113037109375, 0.230224609375, 0.23931884765625, 0.2484130859375, 0.25750732421875, 0.2666015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 3.0, 5.0, 7.0, 7.0, 6.0, 15.0, 11.0, 12.0, 17.0, 22.0, 21.0, 18.0, 29.0, 32.0, 27.0, 45.0, 45.0, 39.0, 56.0, 46.0, 53.0, 58.0, 53.0, 38.0, 46.0, 34.0, 43.0, 33.0, 34.0, 16.0, 22.0, 23.0, 15.0, 14.0, 10.0, 10.0, 9.0, 6.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.30106353759765625, -0.2910919189453125, -0.28112030029296875, -0.271148681640625, -0.26117706298828125, -0.2512054443359375, -0.24123382568359375, -0.23126220703125, -0.22129058837890625, -0.2113189697265625, -0.20134735107421875, -0.191375732421875, -0.18140411376953125, -0.1714324951171875, -0.16146087646484375, -0.1514892578125, -0.14151763916015625, -0.1315460205078125, -0.12157440185546875, -0.111602783203125, -0.10163116455078125, -0.0916595458984375, -0.08168792724609375, -0.07171630859375, -0.06174468994140625, -0.0517730712890625, -0.04180145263671875, -0.031829833984375, -0.02185821533203125, -0.0118865966796875, -0.00191497802734375, 0.008056640625, 0.01802825927734375, 0.0279998779296875, 0.03797149658203125, 0.047943115234375, 0.05791473388671875, 0.0678863525390625, 0.07785797119140625, 0.08782958984375, 0.09780120849609375, 0.1077728271484375, 0.11774444580078125, 0.127716064453125, 0.13768768310546875, 0.1476593017578125, 0.15763092041015625, 0.1676025390625, 0.17757415771484375, 0.1875457763671875, 0.19751739501953125, 0.207489013671875, 0.21746063232421875, 0.2274322509765625, 0.23740386962890625, 0.24737548828125, 0.25734710693359375, 0.2673187255859375, 0.27729034423828125, 0.287261962890625, 0.29723358154296875, 0.3072052001953125, 0.31717681884765625, 0.3271484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 11.0, 30.0, 43.0, 65.0, 73.0, 151.0, 227.0, 408.0, 638.0, 1124.0, 1857.0, 3131.0, 5346.0, 9539.0, 16325.0, 26757.0, 47353.0, 82799.0, 141833.0, 197655.0, 193518.0, 134084.0, 78837.0, 44618.0, 25530.0, 14978.0, 8819.0, 5253.0, 3053.0, 1825.0, 1039.0, 601.0, 363.0, 236.0, 133.0, 101.0, 54.0, 38.0, 30.0, 22.0, 11.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06420135498046875, -0.0620574951171875, -0.05991363525390625, -0.057769775390625, -0.05562591552734375, -0.0534820556640625, -0.05133819580078125, -0.0491943359375, -0.04705047607421875, -0.0449066162109375, -0.04276275634765625, -0.040618896484375, -0.03847503662109375, -0.0363311767578125, -0.03418731689453125, -0.03204345703125, -0.02989959716796875, -0.0277557373046875, -0.02561187744140625, -0.023468017578125, -0.02132415771484375, -0.0191802978515625, -0.01703643798828125, -0.014892578125, -0.01274871826171875, -0.0106048583984375, -0.00846099853515625, -0.006317138671875, -0.00417327880859375, -0.0020294189453125, 0.00011444091796875, 0.00225830078125, 0.00440216064453125, 0.0065460205078125, 0.00868988037109375, 0.010833740234375, 0.01297760009765625, 0.0151214599609375, 0.01726531982421875, 0.0194091796875, 0.02155303955078125, 0.0236968994140625, 0.02584075927734375, 0.027984619140625, 0.03012847900390625, 0.0322723388671875, 0.03441619873046875, 0.03656005859375, 0.03870391845703125, 0.0408477783203125, 0.04299163818359375, 0.045135498046875, 0.04727935791015625, 0.0494232177734375, 0.05156707763671875, 0.0537109375, 0.05585479736328125, 0.0579986572265625, 0.06014251708984375, 0.062286376953125, 0.06443023681640625, 0.0665740966796875, 0.06871795654296875, 0.07086181640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 7.0, 3.0, 9.0, 12.0, 14.0, 17.0, 16.0, 12.0, 30.0, 28.0, 31.0, 32.0, 57.0, 59.0, 69.0, 68.0, 82.0, 75.0, 70.0, 53.0, 49.0, 38.0, 27.0, 15.0, 25.0, 15.0, 9.0, 11.0, 9.0, 9.0, 10.0, 12.0, 3.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-05, -2.0816922187805176e-05, -2.0176172256469727e-05, -1.9535422325134277e-05, -1.8894672393798828e-05, -1.825392246246338e-05, -1.761317253112793e-05, -1.697242259979248e-05, -1.633167266845703e-05, -1.5690922737121582e-05, -1.5050172805786133e-05, -1.4409422874450684e-05, -1.3768672943115234e-05, -1.3127923011779785e-05, -1.2487173080444336e-05, -1.1846423149108887e-05, -1.1205673217773438e-05, -1.0564923286437988e-05, -9.924173355102539e-06, -9.28342342376709e-06, -8.64267349243164e-06, -8.001923561096191e-06, -7.361173629760742e-06, -6.720423698425293e-06, -6.079673767089844e-06, -5.4389238357543945e-06, -4.798173904418945e-06, -4.157423973083496e-06, -3.516674041748047e-06, -2.8759241104125977e-06, -2.2351741790771484e-06, -1.5944242477416992e-06, -9.5367431640625e-07, -3.129243850708008e-07, 3.2782554626464844e-07, 9.685754776000977e-07, 1.6093254089355469e-06, 2.250075340270996e-06, 2.8908252716064453e-06, 3.5315752029418945e-06, 4.172325134277344e-06, 4.813075065612793e-06, 5.453824996948242e-06, 6.094574928283691e-06, 6.735324859619141e-06, 7.37607479095459e-06, 8.016824722290039e-06, 8.657574653625488e-06, 9.298324584960938e-06, 9.939074516296387e-06, 1.0579824447631836e-05, 1.1220574378967285e-05, 1.1861324310302734e-05, 1.2502074241638184e-05, 1.3142824172973633e-05, 1.3783574104309082e-05, 1.4424324035644531e-05, 1.506507396697998e-05, 1.570582389831543e-05, 1.634657382965088e-05, 1.6987323760986328e-05, 1.7628073692321777e-05, 1.8268823623657227e-05, 1.8909573554992676e-05, 1.9550323486328125e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 11.0, 13.0, 17.0, 34.0, 44.0, 59.0, 86.0, 144.0, 205.0, 316.0, 512.0, 983.0, 1605.0, 2820.0, 4894.0, 8593.0, 14333.0, 24520.0, 42627.0, 78975.0, 151456.0, 230395.0, 211495.0, 125192.0, 64376.0, 34890.0, 20678.0, 12282.0, 7144.0, 4108.0, 2372.0, 1327.0, 752.0, 456.0, 300.0, 172.0, 108.0, 78.0, 53.0, 37.0, 26.0, 24.0, 16.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059814453125, -0.05766582489013672, -0.05551719665527344, -0.053368568420410156, -0.051219940185546875, -0.049071311950683594, -0.04692268371582031, -0.04477405548095703, -0.04262542724609375, -0.04047679901123047, -0.03832817077636719, -0.036179542541503906, -0.034030914306640625, -0.031882286071777344, -0.029733657836914062, -0.02758502960205078, -0.0254364013671875, -0.02328777313232422, -0.021139144897460938, -0.018990516662597656, -0.016841888427734375, -0.014693260192871094, -0.012544631958007812, -0.010396003723144531, -0.00824737548828125, -0.006098747253417969, -0.0039501190185546875, -0.0018014907836914062, 0.000347137451171875, 0.0024957656860351562, 0.0046443939208984375, 0.006793022155761719, 0.008941650390625, 0.011090278625488281, 0.013238906860351562, 0.015387535095214844, 0.017536163330078125, 0.019684791564941406, 0.021833419799804688, 0.02398204803466797, 0.02613067626953125, 0.02827930450439453, 0.030427932739257812, 0.032576560974121094, 0.034725189208984375, 0.036873817443847656, 0.03902244567871094, 0.04117107391357422, 0.0433197021484375, 0.04546833038330078, 0.04761695861816406, 0.049765586853027344, 0.051914215087890625, 0.054062843322753906, 0.05621147155761719, 0.05836009979248047, 0.06050872802734375, 0.06265735626220703, 0.06480598449707031, 0.0669546127319336, 0.06910324096679688, 0.07125186920166016, 0.07340049743652344, 0.07554912567138672, 0.07769775390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 6.0, 12.0, 6.0, 12.0, 22.0, 14.0, 23.0, 31.0, 18.0, 31.0, 37.0, 35.0, 50.0, 54.0, 52.0, 42.0, 53.0, 47.0, 46.0, 44.0, 39.0, 36.0, 29.0, 36.0, 23.0, 32.0, 25.0, 17.0, 24.0, 20.0, 14.0, 7.0, 6.0, 10.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0], "bins": [-0.07470703125, -0.07268571853637695, -0.0706644058227539, -0.06864309310913086, -0.06662178039550781, -0.06460046768188477, -0.06257915496826172, -0.06055784225463867, -0.058536529541015625, -0.05651521682739258, -0.05449390411376953, -0.052472591400146484, -0.05045127868652344, -0.04842996597290039, -0.046408653259277344, -0.0443873405456543, -0.04236602783203125, -0.0403447151184082, -0.038323402404785156, -0.03630208969116211, -0.03428077697753906, -0.032259464263916016, -0.03023815155029297, -0.028216838836669922, -0.026195526123046875, -0.024174213409423828, -0.02215290069580078, -0.020131587982177734, -0.018110275268554688, -0.01608896255493164, -0.014067649841308594, -0.012046337127685547, -0.0100250244140625, -0.008003711700439453, -0.005982398986816406, -0.003961086273193359, -0.0019397735595703125, 8.153915405273438e-05, 0.0021028518676757812, 0.004124164581298828, 0.006145477294921875, 0.008166790008544922, 0.010188102722167969, 0.012209415435791016, 0.014230728149414062, 0.01625204086303711, 0.018273353576660156, 0.020294666290283203, 0.02231597900390625, 0.024337291717529297, 0.026358604431152344, 0.02837991714477539, 0.030401229858398438, 0.032422542572021484, 0.03444385528564453, 0.03646516799926758, 0.038486480712890625, 0.04050779342651367, 0.04252910614013672, 0.044550418853759766, 0.04657173156738281, 0.04859304428100586, 0.050614356994628906, 0.05263566970825195, 0.054656982421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 14.0, 17.0, 46.0, 69.0, 80.0, 81.0, 99.0, 123.0, 118.0, 91.0, 70.0, 66.0, 50.0, 24.0, 13.0, 9.0, 10.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5441861152648926, -1.506771206855774, -1.4693562984466553, -1.431941270828247, -1.3945263624191284, -1.3571114540100098, -1.3196964263916016, -1.282281517982483, -1.2448666095733643, -1.2074517011642456, -1.170036792755127, -1.1326217651367188, -1.0952068567276, -1.0577919483184814, -1.0203769207000732, -0.9829620122909546, -0.9455471038818359, -0.9081321954727173, -0.8707172274589539, -0.8333022594451904, -0.7958873510360718, -0.7584724426269531, -0.7210574746131897, -0.6836425065994263, -0.6462275981903076, -0.608812689781189, -0.5713977217674255, -0.5339827537536621, -0.49656784534454346, -0.4591529071331024, -0.4217379689216614, -0.38432303071022034, -0.3469081521034241, -0.30949321389198303, -0.272078275680542, -0.23466333746910095, -0.1972483992576599, -0.15983346104621887, -0.12241852283477783, -0.08500358462333679, -0.04758864641189575, -0.010173708200454712, 0.027241230010986328, 0.06465616822242737, 0.10207110643386841, 0.13948604464530945, 0.1769009828567505, 0.21431592106819153, 0.25173085927963257, 0.2891457974910736, 0.32656073570251465, 0.3639756739139557, 0.40139061212539673, 0.43880555033683777, 0.4762204885482788, 0.5136353969573975, 0.5510503649711609, 0.5884653329849243, 0.625880241394043, 0.6632951498031616, 0.700710117816925, 0.7381250858306885, 0.7755399942398071, 0.8129549026489258, 0.8503698706626892]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 6.0, 9.0, 20.0, 24.0, 14.0, 19.0, 13.0, 17.0, 25.0, 20.0, 34.0, 36.0, 43.0, 35.0, 33.0, 40.0, 28.0, 42.0, 45.0, 46.0, 44.0, 35.0, 41.0, 33.0, 38.0, 28.0, 28.0, 23.0, 21.0, 19.0, 17.0, 18.0, 11.0, 14.0, 7.0, 10.0, 12.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.829835832118988, -0.8057913780212402, -0.7817469239234924, -0.7577024698257446, -0.7336580157279968, -0.709613561630249, -0.685569167137146, -0.6615246534347534, -0.6374802589416504, -0.6134358048439026, -0.5893913507461548, -0.565346896648407, -0.5413024425506592, -0.5172579884529114, -0.49321356415748596, -0.46916911005973816, -0.44512462615966797, -0.42108017206192017, -0.39703571796417236, -0.37299126386642456, -0.34894680976867676, -0.32490235567092896, -0.30085793137550354, -0.27681347727775574, -0.25276902318000793, -0.22872456908226013, -0.20468011498451233, -0.18063567578792572, -0.15659122169017792, -0.13254676759243011, -0.1085023283958435, -0.0844578742980957, -0.060413360595703125, -0.03636891022324562, -0.012324459850788116, 0.01171998679637909, 0.03576444089412689, 0.059808894991874695, 0.0838533341884613, 0.1078977882862091, 0.1319422423839569, 0.1559866964817047, 0.18003115057945251, 0.20407558977603912, 0.22812004387378693, 0.25216448307037354, 0.27620893716812134, 0.30025339126586914, 0.32429784536361694, 0.34834229946136475, 0.37238675355911255, 0.39643120765686035, 0.42047566175460815, 0.44452011585235596, 0.46856454014778137, 0.4926089942455292, 0.5166534185409546, 0.5406978726387024, 0.5647423267364502, 0.588786780834198, 0.6128312349319458, 0.6368756890296936, 0.6609201431274414, 0.6849645376205444, 0.709009051322937]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 10.0, 15.0, 17.0, 24.0, 47.0, 85.0, 141.0, 297.0, 621.0, 1386.0, 3341.0, 8898.0, 25127.0, 79419.0, 320902.0, 1652476.0, 1664127.0, 319018.0, 78520.0, 24665.0, 8992.0, 3477.0, 1356.0, 672.0, 298.0, 166.0, 85.0, 44.0, 31.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.28125, -0.27403831481933594, -0.2668266296386719, -0.2596149444580078, -0.25240325927734375, -0.2451915740966797, -0.23797988891601562, -0.23076820373535156, -0.2235565185546875, -0.21634483337402344, -0.20913314819335938, -0.2019214630126953, -0.19470977783203125, -0.1874980926513672, -0.18028640747070312, -0.17307472229003906, -0.165863037109375, -0.15865135192871094, -0.15143966674804688, -0.1442279815673828, -0.13701629638671875, -0.1298046112060547, -0.12259292602539062, -0.11538124084472656, -0.1081695556640625, -0.10095787048339844, -0.09374618530273438, -0.08653450012207031, -0.07932281494140625, -0.07211112976074219, -0.06489944458007812, -0.05768775939941406, -0.05047607421875, -0.04326438903808594, -0.036052703857421875, -0.028841018676757812, -0.02162933349609375, -0.014417648315429688, -0.007205963134765625, 5.7220458984375e-06, 0.0072174072265625, 0.014429092407226562, 0.021640777587890625, 0.028852462768554688, 0.03606414794921875, 0.04327583312988281, 0.050487518310546875, 0.05769920349121094, 0.064910888671875, 0.07212257385253906, 0.07933425903320312, 0.08654594421386719, 0.09375762939453125, 0.10096931457519531, 0.10818099975585938, 0.11539268493652344, 0.1226043701171875, 0.12981605529785156, 0.13702774047851562, 0.1442394256591797, 0.15145111083984375, 0.1586627960205078, 0.16587448120117188, 0.17308616638183594, 0.1802978515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 6.0, 13.0, 6.0, 13.0, 17.0, 21.0, 16.0, 20.0, 18.0, 27.0, 43.0, 35.0, 46.0, 43.0, 39.0, 36.0, 32.0, 34.0, 42.0, 37.0, 43.0, 50.0, 34.0, 28.0, 27.0, 36.0, 36.0, 19.0, 30.0, 24.0, 16.0, 12.0, 11.0, 12.0, 13.0, 8.0, 3.0, 12.0, 10.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10211181640625, -0.09863471984863281, -0.09515762329101562, -0.09168052673339844, -0.08820343017578125, -0.08472633361816406, -0.08124923706054688, -0.07777214050292969, -0.0742950439453125, -0.07081794738769531, -0.06734085083007812, -0.06386375427246094, -0.06038665771484375, -0.05690956115722656, -0.053432464599609375, -0.04995536804199219, -0.046478271484375, -0.04300117492675781, -0.039524078369140625, -0.03604698181152344, -0.03256988525390625, -0.029092788696289062, -0.025615692138671875, -0.022138595581054688, -0.0186614990234375, -0.015184402465820312, -0.011707305908203125, -0.008230209350585938, -0.00475311279296875, -0.0012760162353515625, 0.002201080322265625, 0.0056781768798828125, 0.0091552734375, 0.012632369995117188, 0.016109466552734375, 0.019586563110351562, 0.02306365966796875, 0.026540756225585938, 0.030017852783203125, 0.03349494934082031, 0.0369720458984375, 0.04044914245605469, 0.043926239013671875, 0.04740333557128906, 0.05088043212890625, 0.05435752868652344, 0.057834625244140625, 0.06131172180175781, 0.064788818359375, 0.06826591491699219, 0.07174301147460938, 0.07522010803222656, 0.07869720458984375, 0.08217430114746094, 0.08565139770507812, 0.08912849426269531, 0.0926055908203125, 0.09608268737792969, 0.09955978393554688, 0.10303688049316406, 0.10651397705078125, 0.10999107360839844, 0.11346817016601562, 0.11694526672363281, 0.12042236328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 5.0, 6.0, 16.0, 20.0, 35.0, 45.0, 69.0, 106.0, 173.0, 306.0, 566.0, 1083.0, 2267.0, 5305.0, 12596.0, 33386.0, 92756.0, 275323.0, 882683.0, 1801058.0, 729250.0, 230510.0, 78380.0, 28378.0, 10983.0, 4650.0, 2102.0, 992.0, 504.0, 301.0, 155.0, 95.0, 66.0, 37.0, 31.0, 19.0, 11.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.206787109375, -0.20059967041015625, -0.1944122314453125, -0.18822479248046875, -0.182037353515625, -0.17584991455078125, -0.1696624755859375, -0.16347503662109375, -0.15728759765625, -0.15110015869140625, -0.1449127197265625, -0.13872528076171875, -0.132537841796875, -0.12635040283203125, -0.1201629638671875, -0.11397552490234375, -0.1077880859375, -0.10160064697265625, -0.0954132080078125, -0.08922576904296875, -0.083038330078125, -0.07685089111328125, -0.0706634521484375, -0.06447601318359375, -0.05828857421875, -0.05210113525390625, -0.0459136962890625, -0.03972625732421875, -0.033538818359375, -0.02735137939453125, -0.0211639404296875, -0.01497650146484375, -0.0087890625, -0.00260162353515625, 0.0035858154296875, 0.00977325439453125, 0.015960693359375, 0.02214813232421875, 0.0283355712890625, 0.03452301025390625, 0.04071044921875, 0.04689788818359375, 0.0530853271484375, 0.05927276611328125, 0.065460205078125, 0.07164764404296875, 0.0778350830078125, 0.08402252197265625, 0.0902099609375, 0.09639739990234375, 0.1025848388671875, 0.10877227783203125, 0.114959716796875, 0.12114715576171875, 0.1273345947265625, 0.13352203369140625, 0.13970947265625, 0.14589691162109375, 0.1520843505859375, 0.15827178955078125, 0.164459228515625, 0.17064666748046875, 0.1768341064453125, 0.18302154541015625, 0.189208984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 2.0, 10.0, 6.0, 13.0, 16.0, 27.0, 27.0, 38.0, 60.0, 71.0, 96.0, 129.0, 184.0, 239.0, 356.0, 458.0, 524.0, 462.0, 354.0, 258.0, 184.0, 155.0, 86.0, 65.0, 68.0, 50.0, 29.0, 22.0, 18.0, 18.0, 13.0, 7.0, 11.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.253173828125, -0.2462310791015625, -0.239288330078125, -0.2323455810546875, -0.22540283203125, -0.2184600830078125, -0.211517333984375, -0.2045745849609375, -0.1976318359375, -0.1906890869140625, -0.183746337890625, -0.1768035888671875, -0.16986083984375, -0.1629180908203125, -0.155975341796875, -0.1490325927734375, -0.14208984375, -0.1351470947265625, -0.128204345703125, -0.1212615966796875, -0.11431884765625, -0.1073760986328125, -0.100433349609375, -0.0934906005859375, -0.0865478515625, -0.0796051025390625, -0.072662353515625, -0.0657196044921875, -0.05877685546875, -0.0518341064453125, -0.044891357421875, -0.0379486083984375, -0.031005859375, -0.0240631103515625, -0.017120361328125, -0.0101776123046875, -0.00323486328125, 0.0037078857421875, 0.010650634765625, 0.0175933837890625, 0.0245361328125, 0.0314788818359375, 0.038421630859375, 0.0453643798828125, 0.05230712890625, 0.0592498779296875, 0.066192626953125, 0.0731353759765625, 0.080078125, 0.0870208740234375, 0.093963623046875, 0.1009063720703125, 0.10784912109375, 0.1147918701171875, 0.121734619140625, 0.1286773681640625, 0.1356201171875, 0.1425628662109375, 0.149505615234375, 0.1564483642578125, 0.16339111328125, 0.1703338623046875, 0.177276611328125, 0.1842193603515625, 0.191162109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 15.0, 37.0, 56.0, 83.0, 122.0, 122.0, 137.0, 132.0, 91.0, 77.0, 56.0, 29.0, 23.0, 13.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9409077167510986, -1.892691731452942, -1.8444758653640747, -1.796259880065918, -1.7480440139770508, -1.699828028678894, -1.6516120433807373, -1.6033961772918701, -1.555180311203003, -1.5069643259048462, -1.458748459815979, -1.4105324745178223, -1.362316608428955, -1.3141006231307983, -1.2658846378326416, -1.2176687717437744, -1.1694527864456177, -1.121236801147461, -1.0730209350585938, -1.024804949760437, -0.9765890836715698, -0.9283730983734131, -0.8801571726799011, -0.8319412469863892, -0.7837253212928772, -0.7355093955993652, -0.6872934699058533, -0.6390775442123413, -0.5908615589141846, -0.5426456928253174, -0.49442970752716064, -0.4462137818336487, -0.3979978561401367, -0.34978193044662476, -0.3015660047531128, -0.25335004925727844, -0.20513412356376648, -0.15691819787025452, -0.10870224237442017, -0.0604863166809082, -0.01227039098739624, 0.03594554215669632, 0.08416147530078888, 0.13237741589546204, 0.180593341588974, 0.22880926728248596, 0.2770252227783203, 0.3252411484718323, 0.37345707416534424, 0.4216729998588562, 0.46988892555236816, 0.5181049108505249, 0.5663207769393921, 0.6145367622375488, 0.6627526879310608, 0.7109686136245728, 0.7591845393180847, 0.8074004650115967, 0.8556163907051086, 0.9038323163986206, 0.9520483016967773, 1.0002641677856445, 1.0484801530838013, 1.096696138381958, 1.1449120044708252]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 5.0, 5.0, 0.0, 9.0, 9.0, 8.0, 19.0, 20.0, 25.0, 26.0, 20.0, 32.0, 32.0, 35.0, 41.0, 39.0, 36.0, 53.0, 42.0, 39.0, 34.0, 43.0, 51.0, 30.0, 39.0, 31.0, 30.0, 30.0, 28.0, 38.0, 32.0, 21.0, 20.0, 15.0, 7.0, 10.0, 5.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6615331768989563, -0.6389403343200684, -0.6163474917411804, -0.5937546491622925, -0.5711618661880493, -0.5485690236091614, -0.5259761810302734, -0.5033833384513855, -0.48079052567481995, -0.458197683095932, -0.43560487031936646, -0.4130120277404785, -0.3904191851615906, -0.367826372385025, -0.3452335298061371, -0.32264071702957153, -0.3000478744506836, -0.27745503187179565, -0.2548622190952301, -0.23226937651634216, -0.20967654883861542, -0.18708372116088867, -0.16449087858200073, -0.141898050904274, -0.11930522322654724, -0.0967123955488205, -0.07411956042051315, -0.05152672529220581, -0.028933897614479065, -0.006341069936752319, 0.01625177264213562, 0.038844600319862366, 0.061437368392944336, 0.08403019607067108, 0.10662303119897842, 0.12921586632728577, 0.1518086940050125, 0.17440152168273926, 0.1969943642616272, 0.21958719193935394, 0.2421800196170807, 0.26477286219596863, 0.2873656749725342, 0.3099585175514221, 0.33255136013031006, 0.3551441729068756, 0.37773701548576355, 0.4003298282623291, 0.42292267084121704, 0.445515513420105, 0.46810832619667053, 0.49070116877555847, 0.513293981552124, 0.535886824131012, 0.5584796667098999, 0.5810725092887878, 0.6036653518676758, 0.6262581944465637, 0.6488510370254517, 0.6714438199996948, 0.6940366625785828, 0.7166295051574707, 0.7392223477363586, 0.7618151903152466, 0.7844079732894897]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 9.0, 10.0, 16.0, 21.0, 39.0, 55.0, 124.0, 189.0, 323.0, 597.0, 1005.0, 1841.0, 3299.0, 5960.0, 10942.0, 19232.0, 33271.0, 56419.0, 92424.0, 143343.0, 190120.0, 177255.0, 123121.0, 78414.0, 47350.0, 27418.0, 15952.0, 8821.0, 4863.0, 2689.0, 1532.0, 776.0, 458.0, 266.0, 142.0, 91.0, 57.0, 35.0, 21.0, 20.0, 11.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2303466796875, -0.22310829162597656, -0.21586990356445312, -0.2086315155029297, -0.20139312744140625, -0.1941547393798828, -0.18691635131835938, -0.17967796325683594, -0.1724395751953125, -0.16520118713378906, -0.15796279907226562, -0.1507244110107422, -0.14348602294921875, -0.1362476348876953, -0.12900924682617188, -0.12177085876464844, -0.114532470703125, -0.10729408264160156, -0.10005569458007812, -0.09281730651855469, -0.08557891845703125, -0.07834053039550781, -0.07110214233398438, -0.06386375427246094, -0.0566253662109375, -0.04938697814941406, -0.042148590087890625, -0.03491020202636719, -0.02767181396484375, -0.020433425903320312, -0.013195037841796875, -0.0059566497802734375, 0.00128173828125, 0.008520126342773438, 0.015758514404296875, 0.022996902465820312, 0.03023529052734375, 0.03747367858886719, 0.044712066650390625, 0.05195045471191406, 0.0591888427734375, 0.06642723083496094, 0.07366561889648438, 0.08090400695800781, 0.08814239501953125, 0.09538078308105469, 0.10261917114257812, 0.10985755920410156, 0.117095947265625, 0.12433433532714844, 0.13157272338867188, 0.1388111114501953, 0.14604949951171875, 0.1532878875732422, 0.16052627563476562, 0.16776466369628906, 0.1750030517578125, 0.18224143981933594, 0.18947982788085938, 0.1967182159423828, 0.20395660400390625, 0.2111949920654297, 0.21843338012695312, 0.22567176818847656, 0.23291015625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 8.0, 11.0, 8.0, 19.0, 16.0, 24.0, 19.0, 30.0, 21.0, 38.0, 40.0, 32.0, 32.0, 47.0, 33.0, 43.0, 36.0, 36.0, 36.0, 43.0, 41.0, 33.0, 42.0, 35.0, 26.0, 28.0, 27.0, 22.0, 20.0, 29.0, 26.0, 14.0, 7.0, 9.0, 11.0, 8.0, 5.0, 8.0, 7.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1007080078125, -0.0974264144897461, -0.09414482116699219, -0.09086322784423828, -0.08758163452148438, -0.08430004119873047, -0.08101844787597656, -0.07773685455322266, -0.07445526123046875, -0.07117366790771484, -0.06789207458496094, -0.06461048126220703, -0.061328887939453125, -0.05804729461669922, -0.05476570129394531, -0.051484107971191406, -0.0482025146484375, -0.044920921325683594, -0.04163932800292969, -0.03835773468017578, -0.035076141357421875, -0.03179454803466797, -0.028512954711914062, -0.025231361389160156, -0.02194976806640625, -0.018668174743652344, -0.015386581420898438, -0.012104988098144531, -0.008823394775390625, -0.005541801452636719, -0.0022602081298828125, 0.0010213851928710938, 0.004302978515625, 0.007584571838378906, 0.010866165161132812, 0.014147758483886719, 0.017429351806640625, 0.02071094512939453, 0.023992538452148438, 0.027274131774902344, 0.03055572509765625, 0.033837318420410156, 0.03711891174316406, 0.04040050506591797, 0.043682098388671875, 0.04696369171142578, 0.05024528503417969, 0.053526878356933594, 0.0568084716796875, 0.060090065002441406, 0.06337165832519531, 0.06665325164794922, 0.06993484497070312, 0.07321643829345703, 0.07649803161621094, 0.07977962493896484, 0.08306121826171875, 0.08634281158447266, 0.08962440490722656, 0.09290599822998047, 0.09618759155273438, 0.09946918487548828, 0.10275077819824219, 0.1060323715209961, 0.10931396484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 9.0, 2.0, 5.0, 6.0, 12.0, 17.0, 21.0, 32.0, 59.0, 97.0, 177.0, 388.0, 795.0, 1835.0, 3887.0, 9177.0, 20274.0, 46050.0, 98605.0, 186959.0, 264148.0, 207133.0, 112508.0, 53179.0, 23884.0, 10722.0, 4632.0, 2076.0, 936.0, 420.0, 209.0, 126.0, 62.0, 45.0, 19.0, 10.0, 11.0, 9.0, 4.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2763671875, -0.26702880859375, -0.2576904296875, -0.24835205078125, -0.239013671875, -0.22967529296875, -0.2203369140625, -0.21099853515625, -0.20166015625, -0.19232177734375, -0.1829833984375, -0.17364501953125, -0.164306640625, -0.15496826171875, -0.1456298828125, -0.13629150390625, -0.126953125, -0.11761474609375, -0.1082763671875, -0.09893798828125, -0.089599609375, -0.08026123046875, -0.0709228515625, -0.06158447265625, -0.05224609375, -0.04290771484375, -0.0335693359375, -0.02423095703125, -0.014892578125, -0.00555419921875, 0.0037841796875, 0.01312255859375, 0.0224609375, 0.03179931640625, 0.0411376953125, 0.05047607421875, 0.059814453125, 0.06915283203125, 0.0784912109375, 0.08782958984375, 0.09716796875, 0.10650634765625, 0.1158447265625, 0.12518310546875, 0.134521484375, 0.14385986328125, 0.1531982421875, 0.16253662109375, 0.171875, 0.18121337890625, 0.1905517578125, 0.19989013671875, 0.209228515625, 0.21856689453125, 0.2279052734375, 0.23724365234375, 0.24658203125, 0.25592041015625, 0.2652587890625, 0.27459716796875, 0.283935546875, 0.29327392578125, 0.3026123046875, 0.31195068359375, 0.3212890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 14.0, 5.0, 12.0, 16.0, 12.0, 13.0, 16.0, 28.0, 20.0, 21.0, 25.0, 40.0, 29.0, 39.0, 36.0, 27.0, 41.0, 51.0, 44.0, 42.0, 36.0, 39.0, 37.0, 44.0, 33.0, 25.0, 38.0, 18.0, 28.0, 26.0, 21.0, 15.0, 14.0, 17.0, 11.0, 8.0, 8.0, 7.0, 11.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.330810546875, -0.3212776184082031, -0.31174468994140625, -0.3022117614746094, -0.2926788330078125, -0.2831459045410156, -0.27361297607421875, -0.2640800476074219, -0.254547119140625, -0.24501419067382812, -0.23548126220703125, -0.22594833374023438, -0.2164154052734375, -0.20688247680664062, -0.19734954833984375, -0.18781661987304688, -0.17828369140625, -0.16875076293945312, -0.15921783447265625, -0.14968490600585938, -0.1401519775390625, -0.13061904907226562, -0.12108612060546875, -0.11155319213867188, -0.102020263671875, -0.09248733520507812, -0.08295440673828125, -0.07342147827148438, -0.0638885498046875, -0.054355621337890625, -0.04482269287109375, -0.035289764404296875, -0.0257568359375, -0.016223907470703125, -0.00669097900390625, 0.002841949462890625, 0.0123748779296875, 0.021907806396484375, 0.03144073486328125, 0.040973663330078125, 0.050506591796875, 0.060039520263671875, 0.06957244873046875, 0.07910537719726562, 0.0886383056640625, 0.09817123413085938, 0.10770416259765625, 0.11723709106445312, 0.12677001953125, 0.13630294799804688, 0.14583587646484375, 0.15536880493164062, 0.1649017333984375, 0.17443466186523438, 0.18396759033203125, 0.19350051879882812, 0.203033447265625, 0.21256637573242188, 0.22209930419921875, 0.23163223266601562, 0.2411651611328125, 0.2506980895996094, 0.26023101806640625, 0.2697639465332031, 0.279296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 10.0, 29.0, 34.0, 56.0, 118.0, 198.0, 321.0, 621.0, 1125.0, 1897.0, 3781.0, 6997.0, 13212.0, 23931.0, 43673.0, 75150.0, 124917.0, 180607.0, 196858.0, 151916.0, 96593.0, 56725.0, 31780.0, 17503.0, 9365.0, 5144.0, 2748.0, 1469.0, 780.0, 438.0, 243.0, 133.0, 65.0, 50.0, 24.0, 19.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0924072265625, -0.08985710144042969, -0.08730697631835938, -0.08475685119628906, -0.08220672607421875, -0.07965660095214844, -0.07710647583007812, -0.07455635070800781, -0.0720062255859375, -0.06945610046386719, -0.06690597534179688, -0.06435585021972656, -0.06180572509765625, -0.05925559997558594, -0.056705474853515625, -0.05415534973144531, -0.051605224609375, -0.04905509948730469, -0.046504974365234375, -0.04395484924316406, -0.04140472412109375, -0.03885459899902344, -0.036304473876953125, -0.03375434875488281, -0.0312042236328125, -0.028654098510742188, -0.026103973388671875, -0.023553848266601562, -0.02100372314453125, -0.018453598022460938, -0.015903472900390625, -0.013353347778320312, -0.01080322265625, -0.008253097534179688, -0.005702972412109375, -0.0031528472900390625, -0.00060272216796875, 0.0019474029541015625, 0.004497528076171875, 0.0070476531982421875, 0.0095977783203125, 0.012147903442382812, 0.014698028564453125, 0.017248153686523438, 0.01979827880859375, 0.022348403930664062, 0.024898529052734375, 0.027448654174804688, 0.029998779296875, 0.03254890441894531, 0.035099029541015625, 0.03764915466308594, 0.04019927978515625, 0.04274940490722656, 0.045299530029296875, 0.04784965515136719, 0.0503997802734375, 0.05294990539550781, 0.055500030517578125, 0.05805015563964844, 0.06060028076171875, 0.06315040588378906, 0.06570053100585938, 0.06825065612792969, 0.07080078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 10.0, 7.0, 11.0, 11.0, 16.0, 15.0, 23.0, 24.0, 31.0, 35.0, 39.0, 49.0, 50.0, 46.0, 45.0, 54.0, 62.0, 59.0, 67.0, 46.0, 50.0, 32.0, 31.0, 29.0, 19.0, 20.0, 17.0, 10.0, 6.0, 10.0, 6.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1398067474365234e-05, -2.0689330995082855e-05, -1.9980594515800476e-05, -1.9271858036518097e-05, -1.8563121557235718e-05, -1.785438507795334e-05, -1.714564859867096e-05, -1.643691211938858e-05, -1.57281756401062e-05, -1.5019439160823822e-05, -1.4310702681541443e-05, -1.3601966202259064e-05, -1.2893229722976685e-05, -1.2184493243694305e-05, -1.1475756764411926e-05, -1.0767020285129547e-05, -1.0058283805847168e-05, -9.349547326564789e-06, -8.64081084728241e-06, -7.93207436800003e-06, -7.223337888717651e-06, -6.514601409435272e-06, -5.805864930152893e-06, -5.097128450870514e-06, -4.388391971588135e-06, -3.6796554923057556e-06, -2.9709190130233765e-06, -2.2621825337409973e-06, -1.5534460544586182e-06, -8.44709575176239e-07, -1.3597309589385986e-07, 5.727633833885193e-07, 1.2814998626708984e-06, 1.9902363419532776e-06, 2.6989728212356567e-06, 3.407709300518036e-06, 4.116445779800415e-06, 4.825182259082794e-06, 5.533918738365173e-06, 6.2426552176475525e-06, 6.951391696929932e-06, 7.66012817621231e-06, 8.36886465549469e-06, 9.077601134777069e-06, 9.786337614059448e-06, 1.0495074093341827e-05, 1.1203810572624207e-05, 1.1912547051906586e-05, 1.2621283531188965e-05, 1.3330020010471344e-05, 1.4038756489753723e-05, 1.4747492969036102e-05, 1.545622944831848e-05, 1.616496592760086e-05, 1.687370240688324e-05, 1.758243888616562e-05, 1.8291175365447998e-05, 1.8999911844730377e-05, 1.9708648324012756e-05, 2.0417384803295135e-05, 2.1126121282577515e-05, 2.1834857761859894e-05, 2.2543594241142273e-05, 2.3252330720424652e-05, 2.396106719970703e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 9.0, 14.0, 24.0, 36.0, 69.0, 79.0, 144.0, 250.0, 431.0, 700.0, 1301.0, 2183.0, 4041.0, 7045.0, 12947.0, 22397.0, 38389.0, 64364.0, 103626.0, 152786.0, 184752.0, 163163.0, 115037.0, 72223.0, 43667.0, 25225.0, 14507.0, 8211.0, 4752.0, 2583.0, 1492.0, 830.0, 494.0, 281.0, 175.0, 120.0, 67.0, 45.0, 33.0, 19.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.069580078125, -0.06744670867919922, -0.06531333923339844, -0.06317996978759766, -0.061046600341796875, -0.058913230895996094, -0.05677986145019531, -0.05464649200439453, -0.05251312255859375, -0.05037975311279297, -0.04824638366699219, -0.046113014221191406, -0.043979644775390625, -0.041846275329589844, -0.03971290588378906, -0.03757953643798828, -0.0354461669921875, -0.03331279754638672, -0.031179428100585938, -0.029046058654785156, -0.026912689208984375, -0.024779319763183594, -0.022645950317382812, -0.02051258087158203, -0.01837921142578125, -0.01624584197998047, -0.014112472534179688, -0.011979103088378906, -0.009845733642578125, -0.007712364196777344, -0.0055789947509765625, -0.0034456253051757812, -0.001312255859375, 0.0008211135864257812, 0.0029544830322265625, 0.005087852478027344, 0.007221221923828125, 0.009354591369628906, 0.011487960815429688, 0.013621330261230469, 0.01575469970703125, 0.01788806915283203, 0.020021438598632812, 0.022154808044433594, 0.024288177490234375, 0.026421546936035156, 0.028554916381835938, 0.03068828582763672, 0.0328216552734375, 0.03495502471923828, 0.03708839416503906, 0.039221763610839844, 0.041355133056640625, 0.043488502502441406, 0.04562187194824219, 0.04775524139404297, 0.04988861083984375, 0.05202198028564453, 0.05415534973144531, 0.056288719177246094, 0.058422088623046875, 0.060555458068847656, 0.06268882751464844, 0.06482219696044922, 0.06695556640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 6.0, 8.0, 10.0, 14.0, 9.0, 18.0, 14.0, 19.0, 27.0, 25.0, 28.0, 40.0, 60.0, 46.0, 65.0, 66.0, 92.0, 67.0, 59.0, 49.0, 38.0, 35.0, 44.0, 22.0, 34.0, 28.0, 8.0, 15.0, 14.0, 8.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1048583984375, -0.10190582275390625, -0.0989532470703125, -0.09600067138671875, -0.093048095703125, -0.09009552001953125, -0.0871429443359375, -0.08419036865234375, -0.08123779296875, -0.07828521728515625, -0.0753326416015625, -0.07238006591796875, -0.069427490234375, -0.06647491455078125, -0.0635223388671875, -0.06056976318359375, -0.0576171875, -0.05466461181640625, -0.0517120361328125, -0.04875946044921875, -0.045806884765625, -0.04285430908203125, -0.0399017333984375, -0.03694915771484375, -0.03399658203125, -0.03104400634765625, -0.0280914306640625, -0.02513885498046875, -0.022186279296875, -0.01923370361328125, -0.0162811279296875, -0.01332855224609375, -0.0103759765625, -0.00742340087890625, -0.0044708251953125, -0.00151824951171875, 0.001434326171875, 0.00438690185546875, 0.0073394775390625, 0.01029205322265625, 0.01324462890625, 0.01619720458984375, 0.0191497802734375, 0.02210235595703125, 0.025054931640625, 0.02800750732421875, 0.0309600830078125, 0.03391265869140625, 0.036865234375, 0.03981781005859375, 0.0427703857421875, 0.04572296142578125, 0.048675537109375, 0.05162811279296875, 0.0545806884765625, 0.05753326416015625, 0.06048583984375, 0.06343841552734375, 0.0663909912109375, 0.06934356689453125, 0.072296142578125, 0.07524871826171875, 0.0782012939453125, 0.08115386962890625, 0.0841064453125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 10.0, 13.0, 12.0, 21.0, 39.0, 58.0, 86.0, 128.0, 126.0, 103.0, 116.0, 88.0, 78.0, 52.0, 33.0, 18.0, 9.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3004951477050781, -1.2525471448898315, -1.204599142074585, -1.1566511392593384, -1.1087031364440918, -1.0607551336288452, -1.0128071308135986, -0.964859127998352, -0.9169111251831055, -0.8689631223678589, -0.8210151195526123, -0.7730671167373657, -0.7251191139221191, -0.6771711111068726, -0.629223108291626, -0.5812751054763794, -0.5333271026611328, -0.48537909984588623, -0.43743109703063965, -0.38948309421539307, -0.3415350914001465, -0.2935870885848999, -0.24563908576965332, -0.19769108295440674, -0.14974308013916016, -0.10179507732391357, -0.05384707450866699, -0.00589907169342041, 0.04204893112182617, 0.08999693393707275, 0.13794493675231934, 0.18589293956756592, 0.2338409423828125, 0.2817889451980591, 0.32973694801330566, 0.37768495082855225, 0.42563295364379883, 0.4735809564590454, 0.521528959274292, 0.5694769620895386, 0.6174249649047852, 0.6653729677200317, 0.7133209705352783, 0.7612689733505249, 0.8092169761657715, 0.8571649789810181, 0.9051129817962646, 0.9530609846115112, 1.0010089874267578, 1.0489569902420044, 1.096904993057251, 1.1448529958724976, 1.1928009986877441, 1.2407490015029907, 1.2886970043182373, 1.3366450071334839, 1.3845930099487305, 1.432541012763977, 1.4804890155792236, 1.5284370183944702, 1.5763850212097168, 1.6243330240249634, 1.67228102684021, 1.7202290296554565, 1.7681770324707031]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 13.0, 7.0, 6.0, 10.0, 15.0, 10.0, 17.0, 20.0, 15.0, 23.0, 25.0, 23.0, 36.0, 39.0, 37.0, 51.0, 42.0, 43.0, 44.0, 48.0, 37.0, 44.0, 41.0, 45.0, 36.0, 45.0, 23.0, 26.0, 27.0, 35.0, 21.0, 24.0, 17.0, 12.0, 7.0, 7.0, 5.0, 9.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9006566405296326, -0.8736768364906311, -0.8466969728469849, -0.8197171688079834, -0.7927373051643372, -0.7657575011253357, -0.7387776374816895, -0.711797833442688, -0.6848180294036865, -0.6578382253646851, -0.6308583617210388, -0.6038785576820374, -0.5768986940383911, -0.5499188899993896, -0.5229390859603882, -0.49595922231674194, -0.4689793586730957, -0.44199952483177185, -0.415019690990448, -0.38803988695144653, -0.3610600233078003, -0.33408021926879883, -0.307100385427475, -0.2801205515861511, -0.25314071774482727, -0.22616088390350342, -0.19918105006217957, -0.1722012311220169, -0.14522139728069305, -0.1182415634393692, -0.09126174449920654, -0.06428191065788269, -0.03730213642120361, -0.01032230630517006, 0.016657523810863495, 0.04363735020160675, 0.0706171840429306, 0.09759701788425446, 0.12457683682441711, 0.15155667066574097, 0.17853650450706482, 0.20551633834838867, 0.23249617218971252, 0.2594760060310364, 0.28645581007003784, 0.3134356737136841, 0.34041547775268555, 0.3673953115940094, 0.39437514543533325, 0.4213549792766571, 0.44833481311798096, 0.4753146171569824, 0.5022944808006287, 0.5292742848396301, 0.5562541484832764, 0.5832339525222778, 0.6102137565612793, 0.6371935606002808, 0.664173424243927, 0.6911532282829285, 0.7181330919265747, 0.7451128959655762, 0.7720927000045776, 0.7990725636482239, 0.8260524272918701]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 6.0, 6.0, 11.0, 24.0, 29.0, 30.0, 55.0, 85.0, 126.0, 213.0, 362.0, 587.0, 1121.0, 2318.0, 5038.0, 11365.0, 27766.0, 76261.0, 265715.0, 1333553.0, 1918811.0, 386834.0, 102246.0, 35700.0, 14032.0, 6070.0, 2789.0, 1350.0, 711.0, 453.0, 233.0, 127.0, 71.0, 48.0, 43.0, 37.0, 15.0, 13.0, 13.0, 9.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.2763671875, -0.26947975158691406, -0.2625923156738281, -0.2557048797607422, -0.24881744384765625, -0.2419300079345703, -0.23504257202148438, -0.22815513610839844, -0.2212677001953125, -0.21438026428222656, -0.20749282836914062, -0.2006053924560547, -0.19371795654296875, -0.1868305206298828, -0.17994308471679688, -0.17305564880371094, -0.166168212890625, -0.15928077697753906, -0.15239334106445312, -0.1455059051513672, -0.13861846923828125, -0.1317310333251953, -0.12484359741210938, -0.11795616149902344, -0.1110687255859375, -0.10418128967285156, -0.09729385375976562, -0.09040641784667969, -0.08351898193359375, -0.07663154602050781, -0.06974411010742188, -0.06285667419433594, -0.05596923828125, -0.04908180236816406, -0.042194366455078125, -0.03530693054199219, -0.02841949462890625, -0.021532058715820312, -0.014644622802734375, -0.0077571868896484375, -0.0008697509765625, 0.0060176849365234375, 0.012905120849609375, 0.019792556762695312, 0.02667999267578125, 0.03356742858886719, 0.040454864501953125, 0.04734230041503906, 0.054229736328125, 0.06111717224121094, 0.06800460815429688, 0.07489204406738281, 0.08177947998046875, 0.08866691589355469, 0.09555435180664062, 0.10244178771972656, 0.1093292236328125, 0.11621665954589844, 0.12310409545898438, 0.1299915313720703, 0.13687896728515625, 0.1437664031982422, 0.15065383911132812, 0.15754127502441406, 0.1644287109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 10.0, 9.0, 12.0, 10.0, 15.0, 25.0, 21.0, 23.0, 29.0, 35.0, 29.0, 35.0, 24.0, 47.0, 52.0, 41.0, 41.0, 39.0, 30.0, 55.0, 35.0, 46.0, 38.0, 32.0, 32.0, 43.0, 28.0, 25.0, 14.0, 22.0, 16.0, 9.0, 11.0, 13.0, 15.0, 7.0, 5.0, 3.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.125, -0.121063232421875, -0.11712646484375, -0.113189697265625, -0.1092529296875, -0.105316162109375, -0.10137939453125, -0.097442626953125, -0.093505859375, -0.089569091796875, -0.08563232421875, -0.081695556640625, -0.0777587890625, -0.073822021484375, -0.06988525390625, -0.065948486328125, -0.06201171875, -0.058074951171875, -0.05413818359375, -0.050201416015625, -0.0462646484375, -0.042327880859375, -0.03839111328125, -0.034454345703125, -0.030517578125, -0.026580810546875, -0.02264404296875, -0.018707275390625, -0.0147705078125, -0.010833740234375, -0.00689697265625, -0.002960205078125, 0.0009765625, 0.004913330078125, 0.00885009765625, 0.012786865234375, 0.0167236328125, 0.020660400390625, 0.02459716796875, 0.028533935546875, 0.032470703125, 0.036407470703125, 0.04034423828125, 0.044281005859375, 0.0482177734375, 0.052154541015625, 0.05609130859375, 0.060028076171875, 0.06396484375, 0.067901611328125, 0.07183837890625, 0.075775146484375, 0.0797119140625, 0.083648681640625, 0.08758544921875, 0.091522216796875, 0.095458984375, 0.099395751953125, 0.10333251953125, 0.107269287109375, 0.1112060546875, 0.115142822265625, 0.11907958984375, 0.123016357421875, 0.126953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 13.0, 12.0, 14.0, 21.0, 37.0, 52.0, 61.0, 132.0, 220.0, 380.0, 632.0, 1006.0, 1903.0, 3381.0, 6468.0, 13211.0, 28205.0, 63553.0, 149840.0, 388049.0, 1146051.0, 1504749.0, 535679.0, 198760.0, 81819.0, 35978.0, 16606.0, 8056.0, 4080.0, 2209.0, 1252.0, 707.0, 411.0, 259.0, 160.0, 104.0, 67.0, 63.0, 27.0, 17.0, 7.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.18509864807128906, -0.17915725708007812, -0.1732158660888672, -0.16727447509765625, -0.1613330841064453, -0.15539169311523438, -0.14945030212402344, -0.1435089111328125, -0.13756752014160156, -0.13162612915039062, -0.1256847381591797, -0.11974334716796875, -0.11380195617675781, -0.10786056518554688, -0.10191917419433594, -0.095977783203125, -0.09003639221191406, -0.08409500122070312, -0.07815361022949219, -0.07221221923828125, -0.06627082824707031, -0.060329437255859375, -0.05438804626464844, -0.0484466552734375, -0.04250526428222656, -0.036563873291015625, -0.030622482299804688, -0.02468109130859375, -0.018739700317382812, -0.012798309326171875, -0.0068569183349609375, -0.00091552734375, 0.0050258636474609375, 0.010967254638671875, 0.016908645629882812, 0.02285003662109375, 0.028791427612304688, 0.034732818603515625, 0.04067420959472656, 0.0466156005859375, 0.05255699157714844, 0.058498382568359375, 0.06443977355957031, 0.07038116455078125, 0.07632255554199219, 0.08226394653320312, 0.08820533752441406, 0.094146728515625, 0.10008811950683594, 0.10602951049804688, 0.11197090148925781, 0.11791229248046875, 0.12385368347167969, 0.12979507446289062, 0.13573646545410156, 0.1416778564453125, 0.14761924743652344, 0.15356063842773438, 0.1595020294189453, 0.16544342041015625, 0.1713848114013672, 0.17732620239257812, 0.18326759338378906, 0.189208984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 12.0, 7.0, 14.0, 17.0, 30.0, 32.0, 46.0, 77.0, 102.0, 133.0, 197.0, 261.0, 461.0, 599.0, 612.0, 464.0, 309.0, 207.0, 126.0, 103.0, 84.0, 52.0, 35.0, 31.0, 16.0, 10.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274169921875, -0.2661113739013672, -0.2580528259277344, -0.24999427795410156, -0.24193572998046875, -0.23387718200683594, -0.22581863403320312, -0.2177600860595703, -0.2097015380859375, -0.2016429901123047, -0.19358444213867188, -0.18552589416503906, -0.17746734619140625, -0.16940879821777344, -0.16135025024414062, -0.1532917022705078, -0.145233154296875, -0.1371746063232422, -0.12911605834960938, -0.12105751037597656, -0.11299896240234375, -0.10494041442871094, -0.09688186645507812, -0.08882331848144531, -0.0807647705078125, -0.07270622253417969, -0.06464767456054688, -0.05658912658691406, -0.04853057861328125, -0.04047203063964844, -0.032413482666015625, -0.024354934692382812, -0.01629638671875, -0.008237838745117188, -0.000179290771484375, 0.007879257202148438, 0.01593780517578125, 0.023996353149414062, 0.032054901123046875, 0.04011344909667969, 0.0481719970703125, 0.05623054504394531, 0.06428909301757812, 0.07234764099121094, 0.08040618896484375, 0.08846473693847656, 0.09652328491210938, 0.10458183288574219, 0.112640380859375, 0.12069892883300781, 0.12875747680664062, 0.13681602478027344, 0.14487457275390625, 0.15293312072753906, 0.16099166870117188, 0.1690502166748047, 0.1771087646484375, 0.1851673126220703, 0.19322586059570312, 0.20128440856933594, 0.20934295654296875, 0.21740150451660156, 0.22546005249023438, 0.2335186004638672, 0.2415771484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 18.0, 28.0, 21.0, 50.0, 60.0, 59.0, 80.0, 83.0, 85.0, 116.0, 70.0, 68.0, 54.0, 50.0, 48.0, 24.0, 27.0, 20.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.499582052230835, -1.466069221496582, -1.4325562715530396, -1.399043321609497, -1.3655304908752441, -1.3320176601409912, -1.2985047101974487, -1.2649917602539062, -1.2314789295196533, -1.1979660987854004, -1.164453148841858, -1.1309401988983154, -1.0974273681640625, -1.0639145374298096, -1.030401587486267, -0.9968886971473694, -0.9633758068084717, -0.929862916469574, -0.8963500261306763, -0.8628371357917786, -0.8293242454528809, -0.7958113551139832, -0.7622984647750854, -0.7287855744361877, -0.69527268409729, -0.6617597937583923, -0.6282469034194946, -0.5947340130805969, -0.5612211227416992, -0.5277082324028015, -0.4941953420639038, -0.4606824517250061, -0.4271695017814636, -0.3936566114425659, -0.3601437211036682, -0.3266308307647705, -0.2931179404258728, -0.2596050500869751, -0.2260921597480774, -0.1925792694091797, -0.15906637907028198, -0.12555348873138428, -0.09204059839248657, -0.05852770805358887, -0.025014817714691162, 0.008498072624206543, 0.04201096296310425, 0.07552385330200195, 0.10903674364089966, 0.14254963397979736, 0.17606252431869507, 0.20957541465759277, 0.24308830499649048, 0.2766011953353882, 0.3101140856742859, 0.3436269760131836, 0.3771398663520813, 0.410652756690979, 0.4441656470298767, 0.4776785373687744, 0.5111914277076721, 0.5447043180465698, 0.5782172083854675, 0.6117300987243652, 0.6452429890632629]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 11.0, 8.0, 10.0, 7.0, 14.0, 10.0, 3.0, 23.0, 21.0, 28.0, 28.0, 34.0, 33.0, 48.0, 34.0, 51.0, 37.0, 49.0, 36.0, 43.0, 45.0, 37.0, 40.0, 34.0, 23.0, 34.0, 20.0, 20.0, 32.0, 26.0, 25.0, 15.0, 15.0, 17.0, 18.0, 6.0, 10.0, 7.0, 14.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.5979805588722229, -0.5795903205871582, -0.5612000823020935, -0.542809784412384, -0.5244195461273193, -0.5060293078422546, -0.48763906955718994, -0.46924883127212524, -0.45085856318473816, -0.43246832489967346, -0.4140780568122864, -0.3956878185272217, -0.377297580242157, -0.3589073121547699, -0.3405170738697052, -0.3221268057823181, -0.3037365674972534, -0.2853463292121887, -0.26695606112480164, -0.24856582283973694, -0.23017556965351105, -0.21178531646728516, -0.19339507818222046, -0.17500482499599457, -0.15661457180976868, -0.13822431862354279, -0.11983407288789749, -0.1014438271522522, -0.0830535739660263, -0.06466332077980042, -0.04627307504415512, -0.027882829308509827, -0.009492635726928711, 0.008897613734006882, 0.027287863194942474, 0.04567811265587807, 0.06406836211681366, 0.08245861530303955, 0.10084886103868484, 0.11923910677433014, 0.13762935996055603, 0.15601961314678192, 0.1744098663330078, 0.1928001046180725, 0.2111903578042984, 0.2295806109905243, 0.247970849275589, 0.2663611173629761, 0.28475135564804077, 0.30314159393310547, 0.32153186202049255, 0.33992210030555725, 0.35831236839294434, 0.37670260667800903, 0.39509284496307373, 0.4134830832481384, 0.4318733513355255, 0.4502635896205902, 0.4686538577079773, 0.487044095993042, 0.5054343342781067, 0.5238245725631714, 0.5422148704528809, 0.5606051087379456, 0.5789953470230103]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 14.0, 14.0, 19.0, 34.0, 48.0, 72.0, 103.0, 172.0, 300.0, 476.0, 808.0, 1400.0, 2345.0, 3841.0, 6368.0, 11010.0, 18611.0, 32496.0, 57235.0, 102953.0, 173186.0, 217734.0, 175603.0, 105296.0, 58633.0, 32781.0, 19304.0, 11238.0, 6690.0, 3960.0, 2337.0, 1396.0, 814.0, 487.0, 304.0, 177.0, 106.0, 63.0, 48.0, 30.0, 15.0, 9.0, 5.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19647979736328125, -0.1895904541015625, -0.18270111083984375, -0.175811767578125, -0.16892242431640625, -0.1620330810546875, -0.15514373779296875, -0.14825439453125, -0.14136505126953125, -0.1344757080078125, -0.12758636474609375, -0.120697021484375, -0.11380767822265625, -0.1069183349609375, -0.10002899169921875, -0.0931396484375, -0.08625030517578125, -0.0793609619140625, -0.07247161865234375, -0.065582275390625, -0.05869293212890625, -0.0518035888671875, -0.04491424560546875, -0.03802490234375, -0.03113555908203125, -0.0242462158203125, -0.01735687255859375, -0.010467529296875, -0.00357818603515625, 0.0033111572265625, 0.01020050048828125, 0.01708984375, 0.02397918701171875, 0.0308685302734375, 0.03775787353515625, 0.044647216796875, 0.05153656005859375, 0.0584259033203125, 0.06531524658203125, 0.07220458984375, 0.07909393310546875, 0.0859832763671875, 0.09287261962890625, 0.099761962890625, 0.10665130615234375, 0.1135406494140625, 0.12042999267578125, 0.1273193359375, 0.13420867919921875, 0.1410980224609375, 0.14798736572265625, 0.154876708984375, 0.16176605224609375, 0.1686553955078125, 0.17554473876953125, 0.18243408203125, 0.18932342529296875, 0.1962127685546875, 0.20310211181640625, 0.209991455078125, 0.21688079833984375, 0.2237701416015625, 0.23065948486328125, 0.237548828125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 11.0, 2.0, 7.0, 9.0, 15.0, 14.0, 19.0, 21.0, 24.0, 24.0, 22.0, 34.0, 36.0, 40.0, 45.0, 46.0, 33.0, 43.0, 41.0, 45.0, 29.0, 33.0, 42.0, 39.0, 35.0, 45.0, 29.0, 32.0, 29.0, 31.0, 16.0, 18.0, 14.0, 13.0, 14.0, 11.0, 9.0, 6.0, 7.0, 2.0, 8.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1337890625, -0.12989521026611328, -0.12600135803222656, -0.12210750579833984, -0.11821365356445312, -0.1143198013305664, -0.11042594909667969, -0.10653209686279297, -0.10263824462890625, -0.09874439239501953, -0.09485054016113281, -0.0909566879272461, -0.08706283569335938, -0.08316898345947266, -0.07927513122558594, -0.07538127899169922, -0.0714874267578125, -0.06759357452392578, -0.06369972229003906, -0.059805870056152344, -0.055912017822265625, -0.052018165588378906, -0.04812431335449219, -0.04423046112060547, -0.04033660888671875, -0.03644275665283203, -0.03254890441894531, -0.028655052185058594, -0.024761199951171875, -0.020867347717285156, -0.016973495483398438, -0.013079643249511719, -0.009185791015625, -0.005291938781738281, -0.0013980865478515625, 0.0024957656860351562, 0.006389617919921875, 0.010283470153808594, 0.014177322387695312, 0.01807117462158203, 0.02196502685546875, 0.02585887908935547, 0.029752731323242188, 0.033646583557128906, 0.037540435791015625, 0.041434288024902344, 0.04532814025878906, 0.04922199249267578, 0.0531158447265625, 0.05700969696044922, 0.06090354919433594, 0.06479740142822266, 0.06869125366210938, 0.0725851058959961, 0.07647895812988281, 0.08037281036376953, 0.08426666259765625, 0.08816051483154297, 0.09205436706542969, 0.0959482192993164, 0.09984207153320312, 0.10373592376708984, 0.10762977600097656, 0.11152362823486328, 0.11541748046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 9.0, 8.0, 14.0, 13.0, 24.0, 45.0, 87.0, 134.0, 286.0, 733.0, 1673.0, 4525.0, 12148.0, 35315.0, 112679.0, 327141.0, 358939.0, 131642.0, 40719.0, 13902.0, 4989.0, 1993.0, 760.0, 376.0, 174.0, 96.0, 44.0, 23.0, 21.0, 10.0, 8.0, 8.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.440673828125, -0.4277381896972656, -0.41480255126953125, -0.4018669128417969, -0.3889312744140625, -0.3759956359863281, -0.36305999755859375, -0.3501243591308594, -0.337188720703125, -0.3242530822753906, -0.31131744384765625, -0.2983818054199219, -0.2854461669921875, -0.2725105285644531, -0.25957489013671875, -0.24663925170898438, -0.23370361328125, -0.22076797485351562, -0.20783233642578125, -0.19489669799804688, -0.1819610595703125, -0.16902542114257812, -0.15608978271484375, -0.14315414428710938, -0.130218505859375, -0.11728286743164062, -0.10434722900390625, -0.09141159057617188, -0.0784759521484375, -0.06554031372070312, -0.05260467529296875, -0.039669036865234375, -0.0267333984375, -0.013797760009765625, -0.00086212158203125, 0.012073516845703125, 0.0250091552734375, 0.037944793701171875, 0.05088043212890625, 0.06381607055664062, 0.076751708984375, 0.08968734741210938, 0.10262298583984375, 0.11555862426757812, 0.1284942626953125, 0.14142990112304688, 0.15436553955078125, 0.16730117797851562, 0.18023681640625, 0.19317245483398438, 0.20610809326171875, 0.21904373168945312, 0.2319793701171875, 0.24491500854492188, 0.25785064697265625, 0.2707862854003906, 0.283721923828125, 0.2966575622558594, 0.30959320068359375, 0.3225288391113281, 0.3354644775390625, 0.3484001159667969, 0.36133575439453125, 0.3742713928222656, 0.38720703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 4.0, 2.0, 6.0, 5.0, 9.0, 9.0, 3.0, 11.0, 15.0, 15.0, 20.0, 18.0, 20.0, 23.0, 34.0, 19.0, 27.0, 43.0, 38.0, 48.0, 43.0, 49.0, 51.0, 48.0, 39.0, 50.0, 45.0, 34.0, 35.0, 32.0, 35.0, 29.0, 19.0, 17.0, 27.0, 12.0, 16.0, 15.0, 7.0, 9.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34423828125, -0.3328399658203125, -0.321441650390625, -0.3100433349609375, -0.29864501953125, -0.2872467041015625, -0.275848388671875, -0.2644500732421875, -0.2530517578125, -0.2416534423828125, -0.230255126953125, -0.2188568115234375, -0.20745849609375, -0.1960601806640625, -0.184661865234375, -0.1732635498046875, -0.161865234375, -0.1504669189453125, -0.139068603515625, -0.1276702880859375, -0.11627197265625, -0.1048736572265625, -0.093475341796875, -0.0820770263671875, -0.0706787109375, -0.0592803955078125, -0.047882080078125, -0.0364837646484375, -0.02508544921875, -0.0136871337890625, -0.002288818359375, 0.0091094970703125, 0.0205078125, 0.0319061279296875, 0.043304443359375, 0.0547027587890625, 0.06610107421875, 0.0774993896484375, 0.088897705078125, 0.1002960205078125, 0.1116943359375, 0.1230926513671875, 0.134490966796875, 0.1458892822265625, 0.15728759765625, 0.1686859130859375, 0.180084228515625, 0.1914825439453125, 0.202880859375, 0.2142791748046875, 0.225677490234375, 0.2370758056640625, 0.24847412109375, 0.2598724365234375, 0.271270751953125, 0.2826690673828125, 0.2940673828125, 0.3054656982421875, 0.316864013671875, 0.3282623291015625, 0.33966064453125, 0.3510589599609375, 0.362457275390625, 0.3738555908203125, 0.38525390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 5.0, 9.0, 13.0, 26.0, 35.0, 54.0, 90.0, 142.0, 216.0, 310.0, 483.0, 829.0, 1472.0, 2243.0, 3685.0, 6193.0, 10381.0, 17923.0, 31378.0, 56440.0, 106726.0, 191825.0, 238692.0, 171339.0, 92036.0, 49212.0, 27235.0, 16021.0, 9333.0, 5612.0, 3272.0, 2087.0, 1250.0, 751.0, 458.0, 297.0, 160.0, 119.0, 67.0, 40.0, 29.0, 27.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.09442138671875, -0.09175300598144531, -0.08908462524414062, -0.08641624450683594, -0.08374786376953125, -0.08107948303222656, -0.07841110229492188, -0.07574272155761719, -0.0730743408203125, -0.07040596008300781, -0.06773757934570312, -0.06506919860839844, -0.06240081787109375, -0.05973243713378906, -0.057064056396484375, -0.05439567565917969, -0.051727294921875, -0.04905891418457031, -0.046390533447265625, -0.04372215270996094, -0.04105377197265625, -0.03838539123535156, -0.035717010498046875, -0.03304862976074219, -0.0303802490234375, -0.027711868286132812, -0.025043487548828125, -0.022375106811523438, -0.01970672607421875, -0.017038345336914062, -0.014369964599609375, -0.011701583862304688, -0.009033203125, -0.0063648223876953125, -0.003696441650390625, -0.0010280609130859375, 0.00164031982421875, 0.0043087005615234375, 0.006977081298828125, 0.009645462036132812, 0.0123138427734375, 0.014982223510742188, 0.017650604248046875, 0.020318984985351562, 0.02298736572265625, 0.025655746459960938, 0.028324127197265625, 0.030992507934570312, 0.033660888671875, 0.03632926940917969, 0.038997650146484375, 0.04166603088378906, 0.04433441162109375, 0.04700279235839844, 0.049671173095703125, 0.05233955383300781, 0.0550079345703125, 0.05767631530761719, 0.060344696044921875, 0.06301307678222656, 0.06568145751953125, 0.06834983825683594, 0.07101821899414062, 0.07368659973144531, 0.07635498046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 8.0, 3.0, 13.0, 18.0, 19.0, 23.0, 18.0, 51.0, 47.0, 107.0, 141.0, 128.0, 128.0, 87.0, 58.0, 39.0, 24.0, 20.0, 18.0, 5.0, 8.0, 6.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.844499588012695e-05, -3.7173740565776825e-05, -3.59024852514267e-05, -3.463122993707657e-05, -3.335997462272644e-05, -3.208871930837631e-05, -3.0817463994026184e-05, -2.9546208679676056e-05, -2.8274953365325928e-05, -2.70036980509758e-05, -2.573244273662567e-05, -2.4461187422275543e-05, -2.3189932107925415e-05, -2.1918676793575287e-05, -2.064742147922516e-05, -1.937616616487503e-05, -1.8104910850524902e-05, -1.6833655536174774e-05, -1.5562400221824646e-05, -1.4291144907474518e-05, -1.301988959312439e-05, -1.1748634278774261e-05, -1.0477378964424133e-05, -9.206123650074005e-06, -7.934868335723877e-06, -6.663613021373749e-06, -5.392357707023621e-06, -4.1211023926734924e-06, -2.8498470783233643e-06, -1.578591763973236e-06, -3.073364496231079e-07, 9.639188647270203e-07, 2.2351741790771484e-06, 3.5064294934272766e-06, 4.777684807777405e-06, 6.048940122127533e-06, 7.320195436477661e-06, 8.59145075082779e-06, 9.862706065177917e-06, 1.1133961379528046e-05, 1.2405216693878174e-05, 1.3676472008228302e-05, 1.494772732257843e-05, 1.621898263692856e-05, 1.7490237951278687e-05, 1.8761493265628815e-05, 2.0032748579978943e-05, 2.130400389432907e-05, 2.25752592086792e-05, 2.3846514523029327e-05, 2.5117769837379456e-05, 2.6389025151729584e-05, 2.7660280466079712e-05, 2.893153578042984e-05, 3.0202791094779968e-05, 3.1474046409130096e-05, 3.2745301723480225e-05, 3.401655703783035e-05, 3.528781235218048e-05, 3.655906766653061e-05, 3.783032298088074e-05, 3.9101578295230865e-05, 4.0372833609580994e-05, 4.164408892393112e-05, 4.291534423828125e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 19.0, 35.0, 37.0, 53.0, 87.0, 143.0, 227.0, 464.0, 864.0, 1541.0, 2781.0, 5311.0, 9919.0, 18962.0, 36785.0, 71241.0, 144194.0, 250525.0, 238875.0, 131428.0, 64847.0, 33358.0, 17199.0, 9012.0, 4877.0, 2578.0, 1345.0, 761.0, 474.0, 240.0, 143.0, 80.0, 43.0, 36.0, 25.0, 11.0, 8.0, 5.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07943153381347656, -0.07658767700195312, -0.07374382019042969, -0.07089996337890625, -0.06805610656738281, -0.06521224975585938, -0.06236839294433594, -0.0595245361328125, -0.05668067932128906, -0.053836822509765625, -0.05099296569824219, -0.04814910888671875, -0.04530525207519531, -0.042461395263671875, -0.03961753845214844, -0.036773681640625, -0.03392982482910156, -0.031085968017578125, -0.028242111206054688, -0.02539825439453125, -0.022554397583007812, -0.019710540771484375, -0.016866683959960938, -0.0140228271484375, -0.011178970336914062, -0.008335113525390625, -0.0054912567138671875, -0.00264739990234375, 0.0001964569091796875, 0.003040313720703125, 0.0058841705322265625, 0.00872802734375, 0.011571884155273438, 0.014415740966796875, 0.017259597778320312, 0.02010345458984375, 0.022947311401367188, 0.025791168212890625, 0.028635025024414062, 0.0314788818359375, 0.03432273864746094, 0.037166595458984375, 0.04001045227050781, 0.04285430908203125, 0.04569816589355469, 0.048542022705078125, 0.05138587951660156, 0.054229736328125, 0.05707359313964844, 0.059917449951171875, 0.06276130676269531, 0.06560516357421875, 0.06844902038574219, 0.07129287719726562, 0.07413673400878906, 0.0769805908203125, 0.07982444763183594, 0.08266830444335938, 0.08551216125488281, 0.08835601806640625, 0.09119987487792969, 0.09404373168945312, 0.09688758850097656, 0.0997314453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 10.0, 5.0, 11.0, 12.0, 23.0, 19.0, 23.0, 33.0, 43.0, 56.0, 64.0, 66.0, 84.0, 70.0, 83.0, 64.0, 57.0, 52.0, 43.0, 39.0, 22.0, 27.0, 21.0, 23.0, 12.0, 7.0, 10.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13096141815185547, -0.12727928161621094, -0.1235971450805664, -0.11991500854492188, -0.11623287200927734, -0.11255073547363281, -0.10886859893798828, -0.10518646240234375, -0.10150432586669922, -0.09782218933105469, -0.09414005279541016, -0.09045791625976562, -0.0867757797241211, -0.08309364318847656, -0.07941150665283203, -0.0757293701171875, -0.07204723358154297, -0.06836509704589844, -0.0646829605102539, -0.061000823974609375, -0.057318687438964844, -0.05363655090332031, -0.04995441436767578, -0.04627227783203125, -0.04259014129638672, -0.03890800476074219, -0.035225868225097656, -0.031543731689453125, -0.027861595153808594, -0.024179458618164062, -0.02049732208251953, -0.016815185546875, -0.013133049011230469, -0.009450912475585938, -0.005768775939941406, -0.002086639404296875, 0.0015954971313476562, 0.0052776336669921875, 0.008959770202636719, 0.01264190673828125, 0.01632404327392578, 0.020006179809570312, 0.023688316345214844, 0.027370452880859375, 0.031052589416503906, 0.03473472595214844, 0.03841686248779297, 0.0420989990234375, 0.04578113555908203, 0.04946327209472656, 0.053145408630371094, 0.056827545166015625, 0.060509681701660156, 0.06419181823730469, 0.06787395477294922, 0.07155609130859375, 0.07523822784423828, 0.07892036437988281, 0.08260250091552734, 0.08628463745117188, 0.0899667739868164, 0.09364891052246094, 0.09733104705810547, 0.10101318359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 11.0, 23.0, 33.0, 62.0, 77.0, 142.0, 135.0, 128.0, 125.0, 115.0, 69.0, 35.0, 26.0, 15.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.926974296569824, -2.866107940673828, -2.805241346359253, -2.744374990463257, -2.6835083961486816, -2.6226420402526855, -2.5617756843566895, -2.5009090900421143, -2.440042734146118, -2.379176378250122, -2.318309783935547, -2.257443428039551, -2.1965768337249756, -2.1357104778289795, -2.0748441219329834, -2.013977527618408, -1.953111171722412, -1.8922446966171265, -1.8313782215118408, -1.7705118656158447, -1.709645390510559, -1.6487789154052734, -1.5879124402999878, -1.5270459651947021, -1.4661794900894165, -1.4053130149841309, -1.3444465398788452, -1.2835801839828491, -1.2227137088775635, -1.1618472337722778, -1.1009807586669922, -1.040114402770996, -0.9792479276657104, -0.9183814525604248, -0.8575150370597839, -0.7966485619544983, -0.7357821464538574, -0.6749156713485718, -0.6140491962432861, -0.5531827807426453, -0.492316335439682, -0.43144989013671875, -0.3705834448337555, -0.30971699953079224, -0.24885053932666779, -0.18798407912254333, -0.12711763381958008, -0.06625118851661682, -0.0053847432136535645, 0.05548170581459999, 0.11634815484285355, 0.1772146075963974, 0.23808105289936066, 0.2989475131034851, 0.35981395840644836, 0.4206804037094116, 0.4815468490123749, 0.5424132943153381, 0.6032797694206238, 0.6641461849212646, 0.7250126600265503, 0.7858791351318359, 0.8467455506324768, 0.9076119661331177, 0.9684784412384033]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 5.0, 13.0, 6.0, 17.0, 9.0, 23.0, 21.0, 25.0, 30.0, 29.0, 32.0, 38.0, 35.0, 33.0, 35.0, 50.0, 41.0, 40.0, 29.0, 34.0, 40.0, 30.0, 34.0, 41.0, 34.0, 34.0, 18.0, 20.0, 21.0, 27.0, 24.0, 24.0, 12.0, 6.0, 10.0, 9.0, 7.0, 10.0, 2.0, 4.0, 9.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.881180465221405, -0.8543571829795837, -0.8275339007377625, -0.8007106781005859, -0.7738873958587646, -0.7470641136169434, -0.7202408313751221, -0.6934175491333008, -0.6665942668914795, -0.6397709846496582, -0.6129477024078369, -0.5861244201660156, -0.5593011975288391, -0.5324779152870178, -0.5056546330451965, -0.47883135080337524, -0.45200809836387634, -0.42518481612205505, -0.39836156368255615, -0.37153828144073486, -0.3447149991989136, -0.3178917169570923, -0.2910684645175934, -0.2642451822757721, -0.237421914935112, -0.2105986475944519, -0.18377536535263062, -0.15695209801197052, -0.13012883067131042, -0.10330554842948914, -0.07648228108882904, -0.04965899884700775, -0.022835731506347656, 0.003987541422247887, 0.03081081435084343, 0.05763408541679382, 0.08445736020803452, 0.11128063499927521, 0.1381039023399353, 0.1649271845817566, 0.1917504519224167, 0.21857371926307678, 0.24539700150489807, 0.272220253944397, 0.29904353618621826, 0.32586681842803955, 0.35269010066986084, 0.37951338291168213, 0.40633663535118103, 0.4331599175930023, 0.4599831700325012, 0.4868064522743225, 0.5136297345161438, 0.5404530167579651, 0.5672762393951416, 0.5940995216369629, 0.6209228038787842, 0.6477460861206055, 0.6745693683624268, 0.701392650604248, 0.7282158732414246, 0.7550391554832458, 0.7818624377250671, 0.8086857199668884, 0.8355090022087097]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 3.0, 5.0, 9.0, 11.0, 15.0, 14.0, 23.0, 28.0, 42.0, 61.0, 76.0, 152.0, 311.0, 737.0, 2023.0, 6184.0, 22392.0, 106464.0, 935907.0, 2784641.0, 272778.0, 46054.0, 10928.0, 3241.0, 1094.0, 476.0, 229.0, 131.0, 58.0, 44.0, 39.0, 25.0, 15.0, 17.0, 7.0, 9.0, 7.0, 5.0, 7.0, 5.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387451171875, -0.37613677978515625, -0.3648223876953125, -0.35350799560546875, -0.342193603515625, -0.33087921142578125, -0.3195648193359375, -0.30825042724609375, -0.29693603515625, -0.28562164306640625, -0.2743072509765625, -0.26299285888671875, -0.251678466796875, -0.24036407470703125, -0.2290496826171875, -0.21773529052734375, -0.2064208984375, -0.19510650634765625, -0.1837921142578125, -0.17247772216796875, -0.161163330078125, -0.14984893798828125, -0.1385345458984375, -0.12722015380859375, -0.11590576171875, -0.10459136962890625, -0.0932769775390625, -0.08196258544921875, -0.070648193359375, -0.05933380126953125, -0.0480194091796875, -0.03670501708984375, -0.025390625, -0.01407623291015625, -0.0027618408203125, 0.00855255126953125, 0.019866943359375, 0.03118133544921875, 0.0424957275390625, 0.05381011962890625, 0.06512451171875, 0.07643890380859375, 0.0877532958984375, 0.09906768798828125, 0.110382080078125, 0.12169647216796875, 0.1330108642578125, 0.14432525634765625, 0.1556396484375, 0.16695404052734375, 0.1782684326171875, 0.18958282470703125, 0.200897216796875, 0.21221160888671875, 0.2235260009765625, 0.23484039306640625, 0.24615478515625, 0.25746917724609375, 0.2687835693359375, 0.28009796142578125, 0.291412353515625, 0.30272674560546875, 0.3140411376953125, 0.32535552978515625, 0.336669921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 2.0, 7.0, 14.0, 7.0, 11.0, 17.0, 11.0, 24.0, 18.0, 17.0, 17.0, 27.0, 28.0, 27.0, 44.0, 48.0, 36.0, 48.0, 48.0, 42.0, 44.0, 33.0, 45.0, 38.0, 38.0, 31.0, 41.0, 24.0, 30.0, 35.0, 24.0, 17.0, 18.0, 21.0, 15.0, 14.0, 5.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13054847717285156, -0.12620925903320312, -0.12187004089355469, -0.11753082275390625, -0.11319160461425781, -0.10885238647460938, -0.10451316833496094, -0.1001739501953125, -0.09583473205566406, -0.09149551391601562, -0.08715629577636719, -0.08281707763671875, -0.07847785949707031, -0.07413864135742188, -0.06979942321777344, -0.065460205078125, -0.06112098693847656, -0.056781768798828125, -0.05244255065917969, -0.04810333251953125, -0.04376411437988281, -0.039424896240234375, -0.03508567810058594, -0.0307464599609375, -0.026407241821289062, -0.022068023681640625, -0.017728805541992188, -0.01338958740234375, -0.009050369262695312, -0.004711151123046875, -0.0003719329833984375, 0.00396728515625, 0.008306503295898438, 0.012645721435546875, 0.016984939575195312, 0.02132415771484375, 0.025663375854492188, 0.030002593994140625, 0.03434181213378906, 0.0386810302734375, 0.04302024841308594, 0.047359466552734375, 0.05169868469238281, 0.05603790283203125, 0.06037712097167969, 0.06471633911132812, 0.06905555725097656, 0.073394775390625, 0.07773399353027344, 0.08207321166992188, 0.08641242980957031, 0.09075164794921875, 0.09509086608886719, 0.09943008422851562, 0.10376930236816406, 0.1081085205078125, 0.11244773864746094, 0.11678695678710938, 0.12112617492675781, 0.12546539306640625, 0.1298046112060547, 0.13414382934570312, 0.13848304748535156, 0.142822265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 13.0, 12.0, 22.0, 21.0, 47.0, 55.0, 70.0, 116.0, 191.0, 250.0, 416.0, 676.0, 975.0, 1599.0, 2607.0, 4595.0, 7905.0, 14409.0, 27233.0, 53242.0, 109197.0, 237226.0, 563808.0, 1390865.0, 1027510.0, 403117.0, 174828.0, 83065.0, 41204.0, 21364.0, 11515.0, 6351.0, 3834.0, 2185.0, 1302.0, 877.0, 498.0, 364.0, 235.0, 161.0, 90.0, 64.0, 46.0, 38.0, 29.0, 15.0, 12.0, 10.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.1871337890625, -0.18143081665039062, -0.17572784423828125, -0.17002487182617188, -0.1643218994140625, -0.15861892700195312, -0.15291595458984375, -0.14721298217773438, -0.141510009765625, -0.13580703735351562, -0.13010406494140625, -0.12440109252929688, -0.1186981201171875, -0.11299514770507812, -0.10729217529296875, -0.10158920288085938, -0.09588623046875, -0.09018325805664062, -0.08448028564453125, -0.07877731323242188, -0.0730743408203125, -0.06737136840820312, -0.06166839599609375, -0.055965423583984375, -0.050262451171875, -0.044559478759765625, -0.03885650634765625, -0.033153533935546875, -0.0274505615234375, -0.021747589111328125, -0.01604461669921875, -0.010341644287109375, -0.004638671875, 0.001064300537109375, 0.00676727294921875, 0.012470245361328125, 0.0181732177734375, 0.023876190185546875, 0.02957916259765625, 0.035282135009765625, 0.040985107421875, 0.046688079833984375, 0.05239105224609375, 0.058094024658203125, 0.0637969970703125, 0.06949996948242188, 0.07520294189453125, 0.08090591430664062, 0.08660888671875, 0.09231185913085938, 0.09801483154296875, 0.10371780395507812, 0.1094207763671875, 0.11512374877929688, 0.12082672119140625, 0.12652969360351562, 0.132232666015625, 0.13793563842773438, 0.14363861083984375, 0.14934158325195312, 0.1550445556640625, 0.16074752807617188, 0.16645050048828125, 0.17215347290039062, 0.1778564453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 11.0, 16.0, 13.0, 14.0, 26.0, 42.0, 46.0, 58.0, 84.0, 94.0, 150.0, 197.0, 267.0, 373.0, 510.0, 560.0, 452.0, 288.0, 219.0, 168.0, 139.0, 87.0, 60.0, 45.0, 38.0, 29.0, 22.0, 13.0, 8.0, 11.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2164306640625, -0.20927047729492188, -0.20211029052734375, -0.19495010375976562, -0.1877899169921875, -0.18062973022460938, -0.17346954345703125, -0.16630935668945312, -0.159149169921875, -0.15198898315429688, -0.14482879638671875, -0.13766860961914062, -0.1305084228515625, -0.12334823608398438, -0.11618804931640625, -0.10902786254882812, -0.10186767578125, -0.09470748901367188, -0.08754730224609375, -0.08038711547851562, -0.0732269287109375, -0.06606674194335938, -0.05890655517578125, -0.051746368408203125, -0.044586181640625, -0.037425994873046875, -0.03026580810546875, -0.023105621337890625, -0.0159454345703125, -0.008785247802734375, -0.00162506103515625, 0.005535125732421875, 0.0126953125, 0.019855499267578125, 0.02701568603515625, 0.034175872802734375, 0.0413360595703125, 0.048496246337890625, 0.05565643310546875, 0.06281661987304688, 0.069976806640625, 0.07713699340820312, 0.08429718017578125, 0.09145736694335938, 0.0986175537109375, 0.10577774047851562, 0.11293792724609375, 0.12009811401367188, 0.12725830078125, 0.13441848754882812, 0.14157867431640625, 0.14873886108398438, 0.1558990478515625, 0.16305923461914062, 0.17021942138671875, 0.17737960815429688, 0.184539794921875, 0.19169998168945312, 0.19886016845703125, 0.20602035522460938, 0.2131805419921875, 0.22034072875976562, 0.22750091552734375, 0.23466110229492188, 0.2418212890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 12.0, 15.0, 21.0, 36.0, 46.0, 72.0, 84.0, 85.0, 101.0, 102.0, 89.0, 90.0, 74.0, 65.0, 42.0, 25.0, 9.0, 12.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8949137926101685, -0.855153501033783, -0.8153932094573975, -0.775632917881012, -0.7358726263046265, -0.6961122751235962, -0.6563519835472107, -0.6165916919708252, -0.5768314003944397, -0.5370711088180542, -0.4973108172416687, -0.4575504958629608, -0.4177902042865753, -0.3780299127101898, -0.33826959133148193, -0.29850929975509644, -0.25874900817871094, -0.21898871660232544, -0.17922841012477875, -0.13946810364723206, -0.09970781207084656, -0.05994752049446106, -0.020187214016914368, 0.019573092460632324, 0.05933338403701782, 0.09909368306398392, 0.13885398209095, 0.1786142885684967, 0.2183745801448822, 0.2581348717212677, 0.2978951930999756, 0.3376554846763611, 0.37741589546203613, 0.41717618703842163, 0.45693647861480713, 0.496696799993515, 0.5364570617675781, 0.5762174129486084, 0.6159777045249939, 0.6557379961013794, 0.6954982876777649, 0.7352585792541504, 0.7750188708305359, 0.8147791624069214, 0.8545395135879517, 0.8942997455596924, 0.9340600967407227, 0.9738203883171082, 1.0135806798934937, 1.053341031074524, 1.0931012630462646, 1.132861614227295, 1.1726218461990356, 1.212382197380066, 1.2521424293518066, 1.291902780532837, 1.3316631317138672, 1.3714234828948975, 1.4111837148666382, 1.4509440660476685, 1.4907042980194092, 1.5304646492004395, 1.5702248811721802, 1.6099852323532104, 1.6497454643249512]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 6.0, 8.0, 12.0, 16.0, 21.0, 19.0, 20.0, 25.0, 32.0, 31.0, 32.0, 35.0, 36.0, 44.0, 42.0, 43.0, 43.0, 42.0, 43.0, 47.0, 31.0, 33.0, 32.0, 31.0, 24.0, 25.0, 27.0, 22.0, 25.0, 19.0, 22.0, 23.0, 9.0, 13.0, 11.0, 5.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6329967975616455, -0.611678421497345, -0.5903599858283997, -0.5690416097640991, -0.5477231740951538, -0.5264047980308533, -0.5050864219665527, -0.4837680160999298, -0.4624496102333069, -0.44113120436668396, -0.41981279850006104, -0.3984944224357605, -0.3771760165691376, -0.35585761070251465, -0.3345392346382141, -0.3132208287715912, -0.29190242290496826, -0.27058401703834534, -0.2492656260728836, -0.22794723510742188, -0.20662882924079895, -0.18531042337417603, -0.1639920324087143, -0.14267364144325256, -0.12135523557662964, -0.10003683716058731, -0.07871843874454498, -0.057400040328502655, -0.03608164191246033, -0.014763243496418, 0.006555154919624329, 0.02787354588508606, 0.049191951751708984, 0.07051035016775131, 0.09182874858379364, 0.11314714699983597, 0.1344655454158783, 0.15578395128250122, 0.17710234224796295, 0.19842073321342468, 0.2197391390800476, 0.24105754494667053, 0.26237595081329346, 0.283694326877594, 0.3050127327442169, 0.32633113861083984, 0.3476495146751404, 0.3689679205417633, 0.39028632640838623, 0.41160473227500916, 0.4329231381416321, 0.4542415142059326, 0.47555992007255554, 0.49687832593917847, 0.518196702003479, 0.5395151376724243, 0.5608335137367249, 0.5821518898010254, 0.6034703254699707, 0.6247887015342712, 0.6461070775985718, 0.6674255132675171, 0.6887438893318176, 0.7100622653961182, 0.7313807010650635]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 6.0, 13.0, 16.0, 25.0, 41.0, 49.0, 79.0, 122.0, 182.0, 284.0, 463.0, 734.0, 1107.0, 1635.0, 2507.0, 3801.0, 5566.0, 8252.0, 12471.0, 18450.0, 28499.0, 45530.0, 75977.0, 135714.0, 208310.0, 194694.0, 119256.0, 67601.0, 40486.0, 25695.0, 16801.0, 11311.0, 7659.0, 5146.0, 3373.0, 2336.0, 1509.0, 985.0, 672.0, 454.0, 279.0, 158.0, 102.0, 83.0, 47.0, 30.0, 22.0, 6.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14501953125, -0.13962554931640625, -0.1342315673828125, -0.12883758544921875, -0.123443603515625, -0.11804962158203125, -0.1126556396484375, -0.10726165771484375, -0.10186767578125, -0.09647369384765625, -0.0910797119140625, -0.08568572998046875, -0.080291748046875, -0.07489776611328125, -0.0695037841796875, -0.06410980224609375, -0.0587158203125, -0.05332183837890625, -0.0479278564453125, -0.04253387451171875, -0.037139892578125, -0.03174591064453125, -0.0263519287109375, -0.02095794677734375, -0.01556396484375, -0.01016998291015625, -0.0047760009765625, 0.00061798095703125, 0.006011962890625, 0.01140594482421875, 0.0167999267578125, 0.02219390869140625, 0.027587890625, 0.03298187255859375, 0.0383758544921875, 0.04376983642578125, 0.049163818359375, 0.05455780029296875, 0.0599517822265625, 0.06534576416015625, 0.07073974609375, 0.07613372802734375, 0.0815277099609375, 0.08692169189453125, 0.092315673828125, 0.09770965576171875, 0.1031036376953125, 0.10849761962890625, 0.1138916015625, 0.11928558349609375, 0.1246795654296875, 0.13007354736328125, 0.135467529296875, 0.14086151123046875, 0.1462554931640625, 0.15164947509765625, 0.15704345703125, 0.16243743896484375, 0.1678314208984375, 0.17322540283203125, 0.178619384765625, 0.18401336669921875, 0.1894073486328125, 0.19480133056640625, 0.2001953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 9.0, 7.0, 10.0, 10.0, 19.0, 14.0, 13.0, 20.0, 20.0, 29.0, 35.0, 32.0, 33.0, 34.0, 36.0, 33.0, 41.0, 41.0, 40.0, 30.0, 38.0, 41.0, 38.0, 36.0, 37.0, 30.0, 32.0, 39.0, 29.0, 24.0, 22.0, 22.0, 16.0, 15.0, 11.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.138427734375, -0.1342334747314453, -0.13003921508789062, -0.12584495544433594, -0.12165069580078125, -0.11745643615722656, -0.11326217651367188, -0.10906791687011719, -0.1048736572265625, -0.10067939758300781, -0.09648513793945312, -0.09229087829589844, -0.08809661865234375, -0.08390235900878906, -0.07970809936523438, -0.07551383972167969, -0.071319580078125, -0.06712532043457031, -0.06293106079101562, -0.05873680114746094, -0.05454254150390625, -0.05034828186035156, -0.046154022216796875, -0.04195976257324219, -0.0377655029296875, -0.03357124328613281, -0.029376983642578125, -0.025182723999023438, -0.02098846435546875, -0.016794204711914062, -0.012599945068359375, -0.008405685424804688, -0.00421142578125, -1.71661376953125e-05, 0.004177093505859375, 0.008371353149414062, 0.01256561279296875, 0.016759872436523438, 0.020954132080078125, 0.025148391723632812, 0.0293426513671875, 0.03353691101074219, 0.037731170654296875, 0.04192543029785156, 0.04611968994140625, 0.05031394958496094, 0.054508209228515625, 0.05870246887207031, 0.062896728515625, 0.06709098815917969, 0.07128524780273438, 0.07547950744628906, 0.07967376708984375, 0.08386802673339844, 0.08806228637695312, 0.09225654602050781, 0.0964508056640625, 0.10064506530761719, 0.10483932495117188, 0.10903358459472656, 0.11322784423828125, 0.11742210388183594, 0.12161636352539062, 0.1258106231689453, 0.1300048828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 9.0, 16.0, 28.0, 26.0, 25.0, 32.0, 50.0, 90.0, 198.0, 417.0, 1045.0, 2766.0, 7723.0, 21575.0, 64313.0, 245943.0, 486793.0, 149787.0, 43860.0, 14933.0, 5394.0, 1991.0, 751.0, 300.0, 146.0, 102.0, 59.0, 38.0, 40.0, 12.0, 20.0, 14.0, 6.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.476806640625, -0.4629173278808594, -0.44902801513671875, -0.4351387023925781, -0.4212493896484375, -0.4073600769042969, -0.39347076416015625, -0.3795814514160156, -0.365692138671875, -0.3518028259277344, -0.33791351318359375, -0.3240242004394531, -0.3101348876953125, -0.2962455749511719, -0.28235626220703125, -0.2684669494628906, -0.25457763671875, -0.24068832397460938, -0.22679901123046875, -0.21290969848632812, -0.1990203857421875, -0.18513107299804688, -0.17124176025390625, -0.15735244750976562, -0.143463134765625, -0.12957382202148438, -0.11568450927734375, -0.10179519653320312, -0.0879058837890625, -0.07401657104492188, -0.06012725830078125, -0.046237945556640625, -0.0323486328125, -0.018459320068359375, -0.00457000732421875, 0.009319305419921875, 0.0232086181640625, 0.037097930908203125, 0.05098724365234375, 0.06487655639648438, 0.078765869140625, 0.09265518188476562, 0.10654449462890625, 0.12043380737304688, 0.1343231201171875, 0.14821243286132812, 0.16210174560546875, 0.17599105834960938, 0.18988037109375, 0.20376968383789062, 0.21765899658203125, 0.23154830932617188, 0.2454376220703125, 0.2593269348144531, 0.27321624755859375, 0.2871055603027344, 0.300994873046875, 0.3148841857910156, 0.32877349853515625, 0.3426628112792969, 0.3565521240234375, 0.3704414367675781, 0.38433074951171875, 0.3982200622558594, 0.412109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 5.0, 10.0, 11.0, 14.0, 16.0, 15.0, 19.0, 28.0, 23.0, 27.0, 36.0, 52.0, 31.0, 30.0, 40.0, 36.0, 55.0, 45.0, 38.0, 58.0, 51.0, 40.0, 40.0, 31.0, 41.0, 20.0, 18.0, 33.0, 27.0, 25.0, 17.0, 19.0, 8.0, 3.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.410888671875, -0.3975257873535156, -0.38416290283203125, -0.3708000183105469, -0.3574371337890625, -0.3440742492675781, -0.33071136474609375, -0.3173484802246094, -0.303985595703125, -0.2906227111816406, -0.27725982666015625, -0.2638969421386719, -0.2505340576171875, -0.23717117309570312, -0.22380828857421875, -0.21044540405273438, -0.19708251953125, -0.18371963500976562, -0.17035675048828125, -0.15699386596679688, -0.1436309814453125, -0.13026809692382812, -0.11690521240234375, -0.10354232788085938, -0.090179443359375, -0.07681655883789062, -0.06345367431640625, -0.050090789794921875, -0.0367279052734375, -0.023365020751953125, -0.01000213623046875, 0.003360748291015625, 0.0167236328125, 0.030086517333984375, 0.04344940185546875, 0.056812286376953125, 0.0701751708984375, 0.08353805541992188, 0.09690093994140625, 0.11026382446289062, 0.123626708984375, 0.13698959350585938, 0.15035247802734375, 0.16371536254882812, 0.1770782470703125, 0.19044113159179688, 0.20380401611328125, 0.21716690063476562, 0.23052978515625, 0.24389266967773438, 0.25725555419921875, 0.2706184387207031, 0.2839813232421875, 0.2973442077636719, 0.31070709228515625, 0.3240699768066406, 0.337432861328125, 0.3507957458496094, 0.36415863037109375, 0.3775215148925781, 0.3908843994140625, 0.4042472839355469, 0.41761016845703125, 0.4309730529785156, 0.4443359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 16.0, 13.0, 22.0, 37.0, 56.0, 89.0, 135.0, 304.0, 625.0, 1579.0, 3663.0, 9130.0, 23353.0, 68147.0, 321756.0, 471300.0, 97705.0, 30477.0, 11796.0, 4747.0, 1969.0, 830.0, 364.0, 156.0, 95.0, 54.0, 27.0, 18.0, 22.0, 15.0, 13.0, 8.0, 2.0, 3.0, 9.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.1595287322998047, -0.15291976928710938, -0.14631080627441406, -0.13970184326171875, -0.13309288024902344, -0.12648391723632812, -0.11987495422363281, -0.1132659912109375, -0.10665702819824219, -0.10004806518554688, -0.09343910217285156, -0.08683013916015625, -0.08022117614746094, -0.07361221313476562, -0.06700325012207031, -0.060394287109375, -0.05378532409667969, -0.047176361083984375, -0.04056739807128906, -0.03395843505859375, -0.027349472045898438, -0.020740509033203125, -0.014131546020507812, -0.0075225830078125, -0.0009136199951171875, 0.005695343017578125, 0.012304306030273438, 0.01891326904296875, 0.025522232055664062, 0.032131195068359375, 0.03874015808105469, 0.04534912109375, 0.05195808410644531, 0.058567047119140625, 0.06517601013183594, 0.07178497314453125, 0.07839393615722656, 0.08500289916992188, 0.09161186218261719, 0.0982208251953125, 0.10482978820800781, 0.11143875122070312, 0.11804771423339844, 0.12465667724609375, 0.13126564025878906, 0.13787460327148438, 0.1444835662841797, 0.151092529296875, 0.1577014923095703, 0.16431045532226562, 0.17091941833496094, 0.17752838134765625, 0.18413734436035156, 0.19074630737304688, 0.1973552703857422, 0.2039642333984375, 0.2105731964111328, 0.21718215942382812, 0.22379112243652344, 0.23040008544921875, 0.23700904846191406, 0.24361801147460938, 0.2502269744873047, 0.2568359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 7.0, 9.0, 10.0, 10.0, 16.0, 11.0, 24.0, 35.0, 52.0, 63.0, 111.0, 107.0, 111.0, 97.0, 64.0, 50.0, 35.0, 25.0, 21.0, 23.0, 16.0, 9.0, 13.0, 8.0, 8.0, 9.0, 9.0, 3.0, 6.0, 6.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.331899642944336e-05, -3.236997872591019e-05, -3.1420961022377014e-05, -3.047194331884384e-05, -2.952292561531067e-05, -2.8573907911777496e-05, -2.7624890208244324e-05, -2.667587250471115e-05, -2.572685480117798e-05, -2.4777837097644806e-05, -2.3828819394111633e-05, -2.287980169057846e-05, -2.1930783987045288e-05, -2.0981766283512115e-05, -2.0032748579978943e-05, -1.908373087644577e-05, -1.8134713172912598e-05, -1.7185695469379425e-05, -1.6236677765846252e-05, -1.528766006231308e-05, -1.4338642358779907e-05, -1.3389624655246735e-05, -1.2440606951713562e-05, -1.149158924818039e-05, -1.0542571544647217e-05, -9.593553841114044e-06, -8.644536137580872e-06, -7.695518434047699e-06, -6.746500730514526e-06, -5.797483026981354e-06, -4.848465323448181e-06, -3.8994476199150085e-06, -2.950429916381836e-06, -2.0014122128486633e-06, -1.0523945093154907e-06, -1.0337680578231812e-07, 8.456408977508545e-07, 1.794658601284027e-06, 2.7436763048171997e-06, 3.6926940083503723e-06, 4.641711711883545e-06, 5.5907294154167175e-06, 6.53974711894989e-06, 7.488764822483063e-06, 8.437782526016235e-06, 9.386800229549408e-06, 1.033581793308258e-05, 1.1284835636615753e-05, 1.2233853340148926e-05, 1.3182871043682098e-05, 1.4131888747215271e-05, 1.5080906450748444e-05, 1.6029924154281616e-05, 1.697894185781479e-05, 1.792795956134796e-05, 1.8876977264881134e-05, 1.9825994968414307e-05, 2.077501267194748e-05, 2.1724030375480652e-05, 2.2673048079013824e-05, 2.3622065782546997e-05, 2.457108348608017e-05, 2.5520101189613342e-05, 2.6469118893146515e-05, 2.7418136596679688e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 10.0, 19.0, 20.0, 41.0, 49.0, 84.0, 137.0, 223.0, 447.0, 903.0, 1798.0, 3515.0, 7241.0, 14686.0, 31389.0, 73032.0, 208745.0, 403046.0, 182250.0, 65739.0, 28398.0, 13487.0, 6668.0, 3290.0, 1545.0, 794.0, 377.0, 249.0, 127.0, 69.0, 58.0, 26.0, 28.0, 15.0, 15.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.130126953125, -0.12598800659179688, -0.12184906005859375, -0.11771011352539062, -0.1135711669921875, -0.10943222045898438, -0.10529327392578125, -0.10115432739257812, -0.097015380859375, -0.09287643432617188, -0.08873748779296875, -0.08459854125976562, -0.0804595947265625, -0.07632064819335938, -0.07218170166015625, -0.06804275512695312, -0.06390380859375, -0.059764862060546875, -0.05562591552734375, -0.051486968994140625, -0.0473480224609375, -0.043209075927734375, -0.03907012939453125, -0.034931182861328125, -0.030792236328125, -0.026653289794921875, -0.02251434326171875, -0.018375396728515625, -0.0142364501953125, -0.010097503662109375, -0.00595855712890625, -0.001819610595703125, 0.0023193359375, 0.006458282470703125, 0.01059722900390625, 0.014736175537109375, 0.0188751220703125, 0.023014068603515625, 0.02715301513671875, 0.031291961669921875, 0.035430908203125, 0.039569854736328125, 0.04370880126953125, 0.047847747802734375, 0.0519866943359375, 0.056125640869140625, 0.06026458740234375, 0.06440353393554688, 0.06854248046875, 0.07268142700195312, 0.07682037353515625, 0.08095932006835938, 0.0850982666015625, 0.08923721313476562, 0.09337615966796875, 0.09751510620117188, 0.101654052734375, 0.10579299926757812, 0.10993194580078125, 0.11407089233398438, 0.1182098388671875, 0.12234878540039062, 0.12648773193359375, 0.13062667846679688, 0.134765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 17.0, 23.0, 17.0, 23.0, 41.0, 57.0, 83.0, 104.0, 100.0, 101.0, 85.0, 50.0, 55.0, 40.0, 40.0, 27.0, 13.0, 19.0, 4.0, 10.0, 7.0, 8.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.12311363220214844, -0.11854171752929688, -0.11396980285644531, -0.10939788818359375, -0.10482597351074219, -0.10025405883789062, -0.09568214416503906, -0.0911102294921875, -0.08653831481933594, -0.08196640014648438, -0.07739448547363281, -0.07282257080078125, -0.06825065612792969, -0.06367874145507812, -0.05910682678222656, -0.054534912109375, -0.04996299743652344, -0.045391082763671875, -0.04081916809082031, -0.03624725341796875, -0.03167533874511719, -0.027103424072265625, -0.022531509399414062, -0.0179595947265625, -0.013387680053710938, -0.008815765380859375, -0.0042438507080078125, 0.00032806396484375, 0.0048999786376953125, 0.009471893310546875, 0.014043807983398438, 0.01861572265625, 0.023187637329101562, 0.027759552001953125, 0.03233146667480469, 0.03690338134765625, 0.04147529602050781, 0.046047210693359375, 0.05061912536621094, 0.0551910400390625, 0.05976295471191406, 0.06433486938476562, 0.06890678405761719, 0.07347869873046875, 0.07805061340332031, 0.08262252807617188, 0.08719444274902344, 0.091766357421875, 0.09633827209472656, 0.10091018676757812, 0.10548210144042969, 0.11005401611328125, 0.11462593078613281, 0.11919784545898438, 0.12376976013183594, 0.1283416748046875, 0.13291358947753906, 0.13748550415039062, 0.1420574188232422, 0.14662933349609375, 0.1512012481689453, 0.15577316284179688, 0.16034507751464844, 0.1649169921875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 19.0, 88.0, 252.0, 388.0, 218.0, 42.0, 7.0, 5.0], "bins": [-10.677162170410156, -10.496923446655273, -10.31668472290039, -10.136446952819824, -9.956208229064941, -9.775969505310059, -9.595730781555176, -9.41549301147461, -9.235254287719727, -9.055015563964844, -8.874776840209961, -8.694539070129395, -8.514300346374512, -8.334061622619629, -8.153822898864746, -7.9735846519470215, -7.793346405029297, -7.613107681274414, -7.4328694343566895, -7.252630710601807, -7.072392463684082, -6.892153739929199, -6.711915493011475, -6.531676769256592, -6.351438045501709, -6.171199321746826, -5.990961074829102, -5.810722351074219, -5.630484104156494, -5.450245380401611, -5.270007133483887, -5.089768409729004, -4.909530162811279, -4.7292914390563965, -4.549053192138672, -4.368814468383789, -4.1885762214660645, -4.008337497711182, -3.828099250793457, -3.647860527038574, -3.4676222801208496, -3.287383794784546, -3.107145309448242, -2.9269068241119385, -2.7466683387756348, -2.566429853439331, -2.3861913681030273, -2.2059526443481445, -2.025714159011841, -1.845475673675537, -1.6652371883392334, -1.4849987030029297, -1.304760217666626, -1.1245217323303223, -0.944283127784729, -0.7640446424484253, -0.5838061571121216, -0.40356767177581787, -0.22332915663719177, -0.043090641498565674, 0.13714784383773804, 0.31738632917404175, 0.49762487411499023, 0.677863359451294, 0.8581018447875977]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 5.0, 5.0, 6.0, 6.0, 8.0, 10.0, 10.0, 11.0, 25.0, 16.0, 25.0, 25.0, 20.0, 20.0, 35.0, 25.0, 35.0, 31.0, 31.0, 43.0, 51.0, 40.0, 31.0, 34.0, 41.0, 32.0, 38.0, 41.0, 28.0, 23.0, 37.0, 31.0, 28.0, 23.0, 16.0, 17.0, 25.0, 11.0, 10.0, 7.0, 5.0, 6.0, 13.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.0680755376815796, -1.0359394550323486, -1.0038033723831177, -0.9716672897338867, -0.9395312070846558, -0.9073951244354248, -0.8752590417861938, -0.8431229591369629, -0.8109868764877319, -0.778850793838501, -0.74671471118927, -0.7145786285400391, -0.6824425458908081, -0.6503064632415771, -0.6181703805923462, -0.5860342979431152, -0.5538982152938843, -0.5217621326446533, -0.48962604999542236, -0.4574899673461914, -0.42535388469696045, -0.3932178020477295, -0.36108171939849854, -0.3289456367492676, -0.2968095541000366, -0.26467347145080566, -0.2325373888015747, -0.20040130615234375, -0.1682652235031128, -0.13612914085388184, -0.10399305820465088, -0.07185697555541992, -0.039720892906188965, -0.007584810256958008, 0.02455127239227295, 0.056687355041503906, 0.08882343769073486, 0.12095952033996582, 0.15309560298919678, 0.18523168563842773, 0.2173677682876587, 0.24950385093688965, 0.2816399335861206, 0.31377601623535156, 0.3459120988845825, 0.3780481815338135, 0.41018426418304443, 0.4423203468322754, 0.47445642948150635, 0.5065925121307373, 0.5387285947799683, 0.5708646774291992, 0.6030007600784302, 0.6351368427276611, 0.6672729253768921, 0.699409008026123, 0.731545090675354, 0.763681173324585, 0.7958172559738159, 0.8279533386230469, 0.8600894212722778, 0.8922255039215088, 0.9243615865707397, 0.9564976692199707, 0.9886337518692017]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 6.0, 12.0, 11.0, 27.0, 30.0, 49.0, 74.0, 105.0, 166.0, 259.0, 410.0, 768.0, 1364.0, 2461.0, 4798.0, 9701.0, 20369.0, 44611.0, 105211.0, 282715.0, 1025420.0, 1928431.0, 480171.0, 163398.0, 66321.0, 29625.0, 13885.0, 6481.0, 3268.0, 1790.0, 964.0, 491.0, 324.0, 192.0, 117.0, 77.0, 40.0, 35.0, 16.0, 13.0, 20.0, 7.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0], "bins": [-0.2047119140625, -0.19855117797851562, -0.19239044189453125, -0.18622970581054688, -0.1800689697265625, -0.17390823364257812, -0.16774749755859375, -0.16158676147460938, -0.155426025390625, -0.14926528930664062, -0.14310455322265625, -0.13694381713867188, -0.1307830810546875, -0.12462234497070312, -0.11846160888671875, -0.11230087280273438, -0.10614013671875, -0.09997940063476562, -0.09381866455078125, -0.08765792846679688, -0.0814971923828125, -0.07533645629882812, -0.06917572021484375, -0.06301498413085938, -0.056854248046875, -0.050693511962890625, -0.04453277587890625, -0.038372039794921875, -0.0322113037109375, -0.026050567626953125, -0.01988983154296875, -0.013729095458984375, -0.007568359375, -0.001407623291015625, 0.00475311279296875, 0.010913848876953125, 0.0170745849609375, 0.023235321044921875, 0.02939605712890625, 0.035556793212890625, 0.041717529296875, 0.047878265380859375, 0.05403900146484375, 0.060199737548828125, 0.0663604736328125, 0.07252120971679688, 0.07868194580078125, 0.08484268188476562, 0.09100341796875, 0.09716415405273438, 0.10332489013671875, 0.10948562622070312, 0.1156463623046875, 0.12180709838867188, 0.12796783447265625, 0.13412857055664062, 0.140289306640625, 0.14645004272460938, 0.15261077880859375, 0.15877151489257812, 0.1649322509765625, 0.17109298706054688, 0.17725372314453125, 0.18341445922851562, 0.1895751953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 12.0, 13.0, 14.0, 5.0, 17.0, 18.0, 21.0, 28.0, 21.0, 37.0, 41.0, 34.0, 34.0, 45.0, 52.0, 49.0, 60.0, 65.0, 54.0, 47.0, 46.0, 37.0, 33.0, 34.0, 24.0, 37.0, 28.0, 12.0, 13.0, 15.0, 14.0, 5.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.218017578125, -0.21233749389648438, -0.20665740966796875, -0.20097732543945312, -0.1952972412109375, -0.18961715698242188, -0.18393707275390625, -0.17825698852539062, -0.172576904296875, -0.16689682006835938, -0.16121673583984375, -0.15553665161132812, -0.1498565673828125, -0.14417648315429688, -0.13849639892578125, -0.13281631469726562, -0.12713623046875, -0.12145614624023438, -0.11577606201171875, -0.11009597778320312, -0.1044158935546875, -0.09873580932617188, -0.09305572509765625, -0.08737564086914062, -0.081695556640625, -0.07601547241210938, -0.07033538818359375, -0.06465530395507812, -0.0589752197265625, -0.053295135498046875, -0.04761505126953125, -0.041934967041015625, -0.0362548828125, -0.030574798583984375, -0.02489471435546875, -0.019214630126953125, -0.0135345458984375, -0.007854461669921875, -0.00217437744140625, 0.003505706787109375, 0.009185791015625, 0.014865875244140625, 0.02054595947265625, 0.026226043701171875, 0.0319061279296875, 0.037586212158203125, 0.04326629638671875, 0.048946380615234375, 0.05462646484375, 0.060306549072265625, 0.06598663330078125, 0.07166671752929688, 0.0773468017578125, 0.08302688598632812, 0.08870697021484375, 0.09438705444335938, 0.100067138671875, 0.10574722290039062, 0.11142730712890625, 0.11710739135742188, 0.1227874755859375, 0.12846755981445312, 0.13414764404296875, 0.13982772827148438, 0.1455078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 10.0, 13.0, 35.0, 36.0, 60.0, 82.0, 92.0, 148.0, 215.0, 301.0, 414.0, 653.0, 943.0, 1519.0, 2489.0, 4098.0, 7155.0, 13031.0, 24029.0, 47650.0, 99097.0, 214189.0, 518613.0, 1444833.0, 1086570.0, 392853.0, 169408.0, 79456.0, 39285.0, 20590.0, 10726.0, 6016.0, 3558.0, 2128.0, 1373.0, 831.0, 541.0, 388.0, 260.0, 156.0, 135.0, 80.0, 56.0, 44.0, 32.0, 27.0, 10.0, 12.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.2122802734375, -0.20561599731445312, -0.19895172119140625, -0.19228744506835938, -0.1856231689453125, -0.17895889282226562, -0.17229461669921875, -0.16563034057617188, -0.158966064453125, -0.15230178833007812, -0.14563751220703125, -0.13897323608398438, -0.1323089599609375, -0.12564468383789062, -0.11898040771484375, -0.11231613159179688, -0.10565185546875, -0.09898757934570312, -0.09232330322265625, -0.08565902709960938, -0.0789947509765625, -0.07233047485351562, -0.06566619873046875, -0.059001922607421875, -0.052337646484375, -0.045673370361328125, -0.03900909423828125, -0.032344818115234375, -0.0256805419921875, -0.019016265869140625, -0.01235198974609375, -0.005687713623046875, 0.0009765625, 0.007640838623046875, 0.01430511474609375, 0.020969390869140625, 0.0276336669921875, 0.034297943115234375, 0.04096221923828125, 0.047626495361328125, 0.054290771484375, 0.060955047607421875, 0.06761932373046875, 0.07428359985351562, 0.0809478759765625, 0.08761215209960938, 0.09427642822265625, 0.10094070434570312, 0.10760498046875, 0.11426925659179688, 0.12093353271484375, 0.12759780883789062, 0.1342620849609375, 0.14092636108398438, 0.14759063720703125, 0.15425491333007812, 0.160919189453125, 0.16758346557617188, 0.17424774169921875, 0.18091201782226562, 0.1875762939453125, 0.19424057006835938, 0.20090484619140625, 0.20756912231445312, 0.2142333984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 4.0, 9.0, 18.0, 14.0, 32.0, 39.0, 61.0, 97.0, 114.0, 167.0, 252.0, 408.0, 602.0, 768.0, 485.0, 361.0, 207.0, 135.0, 84.0, 68.0, 42.0, 29.0, 18.0, 12.0, 7.0, 13.0, 8.0, 1.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313232421875, -0.30353546142578125, -0.2938385009765625, -0.28414154052734375, -0.274444580078125, -0.26474761962890625, -0.2550506591796875, -0.24535369873046875, -0.23565673828125, -0.22595977783203125, -0.2162628173828125, -0.20656585693359375, -0.196868896484375, -0.18717193603515625, -0.1774749755859375, -0.16777801513671875, -0.1580810546875, -0.14838409423828125, -0.1386871337890625, -0.12899017333984375, -0.119293212890625, -0.10959625244140625, -0.0998992919921875, -0.09020233154296875, -0.08050537109375, -0.07080841064453125, -0.0611114501953125, -0.05141448974609375, -0.041717529296875, -0.03202056884765625, -0.0223236083984375, -0.01262664794921875, -0.0029296875, 0.00676727294921875, 0.0164642333984375, 0.02616119384765625, 0.035858154296875, 0.04555511474609375, 0.0552520751953125, 0.06494903564453125, 0.07464599609375, 0.08434295654296875, 0.0940399169921875, 0.10373687744140625, 0.113433837890625, 0.12313079833984375, 0.1328277587890625, 0.14252471923828125, 0.1522216796875, 0.16191864013671875, 0.1716156005859375, 0.18131256103515625, 0.191009521484375, 0.20070648193359375, 0.2104034423828125, 0.22010040283203125, 0.22979736328125, 0.23949432373046875, 0.2491912841796875, 0.25888824462890625, 0.268585205078125, 0.27828216552734375, 0.2879791259765625, 0.29767608642578125, 0.307373046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 6.0, 11.0, 24.0, 51.0, 87.0, 135.0, 171.0, 148.0, 160.0, 105.0, 58.0, 30.0, 16.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.773592472076416, -0.6987533569335938, -0.6239142417907715, -0.5490751266479492, -0.47423604130744934, -0.3993969261646271, -0.3245578408241272, -0.24971872568130493, -0.17487961053848267, -0.100040502846241, -0.02520139515399933, 0.04963770508766174, 0.12447682023048401, 0.19931593537330627, 0.27415502071380615, 0.3489941358566284, 0.4238332509994507, 0.49867236614227295, 0.5735114812850952, 0.6483505964279175, 0.7231897115707397, 0.798028826713562, 0.8728678822517395, 0.9477069973945618, 1.0225460529327393, 1.0973851680755615, 1.1722242832183838, 1.247063398361206, 1.3219025135040283, 1.3967416286468506, 1.4715807437896729, 1.5464198589324951, 1.6212589740753174, 1.6960980892181396, 1.770937204360962, 1.8457763195037842, 1.9206154346466064, 1.9954545497894287, 2.070293664932251, 2.1451327800750732, 2.2199718952178955, 2.2948110103607178, 2.36965012550354, 2.4444892406463623, 2.5193283557891846, 2.594167470932007, 2.669006586074829, 2.7438457012176514, 2.8186845779418945, 2.893523693084717, 2.968362808227539, 3.0432019233703613, 3.1180410385131836, 3.192880153656006, 3.267719268798828, 3.3425583839416504, 3.4173974990844727, 3.492236614227295, 3.567075729370117, 3.6419148445129395, 3.7167539596557617, 3.791593074798584, 3.8664321899414062, 3.9412713050842285, 4.016110420227051]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 6.0, 11.0, 11.0, 15.0, 16.0, 13.0, 27.0, 20.0, 24.0, 15.0, 24.0, 21.0, 32.0, 29.0, 28.0, 26.0, 40.0, 40.0, 44.0, 33.0, 29.0, 48.0, 38.0, 26.0, 44.0, 36.0, 32.0, 32.0, 23.0, 26.0, 33.0, 20.0, 18.0, 20.0, 17.0, 14.0, 13.0, 4.0, 6.0, 9.0, 8.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 4.0], "bins": [-0.7017074823379517, -0.6809483170509338, -0.660189151763916, -0.639430046081543, -0.6186708807945251, -0.5979117155075073, -0.5771525502204895, -0.5563933849334717, -0.5356342792510986, -0.5148751139640808, -0.4941159784793854, -0.47335681319236755, -0.4525976777076721, -0.4318385124206543, -0.4110793471336365, -0.39032018184661865, -0.36956101655960083, -0.348801851272583, -0.3280427157878876, -0.30728355050086975, -0.2865244150161743, -0.2657652497291565, -0.24500608444213867, -0.22424693405628204, -0.20348778367042542, -0.1827286332845688, -0.16196948289871216, -0.14121031761169434, -0.12045116722583771, -0.09969201683998108, -0.07893285900354385, -0.05817370116710663, -0.037414610385894775, -0.01665545627474785, 0.004103697836399078, 0.024862851947546005, 0.04562200605869293, 0.06638115644454956, 0.08714031428098679, 0.10789947211742401, 0.12865862250328064, 0.14941777288913727, 0.1701769232749939, 0.19093608856201172, 0.21169523894786835, 0.23245438933372498, 0.2532135546207428, 0.27397269010543823, 0.29473185539245605, 0.3154910206794739, 0.3362501561641693, 0.35700932145118713, 0.37776845693588257, 0.3985276222229004, 0.4192867875099182, 0.44004595279693604, 0.46080508828163147, 0.4815642535686493, 0.5023233890533447, 0.5230825543403625, 0.5438417196273804, 0.5646008253097534, 0.5853599905967712, 0.6061191558837891, 0.6268783211708069]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 12.0, 8.0, 13.0, 20.0, 28.0, 37.0, 50.0, 89.0, 147.0, 212.0, 330.0, 570.0, 878.0, 1432.0, 2380.0, 4169.0, 7301.0, 12677.0, 22927.0, 41326.0, 78832.0, 152936.0, 244342.0, 216927.0, 121189.0, 62756.0, 33478.0, 18258.0, 10489.0, 6028.0, 3512.0, 1980.0, 1246.0, 731.0, 445.0, 275.0, 184.0, 122.0, 69.0, 46.0, 33.0, 23.0, 14.0, 13.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2027587890625, -0.1961803436279297, -0.18960189819335938, -0.18302345275878906, -0.17644500732421875, -0.16986656188964844, -0.16328811645507812, -0.1567096710205078, -0.1501312255859375, -0.1435527801513672, -0.13697433471679688, -0.13039588928222656, -0.12381744384765625, -0.11723899841308594, -0.11066055297851562, -0.10408210754394531, -0.097503662109375, -0.09092521667480469, -0.08434677124023438, -0.07776832580566406, -0.07118988037109375, -0.06461143493652344, -0.058032989501953125, -0.05145454406738281, -0.0448760986328125, -0.03829765319824219, -0.031719207763671875, -0.025140762329101562, -0.01856231689453125, -0.011983871459960938, -0.005405426025390625, 0.0011730194091796875, 0.00775146484375, 0.014329910278320312, 0.020908355712890625, 0.027486801147460938, 0.03406524658203125, 0.04064369201660156, 0.047222137451171875, 0.05380058288574219, 0.0603790283203125, 0.06695747375488281, 0.07353591918945312, 0.08011436462402344, 0.08669281005859375, 0.09327125549316406, 0.09984970092773438, 0.10642814636230469, 0.113006591796875, 0.11958503723144531, 0.12616348266601562, 0.13274192810058594, 0.13932037353515625, 0.14589881896972656, 0.15247726440429688, 0.1590557098388672, 0.1656341552734375, 0.1722126007080078, 0.17879104614257812, 0.18536949157714844, 0.19194793701171875, 0.19852638244628906, 0.20510482788085938, 0.2116832733154297, 0.21826171875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 7.0, 10.0, 14.0, 18.0, 19.0, 27.0, 25.0, 39.0, 37.0, 58.0, 49.0, 42.0, 49.0, 51.0, 56.0, 48.0, 49.0, 46.0, 59.0, 46.0, 47.0, 32.0, 27.0, 25.0, 24.0, 23.0, 17.0, 15.0, 7.0, 7.0, 6.0, 2.0, 1.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2293701171875, -0.2227783203125, -0.2161865234375, -0.2095947265625, -0.2030029296875, -0.1964111328125, -0.1898193359375, -0.1832275390625, -0.1766357421875, -0.1700439453125, -0.1634521484375, -0.1568603515625, -0.1502685546875, -0.1436767578125, -0.1370849609375, -0.1304931640625, -0.1239013671875, -0.1173095703125, -0.1107177734375, -0.1041259765625, -0.0975341796875, -0.0909423828125, -0.0843505859375, -0.0777587890625, -0.0711669921875, -0.0645751953125, -0.0579833984375, -0.0513916015625, -0.0447998046875, -0.0382080078125, -0.0316162109375, -0.0250244140625, -0.0184326171875, -0.0118408203125, -0.0052490234375, 0.0013427734375, 0.0079345703125, 0.0145263671875, 0.0211181640625, 0.0277099609375, 0.0343017578125, 0.0408935546875, 0.0474853515625, 0.0540771484375, 0.0606689453125, 0.0672607421875, 0.0738525390625, 0.0804443359375, 0.0870361328125, 0.0936279296875, 0.1002197265625, 0.1068115234375, 0.1134033203125, 0.1199951171875, 0.1265869140625, 0.1331787109375, 0.1397705078125, 0.1463623046875, 0.1529541015625, 0.1595458984375, 0.1661376953125, 0.1727294921875, 0.1793212890625, 0.1859130859375, 0.1925048828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 3.0, 11.0, 11.0, 9.0, 20.0, 13.0, 25.0, 33.0, 31.0, 72.0, 129.0, 319.0, 1243.0, 5609.0, 27901.0, 151770.0, 629574.0, 189410.0, 33402.0, 6610.0, 1498.0, 415.0, 138.0, 73.0, 62.0, 44.0, 26.0, 19.0, 20.0, 12.0, 9.0, 6.0, 8.0, 4.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63232421875, -0.610931396484375, -0.58953857421875, -0.568145751953125, -0.5467529296875, -0.525360107421875, -0.50396728515625, -0.482574462890625, -0.461181640625, -0.439788818359375, -0.41839599609375, -0.397003173828125, -0.3756103515625, -0.354217529296875, -0.33282470703125, -0.311431884765625, -0.2900390625, -0.268646240234375, -0.24725341796875, -0.225860595703125, -0.2044677734375, -0.183074951171875, -0.16168212890625, -0.140289306640625, -0.118896484375, -0.097503662109375, -0.07611083984375, -0.054718017578125, -0.0333251953125, -0.011932373046875, 0.00946044921875, 0.030853271484375, 0.05224609375, 0.073638916015625, 0.09503173828125, 0.116424560546875, 0.1378173828125, 0.159210205078125, 0.18060302734375, 0.201995849609375, 0.223388671875, 0.244781494140625, 0.26617431640625, 0.287567138671875, 0.3089599609375, 0.330352783203125, 0.35174560546875, 0.373138427734375, 0.39453125, 0.415924072265625, 0.43731689453125, 0.458709716796875, 0.4801025390625, 0.501495361328125, 0.52288818359375, 0.544281005859375, 0.565673828125, 0.587066650390625, 0.60845947265625, 0.629852294921875, 0.6512451171875, 0.672637939453125, 0.69403076171875, 0.715423583984375, 0.73681640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 13.0, 6.0, 13.0, 12.0, 12.0, 13.0, 27.0, 29.0, 27.0, 42.0, 36.0, 34.0, 59.0, 56.0, 54.0, 48.0, 55.0, 58.0, 62.0, 38.0, 45.0, 41.0, 38.0, 18.0, 35.0, 15.0, 21.0, 20.0, 10.0, 9.0, 10.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63818359375, -0.61895751953125, -0.5997314453125, -0.58050537109375, -0.561279296875, -0.54205322265625, -0.5228271484375, -0.50360107421875, -0.484375, -0.46514892578125, -0.4459228515625, -0.42669677734375, -0.407470703125, -0.38824462890625, -0.3690185546875, -0.34979248046875, -0.33056640625, -0.31134033203125, -0.2921142578125, -0.27288818359375, -0.253662109375, -0.23443603515625, -0.2152099609375, -0.19598388671875, -0.1767578125, -0.15753173828125, -0.1383056640625, -0.11907958984375, -0.099853515625, -0.08062744140625, -0.0614013671875, -0.04217529296875, -0.02294921875, -0.00372314453125, 0.0155029296875, 0.03472900390625, 0.053955078125, 0.07318115234375, 0.0924072265625, 0.11163330078125, 0.130859375, 0.15008544921875, 0.1693115234375, 0.18853759765625, 0.207763671875, 0.22698974609375, 0.2462158203125, 0.26544189453125, 0.28466796875, 0.30389404296875, 0.3231201171875, 0.34234619140625, 0.361572265625, 0.38079833984375, 0.4000244140625, 0.41925048828125, 0.4384765625, 0.45770263671875, 0.4769287109375, 0.49615478515625, 0.515380859375, 0.53460693359375, 0.5538330078125, 0.57305908203125, 0.59228515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 11.0, 7.0, 20.0, 21.0, 24.0, 41.0, 65.0, 83.0, 110.0, 155.0, 279.0, 465.0, 757.0, 1395.0, 2509.0, 5211.0, 11441.0, 25377.0, 58400.0, 134153.0, 332548.0, 278393.0, 108997.0, 47675.0, 21174.0, 9605.0, 4432.0, 2200.0, 1158.0, 687.0, 360.0, 259.0, 180.0, 98.0, 67.0, 58.0, 32.0, 30.0, 23.0, 17.0, 11.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.14531898498535156, -0.14061355590820312, -0.1359081268310547, -0.13120269775390625, -0.1264972686767578, -0.12179183959960938, -0.11708641052246094, -0.1123809814453125, -0.10767555236816406, -0.10297012329101562, -0.09826469421386719, -0.09355926513671875, -0.08885383605957031, -0.08414840698242188, -0.07944297790527344, -0.074737548828125, -0.07003211975097656, -0.06532669067382812, -0.06062126159667969, -0.05591583251953125, -0.05121040344238281, -0.046504974365234375, -0.04179954528808594, -0.0370941162109375, -0.03238868713378906, -0.027683258056640625, -0.022977828979492188, -0.01827239990234375, -0.013566970825195312, -0.008861541748046875, -0.0041561126708984375, 0.00054931640625, 0.0052547454833984375, 0.009960174560546875, 0.014665603637695312, 0.01937103271484375, 0.024076461791992188, 0.028781890869140625, 0.03348731994628906, 0.0381927490234375, 0.04289817810058594, 0.047603607177734375, 0.05230903625488281, 0.05701446533203125, 0.06171989440917969, 0.06642532348632812, 0.07113075256347656, 0.075836181640625, 0.08054161071777344, 0.08524703979492188, 0.08995246887207031, 0.09465789794921875, 0.09936332702636719, 0.10406875610351562, 0.10877418518066406, 0.1134796142578125, 0.11818504333496094, 0.12289047241210938, 0.1275959014892578, 0.13230133056640625, 0.1370067596435547, 0.14171218872070312, 0.14641761779785156, 0.151123046875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 5.0, 9.0, 8.0, 11.0, 9.0, 16.0, 12.0, 22.0, 20.0, 20.0, 35.0, 39.0, 56.0, 68.0, 88.0, 82.0, 89.0, 68.0, 58.0, 58.0, 40.0, 29.0, 21.0, 15.0, 22.0, 19.0, 11.0, 6.0, 15.0, 9.0, 7.0, 7.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1723099052906036e-05, -2.0856037735939026e-05, -1.9988976418972015e-05, -1.9121915102005005e-05, -1.8254853785037994e-05, -1.7387792468070984e-05, -1.6520731151103973e-05, -1.5653669834136963e-05, -1.4786608517169952e-05, -1.3919547200202942e-05, -1.3052485883235931e-05, -1.2185424566268921e-05, -1.131836324930191e-05, -1.04513019323349e-05, -9.58424061536789e-06, -8.717179298400879e-06, -7.850117981433868e-06, -6.983056664466858e-06, -6.115995347499847e-06, -5.248934030532837e-06, -4.381872713565826e-06, -3.514811396598816e-06, -2.6477500796318054e-06, -1.780688762664795e-06, -9.136274456977844e-07, -4.6566128730773926e-08, 8.204951882362366e-07, 1.687556505203247e-06, 2.5546178221702576e-06, 3.421679139137268e-06, 4.2887404561042786e-06, 5.155801773071289e-06, 6.0228630900382996e-06, 6.88992440700531e-06, 7.75698572397232e-06, 8.624047040939331e-06, 9.491108357906342e-06, 1.0358169674873352e-05, 1.1225230991840363e-05, 1.2092292308807373e-05, 1.2959353625774384e-05, 1.3826414942741394e-05, 1.4693476259708405e-05, 1.5560537576675415e-05, 1.6427598893642426e-05, 1.7294660210609436e-05, 1.8161721527576447e-05, 1.9028782844543457e-05, 1.9895844161510468e-05, 2.0762905478477478e-05, 2.162996679544449e-05, 2.24970281124115e-05, 2.336408942937851e-05, 2.423115074634552e-05, 2.509821206331253e-05, 2.596527338027954e-05, 2.683233469724655e-05, 2.7699396014213562e-05, 2.8566457331180573e-05, 2.9433518648147583e-05, 3.0300579965114594e-05, 3.1167641282081604e-05, 3.2034702599048615e-05, 3.2901763916015625e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 10.0, 17.0, 22.0, 24.0, 45.0, 69.0, 96.0, 136.0, 236.0, 445.0, 1124.0, 3437.0, 12448.0, 54271.0, 258464.0, 543614.0, 133702.0, 29510.0, 7128.0, 2091.0, 771.0, 326.0, 194.0, 103.0, 72.0, 53.0, 37.0, 26.0, 20.0, 13.0, 15.0, 9.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.245361328125, -0.23726272583007812, -0.22916412353515625, -0.22106552124023438, -0.2129669189453125, -0.20486831665039062, -0.19676971435546875, -0.18867111206054688, -0.180572509765625, -0.17247390747070312, -0.16437530517578125, -0.15627670288085938, -0.1481781005859375, -0.14007949829101562, -0.13198089599609375, -0.12388229370117188, -0.11578369140625, -0.10768508911132812, -0.09958648681640625, -0.09148788452148438, -0.0833892822265625, -0.07529067993164062, -0.06719207763671875, -0.059093475341796875, -0.050994873046875, -0.042896270751953125, -0.03479766845703125, -0.026699066162109375, -0.0186004638671875, -0.010501861572265625, -0.00240325927734375, 0.005695343017578125, 0.0137939453125, 0.021892547607421875, 0.02999114990234375, 0.038089752197265625, 0.0461883544921875, 0.054286956787109375, 0.06238555908203125, 0.07048416137695312, 0.078582763671875, 0.08668136596679688, 0.09477996826171875, 0.10287857055664062, 0.1109771728515625, 0.11907577514648438, 0.12717437744140625, 0.13527297973632812, 0.14337158203125, 0.15147018432617188, 0.15956878662109375, 0.16766738891601562, 0.1757659912109375, 0.18386459350585938, 0.19196319580078125, 0.20006179809570312, 0.208160400390625, 0.21625900268554688, 0.22435760498046875, 0.23245620727539062, 0.2405548095703125, 0.24865341186523438, 0.25675201416015625, 0.2648506164550781, 0.27294921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 10.0, 14.0, 12.0, 17.0, 31.0, 51.0, 53.0, 71.0, 123.0, 172.0, 128.0, 92.0, 48.0, 46.0, 37.0, 35.0, 21.0, 13.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332763671875, -0.3241443634033203, -0.3155250549316406, -0.30690574645996094, -0.29828643798828125, -0.28966712951660156, -0.2810478210449219, -0.2724285125732422, -0.2638092041015625, -0.2551898956298828, -0.24657058715820312, -0.23795127868652344, -0.22933197021484375, -0.22071266174316406, -0.21209335327148438, -0.2034740447998047, -0.194854736328125, -0.1862354278564453, -0.17761611938476562, -0.16899681091308594, -0.16037750244140625, -0.15175819396972656, -0.14313888549804688, -0.1345195770263672, -0.1259002685546875, -0.11728096008300781, -0.10866165161132812, -0.10004234313964844, -0.09142303466796875, -0.08280372619628906, -0.07418441772460938, -0.06556510925292969, -0.05694580078125, -0.04832649230957031, -0.039707183837890625, -0.031087875366210938, -0.02246856689453125, -0.013849258422851562, -0.005229949951171875, 0.0033893585205078125, 0.0120086669921875, 0.020627975463867188, 0.029247283935546875, 0.03786659240722656, 0.04648590087890625, 0.05510520935058594, 0.06372451782226562, 0.07234382629394531, 0.080963134765625, 0.08958244323730469, 0.09820175170898438, 0.10682106018066406, 0.11544036865234375, 0.12405967712402344, 0.13267898559570312, 0.1412982940673828, 0.1499176025390625, 0.1585369110107422, 0.16715621948242188, 0.17577552795410156, 0.18439483642578125, 0.19301414489746094, 0.20163345336914062, 0.2102527618408203, 0.2188720703125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 18.0, 31.0, 60.0, 102.0, 150.0, 201.0, 179.0, 119.0, 80.0, 40.0, 11.0, 9.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.127254009246826, -4.0386176109313965, -3.9499809741973877, -3.861344337463379, -3.772707939147949, -3.6840713024139404, -3.5954349040985107, -3.506798267364502, -3.4181618690490723, -3.3295252323150635, -3.240888833999634, -3.152252197265625, -3.0636157989501953, -2.9749791622161865, -2.886342763900757, -2.797706127166748, -2.7090697288513184, -2.6204330921173096, -2.53179669380188, -2.443160057067871, -2.3545236587524414, -2.2658870220184326, -2.177250623703003, -2.088613986968994, -1.9999773502349854, -1.9113408327102661, -1.8227043151855469, -1.7340677976608276, -1.6454312801361084, -1.5567947626113892, -1.46815824508667, -1.3795216083526611, -1.2908852100372314, -1.2022486925125122, -1.113612174987793, -1.0249756574630737, -0.9363391399383545, -0.8477026224136353, -0.7590660452842712, -0.670429527759552, -0.5817930102348328, -0.4931564927101135, -0.4045199751853943, -0.31588342785835266, -0.22724691033363342, -0.13861039280891418, -0.04997384548187256, 0.03866267204284668, 0.12729918956756592, 0.21593570709228516, 0.3045722246170044, 0.393208771944046, 0.48184528946876526, 0.5704817771911621, 0.6591183543205261, 0.7477548718452454, 0.8363913893699646, 0.9250279068946838, 1.0136644840240479, 1.102301001548767, 1.1909375190734863, 1.2795740365982056, 1.3682105541229248, 1.456847071647644, 1.5454835891723633]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 7.0, 8.0, 6.0, 10.0, 6.0, 15.0, 8.0, 15.0, 26.0, 24.0, 26.0, 45.0, 22.0, 27.0, 30.0, 46.0, 46.0, 49.0, 49.0, 41.0, 42.0, 30.0, 48.0, 52.0, 41.0, 38.0, 34.0, 37.0, 31.0, 21.0, 20.0, 19.0, 13.0, 16.0, 10.0, 7.0, 6.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1887855529785156, -1.145653247833252, -1.1025210618972778, -1.0593887567520142, -1.01625657081604, -0.9731242656707764, -0.9299919605255127, -0.8868597149848938, -0.8437274694442749, -0.800595223903656, -0.7574629783630371, -0.7143306732177734, -0.6711984276771545, -0.6280661821365356, -0.584933876991272, -0.5418016314506531, -0.4986693859100342, -0.4555371403694153, -0.412404865026474, -0.3692725896835327, -0.3261403441429138, -0.2830080986022949, -0.23987582325935364, -0.19674354791641235, -0.15361130237579346, -0.11047904193401337, -0.06734678149223328, -0.024214521050453186, 0.018917739391326904, 0.062049999833106995, 0.10518226027488708, 0.14831453561782837, 0.19144690036773682, 0.2345791608095169, 0.277711421251297, 0.3208436965942383, 0.3639759421348572, 0.4071081876754761, 0.45024046301841736, 0.49337273836135864, 0.5365049839019775, 0.5796372294425964, 0.6227694749832153, 0.665901780128479, 0.7090340256690979, 0.7521662712097168, 0.7952985763549805, 0.8384308218955994, 0.8815630674362183, 0.9246953129768372, 0.967827558517456, 1.0109598636627197, 1.0540921688079834, 1.0972243547439575, 1.1403566598892212, 1.1834888458251953, 1.226621150970459, 1.2697534561157227, 1.3128856420516968, 1.3560179471969604, 1.3991501331329346, 1.4422824382781982, 1.485414743423462, 1.5285470485687256, 1.5716792345046997]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 13.0, 10.0, 11.0, 21.0, 36.0, 54.0, 89.0, 138.0, 214.0, 284.0, 489.0, 767.0, 1224.0, 2111.0, 3593.0, 6336.0, 11517.0, 20630.0, 38623.0, 74848.0, 156484.0, 372481.0, 1001492.0, 1441724.0, 602304.0, 235665.0, 105980.0, 53399.0, 28114.0, 15376.0, 8356.0, 4843.0, 2771.0, 1591.0, 1000.0, 627.0, 354.0, 242.0, 166.0, 99.0, 78.0, 35.0, 26.0, 22.0, 25.0, 11.0, 6.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.173828125, -0.16843795776367188, -0.16304779052734375, -0.15765762329101562, -0.1522674560546875, -0.14687728881835938, -0.14148712158203125, -0.13609695434570312, -0.130706787109375, -0.12531661987304688, -0.11992645263671875, -0.11453628540039062, -0.1091461181640625, -0.10375595092773438, -0.09836578369140625, -0.09297561645507812, -0.08758544921875, -0.08219528198242188, -0.07680511474609375, -0.07141494750976562, -0.0660247802734375, -0.060634613037109375, -0.05524444580078125, -0.049854278564453125, -0.044464111328125, -0.039073944091796875, -0.03368377685546875, -0.028293609619140625, -0.0229034423828125, -0.017513275146484375, -0.01212310791015625, -0.006732940673828125, -0.0013427734375, 0.004047393798828125, 0.00943756103515625, 0.014827728271484375, 0.0202178955078125, 0.025608062744140625, 0.03099822998046875, 0.036388397216796875, 0.041778564453125, 0.047168731689453125, 0.05255889892578125, 0.057949066162109375, 0.0633392333984375, 0.06872940063476562, 0.07411956787109375, 0.07950973510742188, 0.08489990234375, 0.09029006958007812, 0.09568023681640625, 0.10107040405273438, 0.1064605712890625, 0.11185073852539062, 0.11724090576171875, 0.12263107299804688, 0.128021240234375, 0.13341140747070312, 0.13880157470703125, 0.14419174194335938, 0.1495819091796875, 0.15497207641601562, 0.16036224365234375, 0.16575241088867188, 0.171142578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 6.0, 11.0, 13.0, 11.0, 10.0, 20.0, 15.0, 21.0, 30.0, 25.0, 29.0, 36.0, 31.0, 53.0, 40.0, 47.0, 46.0, 43.0, 49.0, 44.0, 43.0, 34.0, 41.0, 47.0, 41.0, 35.0, 28.0, 27.0, 19.0, 11.0, 23.0, 14.0, 10.0, 11.0, 12.0, 7.0, 4.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.175537109375, -0.1695098876953125, -0.163482666015625, -0.1574554443359375, -0.15142822265625, -0.1454010009765625, -0.139373779296875, -0.1333465576171875, -0.1273193359375, -0.1212921142578125, -0.115264892578125, -0.1092376708984375, -0.10321044921875, -0.0971832275390625, -0.091156005859375, -0.0851287841796875, -0.0791015625, -0.0730743408203125, -0.067047119140625, -0.0610198974609375, -0.05499267578125, -0.0489654541015625, -0.042938232421875, -0.0369110107421875, -0.0308837890625, -0.0248565673828125, -0.018829345703125, -0.0128021240234375, -0.00677490234375, -0.0007476806640625, 0.005279541015625, 0.0113067626953125, 0.017333984375, 0.0233612060546875, 0.029388427734375, 0.0354156494140625, 0.04144287109375, 0.0474700927734375, 0.053497314453125, 0.0595245361328125, 0.0655517578125, 0.0715789794921875, 0.077606201171875, 0.0836334228515625, 0.08966064453125, 0.0956878662109375, 0.101715087890625, 0.1077423095703125, 0.11376953125, 0.1197967529296875, 0.125823974609375, 0.1318511962890625, 0.13787841796875, 0.1439056396484375, 0.149932861328125, 0.1559600830078125, 0.1619873046875, 0.1680145263671875, 0.174041748046875, 0.1800689697265625, 0.18609619140625, 0.1921234130859375, 0.198150634765625, 0.2041778564453125, 0.210205078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 13.0, 10.0, 12.0, 31.0, 46.0, 76.0, 105.0, 164.0, 198.0, 325.0, 508.0, 805.0, 1296.0, 2319.0, 4236.0, 8074.0, 16493.0, 36031.0, 86716.0, 222424.0, 692067.0, 1889378.0, 809333.0, 249845.0, 95717.0, 40180.0, 18281.0, 8801.0, 4548.0, 2452.0, 1377.0, 866.0, 516.0, 330.0, 240.0, 144.0, 100.0, 61.0, 47.0, 40.0, 27.0, 14.0, 11.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0], "bins": [-0.32568359375, -0.3165245056152344, -0.30736541748046875, -0.2982063293457031, -0.2890472412109375, -0.2798881530761719, -0.27072906494140625, -0.2615699768066406, -0.252410888671875, -0.24325180053710938, -0.23409271240234375, -0.22493362426757812, -0.2157745361328125, -0.20661544799804688, -0.19745635986328125, -0.18829727172851562, -0.17913818359375, -0.16997909545898438, -0.16082000732421875, -0.15166091918945312, -0.1425018310546875, -0.13334274291992188, -0.12418365478515625, -0.11502456665039062, -0.105865478515625, -0.09670639038085938, -0.08754730224609375, -0.07838821411132812, -0.0692291259765625, -0.060070037841796875, -0.05091094970703125, -0.041751861572265625, -0.0325927734375, -0.023433685302734375, -0.01427459716796875, -0.005115509033203125, 0.0040435791015625, 0.013202667236328125, 0.02236175537109375, 0.031520843505859375, 0.040679931640625, 0.049839019775390625, 0.05899810791015625, 0.06815719604492188, 0.0773162841796875, 0.08647537231445312, 0.09563446044921875, 0.10479354858398438, 0.11395263671875, 0.12311172485351562, 0.13227081298828125, 0.14142990112304688, 0.1505889892578125, 0.15974807739257812, 0.16890716552734375, 0.17806625366210938, 0.187225341796875, 0.19638442993164062, 0.20554351806640625, 0.21470260620117188, 0.2238616943359375, 0.23302078247070312, 0.24217987060546875, 0.2513389587402344, 0.260498046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 8.0, 17.0, 14.0, 22.0, 26.0, 49.0, 60.0, 84.0, 113.0, 163.0, 224.0, 347.0, 507.0, 648.0, 566.0, 399.0, 238.0, 177.0, 109.0, 72.0, 51.0, 42.0, 21.0, 21.0, 16.0, 13.0, 10.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.375, -0.3631401062011719, -0.35128021240234375, -0.3394203186035156, -0.3275604248046875, -0.3157005310058594, -0.30384063720703125, -0.2919807434082031, -0.280120849609375, -0.2682609558105469, -0.25640106201171875, -0.24454116821289062, -0.2326812744140625, -0.22082138061523438, -0.20896148681640625, -0.19710159301757812, -0.18524169921875, -0.17338180541992188, -0.16152191162109375, -0.14966201782226562, -0.1378021240234375, -0.12594223022460938, -0.11408233642578125, -0.10222244262695312, -0.090362548828125, -0.07850265502929688, -0.06664276123046875, -0.054782867431640625, -0.0429229736328125, -0.031063079833984375, -0.01920318603515625, -0.007343292236328125, 0.0045166015625, 0.016376495361328125, 0.02823638916015625, 0.040096282958984375, 0.0519561767578125, 0.06381607055664062, 0.07567596435546875, 0.08753585815429688, 0.099395751953125, 0.11125564575195312, 0.12311553955078125, 0.13497543334960938, 0.1468353271484375, 0.15869522094726562, 0.17055511474609375, 0.18241500854492188, 0.19427490234375, 0.20613479614257812, 0.21799468994140625, 0.22985458374023438, 0.2417144775390625, 0.2535743713378906, 0.26543426513671875, 0.2772941589355469, 0.289154052734375, 0.3010139465332031, 0.31287384033203125, 0.3247337341308594, 0.3365936279296875, 0.3484535217285156, 0.36031341552734375, 0.3721733093261719, 0.384033203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 13.0, 21.0, 25.0, 40.0, 56.0, 66.0, 80.0, 103.0, 89.0, 88.0, 101.0, 70.0, 63.0, 55.0, 45.0, 24.0, 17.0, 10.0, 11.0, 6.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5935465097427368, -1.535908579826355, -1.4782705307006836, -1.4206326007843018, -1.3629945516586304, -1.3053566217422485, -1.2477185726165771, -1.1900806427001953, -1.1324427127838135, -1.0748047828674316, -1.0171667337417603, -0.9595288038253784, -0.901890754699707, -0.8442528247833252, -0.7866148352622986, -0.728976845741272, -0.6713387966156006, -0.613700807094574, -0.5560628175735474, -0.49842485785484314, -0.44078686833381653, -0.3831488788127899, -0.3255109190940857, -0.2678729295730591, -0.21023494005203247, -0.15259695053100586, -0.09495897591114044, -0.037321001291275024, 0.020316988229751587, 0.0779549777507782, 0.13559293746948242, 0.19323092699050903, 0.2508690357208252, 0.3085070252418518, 0.3661450147628784, 0.42378297448158264, 0.48142096400260925, 0.5390589237213135, 0.5966969132423401, 0.6543349027633667, 0.7119728922843933, 0.7696108818054199, 0.8272488713264465, 0.8848868608474731, 0.942524790763855, 1.0001628398895264, 1.0578007698059082, 1.11543869972229, 1.1730767488479614, 1.2307146787643433, 1.2883527278900146, 1.3459906578063965, 1.4036287069320679, 1.4612666368484497, 1.518904685974121, 1.576542615890503, 1.6341805458068848, 1.6918184757232666, 1.749456524848938, 1.8070944547653198, 1.8647325038909912, 1.922370433807373, 1.9800083637237549, 2.0376462936401367, 2.0952844619750977]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 10.0, 9.0, 13.0, 19.0, 16.0, 12.0, 11.0, 29.0, 33.0, 42.0, 34.0, 35.0, 50.0, 42.0, 42.0, 35.0, 53.0, 50.0, 34.0, 33.0, 28.0, 37.0, 45.0, 27.0, 35.0, 30.0, 26.0, 31.0, 24.0, 21.0, 21.0, 15.0, 8.0, 8.0, 4.0, 10.0, 8.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.049952745437622, -1.014439344406128, -0.9789260029792786, -0.9434126615524292, -0.9078992605209351, -0.8723858594894409, -0.8368725180625916, -0.8013591766357422, -0.765845775604248, -0.7303323745727539, -0.6948190331459045, -0.6593056917190552, -0.623792290687561, -0.5882788896560669, -0.5527655482292175, -0.5172522068023682, -0.481738805770874, -0.44622543454170227, -0.4107120633125305, -0.37519869208335876, -0.339685320854187, -0.30417194962501526, -0.2686585783958435, -0.23314520716667175, -0.1976318359375, -0.16211846470832825, -0.1266050934791565, -0.09109172224998474, -0.05557835102081299, -0.020064979791641235, 0.015448391437530518, 0.05096176266670227, 0.08647501468658447, 0.12198838591575623, 0.15750175714492798, 0.19301512837409973, 0.22852849960327148, 0.26404187083244324, 0.299555242061615, 0.33506861329078674, 0.3705819845199585, 0.40609535574913025, 0.441608726978302, 0.47712209820747375, 0.5126354694366455, 0.5481488704681396, 0.583662211894989, 0.6191755533218384, 0.6546889543533325, 0.6902023553848267, 0.725715696811676, 0.7612290382385254, 0.7967424392700195, 0.8322558403015137, 0.867769181728363, 0.9032825231552124, 0.9387959241867065, 0.9743093252182007, 1.0098226070404053, 1.0453360080718994, 1.0808494091033936, 1.1163628101348877, 1.1518762111663818, 1.1873894929885864, 1.2229028940200806]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 7.0, 3.0, 6.0, 15.0, 13.0, 30.0, 46.0, 70.0, 90.0, 137.0, 199.0, 305.0, 427.0, 725.0, 1059.0, 1778.0, 2666.0, 4139.0, 6696.0, 10314.0, 16504.0, 27383.0, 47421.0, 84765.0, 148496.0, 218273.0, 194157.0, 118886.0, 66871.0, 37564.0, 22071.0, 13569.0, 8529.0, 5464.0, 3526.0, 2214.0, 1394.0, 937.0, 631.0, 431.0, 262.0, 168.0, 108.0, 79.0, 40.0, 28.0, 27.0, 20.0, 12.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.21630859375, -0.2095050811767578, -0.20270156860351562, -0.19589805603027344, -0.18909454345703125, -0.18229103088378906, -0.17548751831054688, -0.1686840057373047, -0.1618804931640625, -0.1550769805908203, -0.14827346801757812, -0.14146995544433594, -0.13466644287109375, -0.12786293029785156, -0.12105941772460938, -0.11425590515136719, -0.107452392578125, -0.10064888000488281, -0.09384536743164062, -0.08704185485839844, -0.08023834228515625, -0.07343482971191406, -0.06663131713867188, -0.05982780456542969, -0.0530242919921875, -0.04622077941894531, -0.039417266845703125, -0.03261375427246094, -0.02581024169921875, -0.019006729125976562, -0.012203216552734375, -0.0053997039794921875, 0.00140380859375, 0.008207321166992188, 0.015010833740234375, 0.021814346313476562, 0.02861785888671875, 0.03542137145996094, 0.042224884033203125, 0.04902839660644531, 0.0558319091796875, 0.06263542175292969, 0.06943893432617188, 0.07624244689941406, 0.08304595947265625, 0.08984947204589844, 0.09665298461914062, 0.10345649719238281, 0.110260009765625, 0.11706352233886719, 0.12386703491210938, 0.13067054748535156, 0.13747406005859375, 0.14427757263183594, 0.15108108520507812, 0.1578845977783203, 0.1646881103515625, 0.1714916229248047, 0.17829513549804688, 0.18509864807128906, 0.19190216064453125, 0.19870567321777344, 0.20550918579101562, 0.2123126983642578, 0.2191162109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 4.0, 7.0, 3.0, 11.0, 17.0, 9.0, 14.0, 19.0, 31.0, 32.0, 25.0, 27.0, 35.0, 41.0, 39.0, 46.0, 58.0, 45.0, 50.0, 44.0, 49.0, 34.0, 36.0, 40.0, 42.0, 36.0, 46.0, 31.0, 16.0, 15.0, 24.0, 16.0, 17.0, 9.0, 13.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19096946716308594, -0.18455123901367188, -0.1781330108642578, -0.17171478271484375, -0.1652965545654297, -0.15887832641601562, -0.15246009826660156, -0.1460418701171875, -0.13962364196777344, -0.13320541381835938, -0.1267871856689453, -0.12036895751953125, -0.11395072937011719, -0.10753250122070312, -0.10111427307128906, -0.094696044921875, -0.08827781677246094, -0.08185958862304688, -0.07544136047363281, -0.06902313232421875, -0.06260490417480469, -0.056186676025390625, -0.04976844787597656, -0.0433502197265625, -0.03693199157714844, -0.030513763427734375, -0.024095535278320312, -0.01767730712890625, -0.011259078979492188, -0.004840850830078125, 0.0015773773193359375, 0.00799560546875, 0.014413833618164062, 0.020832061767578125, 0.027250289916992188, 0.03366851806640625, 0.04008674621582031, 0.046504974365234375, 0.05292320251464844, 0.0593414306640625, 0.06575965881347656, 0.07217788696289062, 0.07859611511230469, 0.08501434326171875, 0.09143257141113281, 0.09785079956054688, 0.10426902770996094, 0.110687255859375, 0.11710548400878906, 0.12352371215820312, 0.1299419403076172, 0.13636016845703125, 0.1427783966064453, 0.14919662475585938, 0.15561485290527344, 0.1620330810546875, 0.16845130920410156, 0.17486953735351562, 0.1812877655029297, 0.18770599365234375, 0.1941242218017578, 0.20054244995117188, 0.20696067810058594, 0.21337890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 11.0, 12.0, 19.0, 25.0, 32.0, 49.0, 58.0, 100.0, 149.0, 228.0, 389.0, 805.0, 1758.0, 4313.0, 11283.0, 29847.0, 81243.0, 224161.0, 384289.0, 196071.0, 70532.0, 26093.0, 9967.0, 3822.0, 1612.0, 698.0, 358.0, 196.0, 130.0, 89.0, 61.0, 48.0, 30.0, 18.0, 8.0, 10.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439697265625, -0.4257087707519531, -0.41172027587890625, -0.3977317810058594, -0.3837432861328125, -0.3697547912597656, -0.35576629638671875, -0.3417778015136719, -0.327789306640625, -0.3138008117675781, -0.29981231689453125, -0.2858238220214844, -0.2718353271484375, -0.2578468322753906, -0.24385833740234375, -0.22986984252929688, -0.21588134765625, -0.20189285278320312, -0.18790435791015625, -0.17391586303710938, -0.1599273681640625, -0.14593887329101562, -0.13195037841796875, -0.11796188354492188, -0.103973388671875, -0.08998489379882812, -0.07599639892578125, -0.062007904052734375, -0.0480194091796875, -0.034030914306640625, -0.02004241943359375, -0.006053924560546875, 0.0079345703125, 0.021923065185546875, 0.03591156005859375, 0.049900054931640625, 0.0638885498046875, 0.07787704467773438, 0.09186553955078125, 0.10585403442382812, 0.119842529296875, 0.13383102416992188, 0.14781951904296875, 0.16180801391601562, 0.1757965087890625, 0.18978500366210938, 0.20377349853515625, 0.21776199340820312, 0.23175048828125, 0.24573898315429688, 0.25972747802734375, 0.2737159729003906, 0.2877044677734375, 0.3016929626464844, 0.31568145751953125, 0.3296699523925781, 0.343658447265625, 0.3576469421386719, 0.37163543701171875, 0.3856239318847656, 0.3996124267578125, 0.4136009216308594, 0.42758941650390625, 0.4415779113769531, 0.45556640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 8.0, 5.0, 9.0, 7.0, 8.0, 14.0, 13.0, 17.0, 22.0, 30.0, 26.0, 20.0, 27.0, 29.0, 42.0, 40.0, 45.0, 51.0, 40.0, 33.0, 49.0, 53.0, 48.0, 40.0, 43.0, 30.0, 31.0, 34.0, 23.0, 28.0, 27.0, 22.0, 16.0, 12.0, 15.0, 8.0, 8.0, 6.0, 6.0, 4.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.5201187133789062, -0.5001983642578125, -0.48027801513671875, -0.460357666015625, -0.44043731689453125, -0.4205169677734375, -0.40059661865234375, -0.38067626953125, -0.36075592041015625, -0.3408355712890625, -0.32091522216796875, -0.300994873046875, -0.28107452392578125, -0.2611541748046875, -0.24123382568359375, -0.2213134765625, -0.20139312744140625, -0.1814727783203125, -0.16155242919921875, -0.141632080078125, -0.12171173095703125, -0.1017913818359375, -0.08187103271484375, -0.06195068359375, -0.04203033447265625, -0.0221099853515625, -0.00218963623046875, 0.017730712890625, 0.03765106201171875, 0.0575714111328125, 0.07749176025390625, 0.097412109375, 0.11733245849609375, 0.1372528076171875, 0.15717315673828125, 0.177093505859375, 0.19701385498046875, 0.2169342041015625, 0.23685455322265625, 0.25677490234375, 0.27669525146484375, 0.2966156005859375, 0.31653594970703125, 0.336456298828125, 0.35637664794921875, 0.3762969970703125, 0.39621734619140625, 0.4161376953125, 0.43605804443359375, 0.4559783935546875, 0.47589874267578125, 0.495819091796875, 0.5157394409179688, 0.5356597900390625, 0.5555801391601562, 0.57550048828125, 0.5954208374023438, 0.6153411865234375, 0.6352615356445312, 0.655181884765625, 0.6751022338867188, 0.6950225830078125, 0.7149429321289062, 0.73486328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 19.0, 26.0, 39.0, 76.0, 90.0, 153.0, 292.0, 533.0, 1205.0, 3236.0, 9269.0, 30137.0, 103699.0, 346570.0, 381191.0, 120389.0, 34516.0, 10689.0, 3629.0, 1467.0, 548.0, 313.0, 172.0, 96.0, 64.0, 47.0, 28.0, 16.0, 11.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.257568359375, -0.25061798095703125, -0.2436676025390625, -0.23671722412109375, -0.229766845703125, -0.22281646728515625, -0.2158660888671875, -0.20891571044921875, -0.20196533203125, -0.19501495361328125, -0.1880645751953125, -0.18111419677734375, -0.174163818359375, -0.16721343994140625, -0.1602630615234375, -0.15331268310546875, -0.1463623046875, -0.13941192626953125, -0.1324615478515625, -0.12551116943359375, -0.118560791015625, -0.11161041259765625, -0.1046600341796875, -0.09770965576171875, -0.09075927734375, -0.08380889892578125, -0.0768585205078125, -0.06990814208984375, -0.062957763671875, -0.05600738525390625, -0.0490570068359375, -0.04210662841796875, -0.03515625, -0.02820587158203125, -0.0212554931640625, -0.01430511474609375, -0.007354736328125, -0.00040435791015625, 0.0065460205078125, 0.01349639892578125, 0.02044677734375, 0.02739715576171875, 0.0343475341796875, 0.04129791259765625, 0.048248291015625, 0.05519866943359375, 0.0621490478515625, 0.06909942626953125, 0.0760498046875, 0.08300018310546875, 0.0899505615234375, 0.09690093994140625, 0.103851318359375, 0.11080169677734375, 0.1177520751953125, 0.12470245361328125, 0.13165283203125, 0.13860321044921875, 0.1455535888671875, 0.15250396728515625, 0.159454345703125, 0.16640472412109375, 0.1733551025390625, 0.18030548095703125, 0.187255859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 5.0, 6.0, 10.0, 9.0, 16.0, 6.0, 13.0, 26.0, 41.0, 44.0, 64.0, 90.0, 98.0, 112.0, 102.0, 99.0, 71.0, 46.0, 38.0, 24.0, 19.0, 16.0, 8.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57763671875e-05, -4.428252577781677e-05, -4.2788684368133545e-05, -4.129484295845032e-05, -3.980100154876709e-05, -3.830716013908386e-05, -3.6813318729400635e-05, -3.531947731971741e-05, -3.382563591003418e-05, -3.233179450035095e-05, -3.0837953090667725e-05, -2.9344111680984497e-05, -2.785027027130127e-05, -2.6356428861618042e-05, -2.4862587451934814e-05, -2.3368746042251587e-05, -2.187490463256836e-05, -2.0381063222885132e-05, -1.8887221813201904e-05, -1.7393380403518677e-05, -1.589953899383545e-05, -1.4405697584152222e-05, -1.2911856174468994e-05, -1.1418014764785767e-05, -9.924173355102539e-06, -8.430331945419312e-06, -6.936490535736084e-06, -5.4426491260528564e-06, -3.948807716369629e-06, -2.4549663066864014e-06, -9.611248970031738e-07, 5.327165126800537e-07, 2.0265579223632812e-06, 3.520399332046509e-06, 5.014240741729736e-06, 6.508082151412964e-06, 8.001923561096191e-06, 9.495764970779419e-06, 1.0989606380462646e-05, 1.2483447790145874e-05, 1.3977289199829102e-05, 1.547113060951233e-05, 1.6964972019195557e-05, 1.8458813428878784e-05, 1.9952654838562012e-05, 2.144649624824524e-05, 2.2940337657928467e-05, 2.4434179067611694e-05, 2.5928020477294922e-05, 2.742186188697815e-05, 2.8915703296661377e-05, 3.0409544706344604e-05, 3.190338611602783e-05, 3.339722752571106e-05, 3.489106893539429e-05, 3.6384910345077515e-05, 3.787875175476074e-05, 3.937259316444397e-05, 4.08664345741272e-05, 4.2360275983810425e-05, 4.385411739349365e-05, 4.534795880317688e-05, 4.684180021286011e-05, 4.8335641622543335e-05, 4.982948303222656e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 8.0, 18.0, 33.0, 52.0, 108.0, 190.0, 444.0, 1053.0, 2869.0, 9656.0, 34108.0, 120935.0, 353151.0, 354242.0, 122876.0, 34222.0, 9704.0, 2932.0, 1027.0, 468.0, 222.0, 97.0, 55.0, 35.0, 16.0, 14.0, 9.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17409515380859375, -0.1676483154296875, -0.16120147705078125, -0.154754638671875, -0.14830780029296875, -0.1418609619140625, -0.13541412353515625, -0.12896728515625, -0.12252044677734375, -0.1160736083984375, -0.10962677001953125, -0.103179931640625, -0.09673309326171875, -0.0902862548828125, -0.08383941650390625, -0.077392578125, -0.07094573974609375, -0.0644989013671875, -0.05805206298828125, -0.051605224609375, -0.04515838623046875, -0.0387115478515625, -0.03226470947265625, -0.02581787109375, -0.01937103271484375, -0.0129241943359375, -0.00647735595703125, -3.0517578125e-05, 0.00641632080078125, 0.0128631591796875, 0.01930999755859375, 0.0257568359375, 0.03220367431640625, 0.0386505126953125, 0.04509735107421875, 0.051544189453125, 0.05799102783203125, 0.0644378662109375, 0.07088470458984375, 0.07733154296875, 0.08377838134765625, 0.0902252197265625, 0.09667205810546875, 0.103118896484375, 0.10956573486328125, 0.1160125732421875, 0.12245941162109375, 0.12890625, 0.13535308837890625, 0.1417999267578125, 0.14824676513671875, 0.154693603515625, 0.16114044189453125, 0.1675872802734375, 0.17403411865234375, 0.18048095703125, 0.18692779541015625, 0.1933746337890625, 0.19982147216796875, 0.206268310546875, 0.21271514892578125, 0.2191619873046875, 0.22560882568359375, 0.2320556640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 14.0, 16.0, 14.0, 21.0, 21.0, 35.0, 39.0, 51.0, 57.0, 80.0, 69.0, 63.0, 79.0, 85.0, 73.0, 41.0, 43.0, 33.0, 32.0, 28.0, 27.0, 12.0, 7.0, 9.0, 4.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.1833362579345703, -0.17721939086914062, -0.17110252380371094, -0.16498565673828125, -0.15886878967285156, -0.15275192260742188, -0.1466350555419922, -0.1405181884765625, -0.1344013214111328, -0.12828445434570312, -0.12216758728027344, -0.11605072021484375, -0.10993385314941406, -0.10381698608398438, -0.09770011901855469, -0.091583251953125, -0.08546638488769531, -0.07934951782226562, -0.07323265075683594, -0.06711578369140625, -0.06099891662597656, -0.054882049560546875, -0.04876518249511719, -0.0426483154296875, -0.03653144836425781, -0.030414581298828125, -0.024297714233398438, -0.01818084716796875, -0.012063980102539062, -0.005947113037109375, 0.0001697540283203125, 0.00628662109375, 0.012403488159179688, 0.018520355224609375, 0.024637222290039062, 0.03075408935546875, 0.03687095642089844, 0.042987823486328125, 0.04910469055175781, 0.0552215576171875, 0.06133842468261719, 0.06745529174804688, 0.07357215881347656, 0.07968902587890625, 0.08580589294433594, 0.09192276000976562, 0.09803962707519531, 0.104156494140625, 0.11027336120605469, 0.11639022827148438, 0.12250709533691406, 0.12862396240234375, 0.13474082946777344, 0.14085769653320312, 0.1469745635986328, 0.1530914306640625, 0.1592082977294922, 0.16532516479492188, 0.17144203186035156, 0.17755889892578125, 0.18367576599121094, 0.18979263305664062, 0.1959095001220703, 0.2020263671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 9.0, 16.0, 27.0, 74.0, 176.0, 239.0, 215.0, 157.0, 61.0, 17.0, 12.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.999882698059082, -7.848831653594971, -7.697780609130859, -7.546729564666748, -7.395678520202637, -7.244627475738525, -7.093576431274414, -6.942525386810303, -6.791474342346191, -6.64042329788208, -6.489372253417969, -6.338321208953857, -6.187270164489746, -6.036219120025635, -5.885168075561523, -5.734117031097412, -5.583065986633301, -5.4320149421691895, -5.280963897705078, -5.129912853240967, -4.9788618087768555, -4.827810764312744, -4.676759719848633, -4.5257086753845215, -4.374658107757568, -4.223607063293457, -4.072556018829346, -3.9215049743652344, -3.770453929901123, -3.6194028854370117, -3.4683518409729004, -3.317300796508789, -3.166250228881836, -3.0151991844177246, -2.8641481399536133, -2.713097095489502, -2.5620460510253906, -2.4109950065612793, -2.259943962097168, -2.1088929176330566, -1.9578418731689453, -1.806790828704834, -1.6557397842407227, -1.5046887397766113, -1.3536376953125, -1.2025866508483887, -1.051535725593567, -0.9004846811294556, -0.7494336366653442, -0.5983825922012329, -0.44733157753944397, -0.29628056287765503, -0.1452295184135437, 0.005821526050567627, 0.15687251091003418, 0.3079235553741455, 0.45897459983825684, 0.6100256443023682, 0.7610766887664795, 0.912127673625946, 1.0631787776947021, 1.2142298221588135, 1.3652807474136353, 1.5163317918777466, 1.667382836341858]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 8.0, 12.0, 10.0, 19.0, 17.0, 15.0, 24.0, 20.0, 25.0, 26.0, 23.0, 27.0, 38.0, 32.0, 29.0, 39.0, 36.0, 40.0, 36.0, 29.0, 47.0, 44.0, 38.0, 41.0, 37.0, 32.0, 23.0, 31.0, 22.0, 26.0, 22.0, 18.0, 22.0, 12.0, 10.0, 11.0, 6.0, 4.0, 12.0, 9.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5738106966018677, -1.5221275091171265, -1.4704443216323853, -1.4187610149383545, -1.3670778274536133, -1.315394639968872, -1.2637114524841309, -1.2120282649993896, -1.1603450775146484, -1.1086618900299072, -1.056978702545166, -1.0052955150604248, -0.953612208366394, -0.9019290208816528, -0.8502458333969116, -0.7985626459121704, -0.7468793392181396, -0.6951961517333984, -0.6435129046440125, -0.5918297171592712, -0.5401464700698853, -0.48846328258514404, -0.43678009510040283, -0.38509687781333923, -0.33341366052627563, -0.28173044323921204, -0.23004724085330963, -0.17836403846740723, -0.12668082118034363, -0.07499760389328003, -0.02331441640853882, 0.02836880087852478, 0.08005213737487793, 0.13173535466194153, 0.18341855704784393, 0.23510175943374634, 0.28678497672080994, 0.33846819400787354, 0.39015138149261475, 0.44183459877967834, 0.49351781606674194, 0.5452010035514832, 0.5968842506408691, 0.6485674381256104, 0.7002506256103516, 0.7519338726997375, 0.8036170601844788, 0.8553003072738647, 0.906983494758606, 0.9586666822433472, 1.0103498697280884, 1.0620331764221191, 1.1137163639068604, 1.1653995513916016, 1.2170827388763428, 1.268765926361084, 1.3204491138458252, 1.3721323013305664, 1.4238154888153076, 1.4754986763000488, 1.5271819829940796, 1.5788651704788208, 1.630548357963562, 1.6822315454483032, 1.733914852142334]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 7.0, 13.0, 26.0, 22.0, 36.0, 54.0, 83.0, 117.0, 208.0, 368.0, 567.0, 945.0, 1464.0, 2567.0, 4389.0, 7382.0, 12461.0, 21909.0, 39041.0, 71368.0, 142793.0, 313827.0, 772323.0, 1427510.0, 761401.0, 310303.0, 140753.0, 70846.0, 38709.0, 21706.0, 12583.0, 7190.0, 4321.0, 2649.0, 1661.0, 931.0, 625.0, 428.0, 234.0, 158.0, 115.0, 54.0, 53.0, 26.0, 17.0, 15.0, 9.0, 3.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0], "bins": [-0.197509765625, -0.19161224365234375, -0.1857147216796875, -0.17981719970703125, -0.173919677734375, -0.16802215576171875, -0.1621246337890625, -0.15622711181640625, -0.15032958984375, -0.14443206787109375, -0.1385345458984375, -0.13263702392578125, -0.126739501953125, -0.12084197998046875, -0.1149444580078125, -0.10904693603515625, -0.1031494140625, -0.09725189208984375, -0.0913543701171875, -0.08545684814453125, -0.079559326171875, -0.07366180419921875, -0.0677642822265625, -0.06186676025390625, -0.05596923828125, -0.05007171630859375, -0.0441741943359375, -0.03827667236328125, -0.032379150390625, -0.02648162841796875, -0.0205841064453125, -0.01468658447265625, -0.0087890625, -0.00289154052734375, 0.0030059814453125, 0.00890350341796875, 0.014801025390625, 0.02069854736328125, 0.0265960693359375, 0.03249359130859375, 0.03839111328125, 0.04428863525390625, 0.0501861572265625, 0.05608367919921875, 0.061981201171875, 0.06787872314453125, 0.0737762451171875, 0.07967376708984375, 0.0855712890625, 0.09146881103515625, 0.0973663330078125, 0.10326385498046875, 0.109161376953125, 0.11505889892578125, 0.1209564208984375, 0.12685394287109375, 0.13275146484375, 0.13864898681640625, 0.1445465087890625, 0.15044403076171875, 0.156341552734375, 0.16223907470703125, 0.1681365966796875, 0.17403411865234375, 0.179931640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 5.0, 9.0, 11.0, 16.0, 12.0, 21.0, 24.0, 23.0, 19.0, 32.0, 27.0, 23.0, 41.0, 44.0, 38.0, 51.0, 41.0, 48.0, 43.0, 46.0, 48.0, 34.0, 33.0, 30.0, 26.0, 33.0, 28.0, 31.0, 18.0, 23.0, 16.0, 10.0, 11.0, 10.0, 18.0, 6.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.1965923309326172, -0.18981552124023438, -0.18303871154785156, -0.17626190185546875, -0.16948509216308594, -0.16270828247070312, -0.1559314727783203, -0.1491546630859375, -0.1423778533935547, -0.13560104370117188, -0.12882423400878906, -0.12204742431640625, -0.11527061462402344, -0.10849380493164062, -0.10171699523925781, -0.094940185546875, -0.08816337585449219, -0.08138656616210938, -0.07460975646972656, -0.06783294677734375, -0.06105613708496094, -0.054279327392578125, -0.04750251770019531, -0.0407257080078125, -0.03394889831542969, -0.027172088623046875, -0.020395278930664062, -0.01361846923828125, -0.0068416595458984375, -6.4849853515625e-05, 0.0067119598388671875, 0.01348876953125, 0.020265579223632812, 0.027042388916015625, 0.03381919860839844, 0.04059600830078125, 0.04737281799316406, 0.054149627685546875, 0.06092643737792969, 0.0677032470703125, 0.07448005676269531, 0.08125686645507812, 0.08803367614746094, 0.09481048583984375, 0.10158729553222656, 0.10836410522460938, 0.11514091491699219, 0.121917724609375, 0.1286945343017578, 0.13547134399414062, 0.14224815368652344, 0.14902496337890625, 0.15580177307128906, 0.16257858276367188, 0.1693553924560547, 0.1761322021484375, 0.1829090118408203, 0.18968582153320312, 0.19646263122558594, 0.20323944091796875, 0.21001625061035156, 0.21679306030273438, 0.2235698699951172, 0.2303466796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 20.0, 22.0, 32.0, 34.0, 54.0, 93.0, 133.0, 210.0, 333.0, 613.0, 1184.0, 2321.0, 4891.0, 10570.0, 25092.0, 61064.0, 156107.0, 442792.0, 1550388.0, 1328430.0, 378517.0, 136984.0, 53792.0, 22073.0, 9468.0, 4320.0, 2075.0, 1095.0, 583.0, 366.0, 199.0, 135.0, 66.0, 57.0, 42.0, 26.0, 17.0, 14.0, 15.0, 9.0, 8.0, 7.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.331085205078125, -0.31964111328125, -0.308197021484375, -0.2967529296875, -0.285308837890625, -0.27386474609375, -0.262420654296875, -0.2509765625, -0.239532470703125, -0.22808837890625, -0.216644287109375, -0.2052001953125, -0.193756103515625, -0.18231201171875, -0.170867919921875, -0.159423828125, -0.147979736328125, -0.13653564453125, -0.125091552734375, -0.1136474609375, -0.102203369140625, -0.09075927734375, -0.079315185546875, -0.06787109375, -0.056427001953125, -0.04498291015625, -0.033538818359375, -0.0220947265625, -0.010650634765625, 0.00079345703125, 0.012237548828125, 0.023681640625, 0.035125732421875, 0.04656982421875, 0.058013916015625, 0.0694580078125, 0.080902099609375, 0.09234619140625, 0.103790283203125, 0.115234375, 0.126678466796875, 0.13812255859375, 0.149566650390625, 0.1610107421875, 0.172454833984375, 0.18389892578125, 0.195343017578125, 0.206787109375, 0.218231201171875, 0.22967529296875, 0.241119384765625, 0.2525634765625, 0.264007568359375, 0.27545166015625, 0.286895751953125, 0.29833984375, 0.309783935546875, 0.32122802734375, 0.332672119140625, 0.3441162109375, 0.355560302734375, 0.36700439453125, 0.378448486328125, 0.389892578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 13.0, 20.0, 29.0, 32.0, 55.0, 88.0, 90.0, 140.0, 197.0, 272.0, 376.0, 564.0, 549.0, 462.0, 362.0, 217.0, 148.0, 112.0, 80.0, 50.0, 48.0, 34.0, 34.0, 19.0, 16.0, 11.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4072265625, -0.3932991027832031, -0.37937164306640625, -0.3654441833496094, -0.3515167236328125, -0.3375892639160156, -0.32366180419921875, -0.3097343444824219, -0.295806884765625, -0.2818794250488281, -0.26795196533203125, -0.2540245056152344, -0.2400970458984375, -0.22616958618164062, -0.21224212646484375, -0.19831466674804688, -0.18438720703125, -0.17045974731445312, -0.15653228759765625, -0.14260482788085938, -0.1286773681640625, -0.11474990844726562, -0.10082244873046875, -0.08689498901367188, -0.072967529296875, -0.059040069580078125, -0.04511260986328125, -0.031185150146484375, -0.0172576904296875, -0.003330230712890625, 0.01059722900390625, 0.024524688720703125, 0.0384521484375, 0.052379608154296875, 0.06630706787109375, 0.08023452758789062, 0.0941619873046875, 0.10808944702148438, 0.12201690673828125, 0.13594436645507812, 0.149871826171875, 0.16379928588867188, 0.17772674560546875, 0.19165420532226562, 0.2055816650390625, 0.21950912475585938, 0.23343658447265625, 0.24736404418945312, 0.26129150390625, 0.2752189636230469, 0.28914642333984375, 0.3030738830566406, 0.3170013427734375, 0.3309288024902344, 0.34485626220703125, 0.3587837219238281, 0.372711181640625, 0.3866386413574219, 0.40056610107421875, 0.4144935607910156, 0.4284210205078125, 0.4423484802246094, 0.45627593994140625, 0.4702033996582031, 0.484130859375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 8.0, 10.0, 15.0, 26.0, 25.0, 68.0, 56.0, 103.0, 109.0, 92.0, 126.0, 105.0, 89.0, 60.0, 24.0, 25.0, 25.0, 25.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.4839625358581543, -3.409820318222046, -3.3356781005859375, -3.261535882949829, -3.1873936653137207, -3.1132514476776123, -3.039109230041504, -2.9649672508239746, -2.890824794769287, -2.8166825771331787, -2.7425403594970703, -2.668398141860962, -2.5942559242248535, -2.520113706588745, -2.4459714889526367, -2.3718295097351074, -2.297687292098999, -2.2235450744628906, -2.1494028568267822, -2.075260639190674, -2.0011184215545654, -1.926976203918457, -1.8528341054916382, -1.7786918878555298, -1.7045496702194214, -1.630407452583313, -1.5562652349472046, -1.4821230173110962, -1.4079809188842773, -1.333838701248169, -1.2596964836120605, -1.1855542659759521, -1.1114120483398438, -1.0372698307037354, -0.963127613067627, -0.8889854550361633, -0.8148432374000549, -0.7407010197639465, -0.6665588617324829, -0.5924166440963745, -0.5182744264602661, -0.4441322088241577, -0.3699900209903717, -0.2958478331565857, -0.2217056155204773, -0.1475633978843689, -0.07342121005058289, 0.000720977783203125, 0.07486319541931152, 0.14900539815425873, 0.22314760088920593, 0.29728978872299194, 0.37143200635910034, 0.44557422399520874, 0.5197163820266724, 0.5938585996627808, 0.6680008172988892, 0.7421430349349976, 0.816285252571106, 0.8904274106025696, 0.964569628238678, 1.0387117862701416, 1.11285400390625, 1.1869962215423584, 1.2611384391784668]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 6.0, 8.0, 13.0, 7.0, 9.0, 15.0, 13.0, 17.0, 22.0, 28.0, 28.0, 34.0, 36.0, 40.0, 51.0, 35.0, 37.0, 46.0, 52.0, 46.0, 45.0, 47.0, 45.0, 39.0, 42.0, 39.0, 33.0, 19.0, 19.0, 26.0, 23.0, 16.0, 16.0, 12.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6356086730957031, -1.5899025201797485, -1.5441962480545044, -1.4984900951385498, -1.4527839422225952, -1.4070777893066406, -1.3613715171813965, -1.315665364265442, -1.2699592113494873, -1.2242530584335327, -1.1785467863082886, -1.132840633392334, -1.0871344804763794, -1.0414283275604248, -0.9957220554351807, -0.9500159025192261, -0.9043096303939819, -0.8586034178733826, -0.812897264957428, -0.7671910524368286, -0.721484899520874, -0.6757786870002747, -0.6300724744796753, -0.5843663215637207, -0.5386601090431213, -0.49295392632484436, -0.4472477436065674, -0.401541531085968, -0.35583534836769104, -0.31012916564941406, -0.2644229531288147, -0.21871677041053772, -0.1730104684829712, -0.1273042857646942, -0.08159808814525604, -0.03589189052581787, 0.009814292192459106, 0.055520474910736084, 0.10122668743133545, 0.14693287014961243, 0.1926390528678894, 0.23834523558616638, 0.28405141830444336, 0.3297576308250427, 0.3754638135433197, 0.4211699962615967, 0.46687620878219604, 0.5125824213027954, 0.55828857421875, 0.6039947867393494, 0.649700939655304, 0.6954071521759033, 0.7411133050918579, 0.7868195176124573, 0.8325257301330566, 0.8782318830490112, 0.9239380955696106, 0.96964430809021, 1.0153504610061646, 1.0610566139221191, 1.1067628860473633, 1.1524690389633179, 1.1981751918792725, 1.2438814640045166, 1.2895876169204712]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 7.0, 5.0, 13.0, 18.0, 22.0, 52.0, 76.0, 126.0, 170.0, 269.0, 338.0, 536.0, 851.0, 1275.0, 1930.0, 3011.0, 4512.0, 6873.0, 10699.0, 16996.0, 29125.0, 56131.0, 126842.0, 268961.0, 265284.0, 123498.0, 55031.0, 28666.0, 16755.0, 10724.0, 6806.0, 4505.0, 2901.0, 1923.0, 1198.0, 830.0, 527.0, 328.0, 255.0, 158.0, 111.0, 89.0, 49.0, 28.0, 19.0, 14.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.265869140625, -0.2575569152832031, -0.24924468994140625, -0.24093246459960938, -0.2326202392578125, -0.22430801391601562, -0.21599578857421875, -0.20768356323242188, -0.199371337890625, -0.19105911254882812, -0.18274688720703125, -0.17443466186523438, -0.1661224365234375, -0.15781021118164062, -0.14949798583984375, -0.14118576049804688, -0.13287353515625, -0.12456130981445312, -0.11624908447265625, -0.10793685913085938, -0.0996246337890625, -0.09131240844726562, -0.08300018310546875, -0.07468795776367188, -0.066375732421875, -0.058063507080078125, -0.04975128173828125, -0.041439056396484375, -0.0331268310546875, -0.024814605712890625, -0.01650238037109375, -0.008190155029296875, 0.0001220703125, 0.008434295654296875, 0.01674652099609375, 0.025058746337890625, 0.0333709716796875, 0.041683197021484375, 0.04999542236328125, 0.058307647705078125, 0.066619873046875, 0.07493209838867188, 0.08324432373046875, 0.09155654907226562, 0.0998687744140625, 0.10818099975585938, 0.11649322509765625, 0.12480545043945312, 0.13311767578125, 0.14142990112304688, 0.14974212646484375, 0.15805435180664062, 0.1663665771484375, 0.17467880249023438, 0.18299102783203125, 0.19130325317382812, 0.199615478515625, 0.20792770385742188, 0.21623992919921875, 0.22455215454101562, 0.2328643798828125, 0.24117660522460938, 0.24948883056640625, 0.2578010559082031, 0.26611328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 7.0, 15.0, 12.0, 21.0, 12.0, 23.0, 19.0, 21.0, 28.0, 40.0, 37.0, 36.0, 37.0, 42.0, 41.0, 30.0, 46.0, 49.0, 39.0, 48.0, 45.0, 47.0, 35.0, 38.0, 26.0, 36.0, 19.0, 17.0, 23.0, 16.0, 17.0, 15.0, 9.0, 6.0, 10.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.19200706481933594, -0.18491744995117188, -0.1778278350830078, -0.17073822021484375, -0.1636486053466797, -0.15655899047851562, -0.14946937561035156, -0.1423797607421875, -0.13529014587402344, -0.12820053100585938, -0.12111091613769531, -0.11402130126953125, -0.10693168640136719, -0.09984207153320312, -0.09275245666503906, -0.085662841796875, -0.07857322692871094, -0.07148361206054688, -0.06439399719238281, -0.05730438232421875, -0.05021476745605469, -0.043125152587890625, -0.03603553771972656, -0.0289459228515625, -0.021856307983398438, -0.014766693115234375, -0.0076770782470703125, -0.00058746337890625, 0.0065021514892578125, 0.013591766357421875, 0.020681381225585938, 0.02777099609375, 0.03486061096191406, 0.041950225830078125, 0.04903984069824219, 0.05612945556640625, 0.06321907043457031, 0.07030868530273438, 0.07739830017089844, 0.0844879150390625, 0.09157752990722656, 0.09866714477539062, 0.10575675964355469, 0.11284637451171875, 0.11993598937988281, 0.12702560424804688, 0.13411521911621094, 0.141204833984375, 0.14829444885253906, 0.15538406372070312, 0.1624736785888672, 0.16956329345703125, 0.1766529083251953, 0.18374252319335938, 0.19083213806152344, 0.1979217529296875, 0.20501136779785156, 0.21210098266601562, 0.2191905975341797, 0.22628021240234375, 0.2333698272705078, 0.24045944213867188, 0.24754905700683594, 0.254638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 14.0, 19.0, 30.0, 34.0, 47.0, 81.0, 138.0, 271.0, 507.0, 1161.0, 3165.0, 8925.0, 25148.0, 83749.0, 395489.0, 403719.0, 85575.0, 25646.0, 9051.0, 3332.0, 1265.0, 520.0, 262.0, 159.0, 75.0, 55.0, 28.0, 18.0, 12.0, 7.0, 10.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.60791015625, -0.5894927978515625, -0.571075439453125, -0.5526580810546875, -0.53424072265625, -0.5158233642578125, -0.497406005859375, -0.4789886474609375, -0.4605712890625, -0.4421539306640625, -0.423736572265625, -0.4053192138671875, -0.38690185546875, -0.3684844970703125, -0.350067138671875, -0.3316497802734375, -0.313232421875, -0.2948150634765625, -0.276397705078125, -0.2579803466796875, -0.23956298828125, -0.2211456298828125, -0.202728271484375, -0.1843109130859375, -0.1658935546875, -0.1474761962890625, -0.129058837890625, -0.1106414794921875, -0.09222412109375, -0.0738067626953125, -0.055389404296875, -0.0369720458984375, -0.0185546875, -0.0001373291015625, 0.018280029296875, 0.0366973876953125, 0.05511474609375, 0.0735321044921875, 0.091949462890625, 0.1103668212890625, 0.1287841796875, 0.1472015380859375, 0.165618896484375, 0.1840362548828125, 0.20245361328125, 0.2208709716796875, 0.239288330078125, 0.2577056884765625, 0.276123046875, 0.2945404052734375, 0.312957763671875, 0.3313751220703125, 0.34979248046875, 0.3682098388671875, 0.386627197265625, 0.4050445556640625, 0.4234619140625, 0.4418792724609375, 0.460296630859375, 0.4787139892578125, 0.49713134765625, 0.5155487060546875, 0.533966064453125, 0.5523834228515625, 0.57080078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 10.0, 5.0, 10.0, 6.0, 6.0, 9.0, 13.0, 11.0, 18.0, 16.0, 18.0, 19.0, 33.0, 27.0, 33.0, 33.0, 42.0, 37.0, 49.0, 43.0, 40.0, 40.0, 41.0, 44.0, 35.0, 36.0, 38.0, 37.0, 30.0, 29.0, 36.0, 28.0, 25.0, 18.0, 16.0, 12.0, 17.0, 6.0, 7.0, 5.0, 6.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6662368774414062, -0.6464385986328125, -0.6266403198242188, -0.606842041015625, -0.5870437622070312, -0.5672454833984375, -0.5474472045898438, -0.52764892578125, -0.5078506469726562, -0.4880523681640625, -0.46825408935546875, -0.448455810546875, -0.42865753173828125, -0.4088592529296875, -0.38906097412109375, -0.3692626953125, -0.34946441650390625, -0.3296661376953125, -0.30986785888671875, -0.290069580078125, -0.27027130126953125, -0.2504730224609375, -0.23067474365234375, -0.21087646484375, -0.19107818603515625, -0.1712799072265625, -0.15148162841796875, -0.131683349609375, -0.11188507080078125, -0.0920867919921875, -0.07228851318359375, -0.052490234375, -0.03269195556640625, -0.0128936767578125, 0.00690460205078125, 0.026702880859375, 0.04650115966796875, 0.0662994384765625, 0.08609771728515625, 0.10589599609375, 0.12569427490234375, 0.1454925537109375, 0.16529083251953125, 0.185089111328125, 0.20488739013671875, 0.2246856689453125, 0.24448394775390625, 0.2642822265625, 0.28408050537109375, 0.3038787841796875, 0.32367706298828125, 0.343475341796875, 0.36327362060546875, 0.3830718994140625, 0.40287017822265625, 0.42266845703125, 0.44246673583984375, 0.4622650146484375, 0.48206329345703125, 0.501861572265625, 0.5216598510742188, 0.5414581298828125, 0.5612564086914062, 0.5810546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 11.0, 16.0, 31.0, 25.0, 53.0, 84.0, 122.0, 208.0, 313.0, 511.0, 960.0, 1630.0, 3052.0, 5461.0, 9759.0, 17957.0, 32491.0, 59030.0, 113305.0, 227673.0, 266138.0, 145377.0, 74216.0, 40388.0, 22104.0, 12324.0, 6846.0, 3629.0, 1955.0, 1188.0, 639.0, 375.0, 224.0, 148.0, 93.0, 61.0, 48.0, 27.0, 20.0, 13.0, 10.0, 9.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.11492919921875, -0.11156654357910156, -0.10820388793945312, -0.10484123229980469, -0.10147857666015625, -0.09811592102050781, -0.09475326538085938, -0.09139060974121094, -0.0880279541015625, -0.08466529846191406, -0.08130264282226562, -0.07793998718261719, -0.07457733154296875, -0.07121467590332031, -0.06785202026367188, -0.06448936462402344, -0.061126708984375, -0.05776405334472656, -0.054401397705078125, -0.05103874206542969, -0.04767608642578125, -0.04431343078613281, -0.040950775146484375, -0.03758811950683594, -0.0342254638671875, -0.030862808227539062, -0.027500152587890625, -0.024137496948242188, -0.02077484130859375, -0.017412185668945312, -0.014049530029296875, -0.010686874389648438, -0.00732421875, -0.0039615631103515625, -0.000598907470703125, 0.0027637481689453125, 0.00612640380859375, 0.009489059448242188, 0.012851715087890625, 0.016214370727539062, 0.0195770263671875, 0.022939682006835938, 0.026302337646484375, 0.029664993286132812, 0.03302764892578125, 0.03639030456542969, 0.039752960205078125, 0.04311561584472656, 0.046478271484375, 0.04984092712402344, 0.053203582763671875, 0.05656623840332031, 0.05992889404296875, 0.06329154968261719, 0.06665420532226562, 0.07001686096191406, 0.0733795166015625, 0.07674217224121094, 0.08010482788085938, 0.08346748352050781, 0.08683013916015625, 0.09019279479980469, 0.09355545043945312, 0.09691810607910156, 0.10028076171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 9.0, 7.0, 20.0, 15.0, 24.0, 24.0, 43.0, 56.0, 62.0, 104.0, 123.0, 112.0, 93.0, 66.0, 45.0, 24.0, 22.0, 25.0, 22.0, 18.0, 14.0, 11.0, 6.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-4.8041343688964844e-05, -4.680175334215164e-05, -4.556216299533844e-05, -4.432257264852524e-05, -4.3082982301712036e-05, -4.1843391954898834e-05, -4.060380160808563e-05, -3.936421126127243e-05, -3.812462091445923e-05, -3.6885030567646027e-05, -3.5645440220832825e-05, -3.440584987401962e-05, -3.316625952720642e-05, -3.192666918039322e-05, -3.068707883358002e-05, -2.9447488486766815e-05, -2.8207898139953613e-05, -2.696830779314041e-05, -2.572871744632721e-05, -2.4489127099514008e-05, -2.3249536752700806e-05, -2.2009946405887604e-05, -2.0770356059074402e-05, -1.95307657122612e-05, -1.8291175365447998e-05, -1.7051585018634796e-05, -1.5811994671821594e-05, -1.4572404325008392e-05, -1.333281397819519e-05, -1.2093223631381989e-05, -1.0853633284568787e-05, -9.614042937755585e-06, -8.374452590942383e-06, -7.134862244129181e-06, -5.895271897315979e-06, -4.655681550502777e-06, -3.416091203689575e-06, -2.1765008568763733e-06, -9.369105100631714e-07, 3.026798367500305e-07, 1.5422701835632324e-06, 2.7818605303764343e-06, 4.021450877189636e-06, 5.261041224002838e-06, 6.50063157081604e-06, 7.740221917629242e-06, 8.979812264442444e-06, 1.0219402611255646e-05, 1.1458992958068848e-05, 1.269858330488205e-05, 1.3938173651695251e-05, 1.5177763998508453e-05, 1.6417354345321655e-05, 1.7656944692134857e-05, 1.889653503894806e-05, 2.013612538576126e-05, 2.1375715732574463e-05, 2.2615306079387665e-05, 2.3854896426200867e-05, 2.509448677301407e-05, 2.633407711982727e-05, 2.7573667466640472e-05, 2.8813257813453674e-05, 3.0052848160266876e-05, 3.129243850708008e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 16.0, 24.0, 37.0, 50.0, 62.0, 119.0, 189.0, 378.0, 688.0, 1251.0, 3115.0, 7744.0, 22126.0, 65256.0, 201087.0, 427966.0, 212756.0, 68520.0, 23074.0, 8233.0, 3047.0, 1246.0, 695.0, 333.0, 180.0, 124.0, 83.0, 56.0, 35.0, 13.0, 20.0, 11.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.231201171875, -0.22535133361816406, -0.21950149536132812, -0.2136516571044922, -0.20780181884765625, -0.2019519805908203, -0.19610214233398438, -0.19025230407714844, -0.1844024658203125, -0.17855262756347656, -0.17270278930664062, -0.1668529510498047, -0.16100311279296875, -0.1551532745361328, -0.14930343627929688, -0.14345359802246094, -0.137603759765625, -0.13175392150878906, -0.12590408325195312, -0.12005424499511719, -0.11420440673828125, -0.10835456848144531, -0.10250473022460938, -0.09665489196777344, -0.0908050537109375, -0.08495521545410156, -0.07910537719726562, -0.07325553894042969, -0.06740570068359375, -0.06155586242675781, -0.055706024169921875, -0.04985618591308594, -0.04400634765625, -0.03815650939941406, -0.032306671142578125, -0.026456832885742188, -0.02060699462890625, -0.014757156372070312, -0.008907318115234375, -0.0030574798583984375, 0.0027923583984375, 0.008642196655273438, 0.014492034912109375, 0.020341873168945312, 0.02619171142578125, 0.03204154968261719, 0.037891387939453125, 0.04374122619628906, 0.049591064453125, 0.05544090270996094, 0.061290740966796875, 0.06714057922363281, 0.07299041748046875, 0.07884025573730469, 0.08469009399414062, 0.09053993225097656, 0.0963897705078125, 0.10223960876464844, 0.10808944702148438, 0.11393928527832031, 0.11978912353515625, 0.1256389617919922, 0.13148880004882812, 0.13733863830566406, 0.1431884765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 7.0, 5.0, 8.0, 8.0, 10.0, 27.0, 25.0, 19.0, 24.0, 23.0, 26.0, 51.0, 55.0, 68.0, 74.0, 80.0, 71.0, 82.0, 56.0, 57.0, 40.0, 34.0, 18.0, 23.0, 17.0, 16.0, 19.0, 13.0, 9.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.145294189453125, -0.14056396484375, -0.135833740234375, -0.131103515625, -0.126373291015625, -0.12164306640625, -0.116912841796875, -0.1121826171875, -0.107452392578125, -0.10272216796875, -0.097991943359375, -0.09326171875, -0.088531494140625, -0.08380126953125, -0.079071044921875, -0.0743408203125, -0.069610595703125, -0.06488037109375, -0.060150146484375, -0.055419921875, -0.050689697265625, -0.04595947265625, -0.041229248046875, -0.0364990234375, -0.031768798828125, -0.02703857421875, -0.022308349609375, -0.017578125, -0.012847900390625, -0.00811767578125, -0.003387451171875, 0.0013427734375, 0.006072998046875, 0.01080322265625, 0.015533447265625, 0.020263671875, 0.024993896484375, 0.02972412109375, 0.034454345703125, 0.0391845703125, 0.043914794921875, 0.04864501953125, 0.053375244140625, 0.05810546875, 0.062835693359375, 0.06756591796875, 0.072296142578125, 0.0770263671875, 0.081756591796875, 0.08648681640625, 0.091217041015625, 0.095947265625, 0.100677490234375, 0.10540771484375, 0.110137939453125, 0.1148681640625, 0.119598388671875, 0.12432861328125, 0.129058837890625, 0.1337890625, 0.138519287109375, 0.14324951171875, 0.147979736328125, 0.1527099609375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 9.0, 21.0, 43.0, 57.0, 84.0, 102.0, 148.0, 145.0, 118.0, 90.0, 73.0, 38.0, 30.0, 20.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4471850395202637, -3.375609874725342, -3.30403470993042, -3.232459545135498, -3.160884380340576, -3.0893094539642334, -3.0177342891693115, -2.9461591243743896, -2.8745839595794678, -2.803008794784546, -2.731433629989624, -2.659858465194702, -2.5882835388183594, -2.5167083740234375, -2.4451332092285156, -2.3735580444335938, -2.301982879638672, -2.23040771484375, -2.158832550048828, -2.0872573852539062, -2.0156822204589844, -1.944107174873352, -1.8725321292877197, -1.8009569644927979, -1.729381799697876, -1.657806634902954, -1.5862314701080322, -1.5146564245224, -1.443081259727478, -1.3715060949325562, -1.2999310493469238, -1.228355884552002, -1.156780481338501, -1.085205316543579, -1.0136301517486572, -0.9420551061630249, -0.870479941368103, -0.7989047765731812, -0.727329671382904, -0.655754566192627, -0.5841794013977051, -0.5126042366027832, -0.4410291314125061, -0.3694539964199066, -0.29787886142730713, -0.22630372643470764, -0.15472859144210815, -0.08315348625183105, -0.01157832145690918, 0.05999681353569031, 0.1315719485282898, 0.20314708352088928, 0.27472221851348877, 0.34629735350608826, 0.41787248849868774, 0.48944759368896484, 0.5610227584838867, 0.6325979232788086, 0.7041730284690857, 0.7757481336593628, 0.8473232984542847, 0.9188984632492065, 0.9904735684394836, 1.0620486736297607, 1.1336238384246826]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 7.0, 11.0, 18.0, 20.0, 25.0, 20.0, 25.0, 24.0, 28.0, 39.0, 27.0, 44.0, 34.0, 48.0, 44.0, 49.0, 40.0, 50.0, 36.0, 38.0, 36.0, 35.0, 31.0, 26.0, 37.0, 22.0, 22.0, 21.0, 16.0, 17.0, 18.0, 14.0, 6.0, 8.0, 9.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.459937334060669, -1.4134941101074219, -1.3670508861541748, -1.3206076622009277, -1.2741644382476807, -1.2277213335037231, -1.181278109550476, -1.134834885597229, -1.088391661643982, -1.0419484376907349, -0.9955052137374878, -0.9490620493888855, -0.9026188254356384, -0.8561756014823914, -0.8097324371337891, -0.763289213180542, -0.7168459892272949, -0.6704027652740479, -0.6239595413208008, -0.5775163769721985, -0.5310731530189514, -0.48462992906570435, -0.43818673491477966, -0.391743540763855, -0.3453003168106079, -0.29885709285736084, -0.25241389870643616, -0.20597068965435028, -0.1595274806022644, -0.11308427155017853, -0.06664106249809265, -0.02019786834716797, 0.0262453556060791, 0.07268856465816498, 0.11913177371025085, 0.16557498276233673, 0.2120181918144226, 0.2584614157676697, 0.30490460991859436, 0.35134780406951904, 0.3977910280227661, 0.4442342519760132, 0.49067744612693787, 0.5371206402778625, 0.5835638642311096, 0.6300070881843567, 0.676450252532959, 0.722893476486206, 0.7693367004394531, 0.8157799243927002, 0.8622231483459473, 0.9086663126945496, 0.9551095366477966, 1.001552700996399, 1.047995924949646, 1.094439148902893, 1.1408823728561401, 1.1873255968093872, 1.2337688207626343, 1.2802120447158813, 1.3266551494598389, 1.373098373413086, 1.419541597366333, 1.46598482131958, 1.5124280452728271]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 10.0, 8.0, 18.0, 21.0, 36.0, 49.0, 80.0, 128.0, 231.0, 434.0, 705.0, 1198.0, 2130.0, 3692.0, 6926.0, 12572.0, 23139.0, 43539.0, 85511.0, 189653.0, 540564.0, 1647827.0, 1048552.0, 320165.0, 130695.0, 63745.0, 32961.0, 17976.0, 9467.0, 5383.0, 3016.0, 1702.0, 895.0, 517.0, 308.0, 162.0, 104.0, 66.0, 34.0, 26.0, 18.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2427978515625, -0.23538970947265625, -0.2279815673828125, -0.22057342529296875, -0.213165283203125, -0.20575714111328125, -0.1983489990234375, -0.19094085693359375, -0.18353271484375, -0.17612457275390625, -0.1687164306640625, -0.16130828857421875, -0.153900146484375, -0.14649200439453125, -0.1390838623046875, -0.13167572021484375, -0.124267578125, -0.11685943603515625, -0.1094512939453125, -0.10204315185546875, -0.094635009765625, -0.08722686767578125, -0.0798187255859375, -0.07241058349609375, -0.06500244140625, -0.05759429931640625, -0.0501861572265625, -0.04277801513671875, -0.035369873046875, -0.02796173095703125, -0.0205535888671875, -0.01314544677734375, -0.0057373046875, 0.00167083740234375, 0.0090789794921875, 0.01648712158203125, 0.023895263671875, 0.03130340576171875, 0.0387115478515625, 0.04611968994140625, 0.05352783203125, 0.06093597412109375, 0.0683441162109375, 0.07575225830078125, 0.083160400390625, 0.09056854248046875, 0.0979766845703125, 0.10538482666015625, 0.11279296875, 0.12020111083984375, 0.1276092529296875, 0.13501739501953125, 0.142425537109375, 0.14983367919921875, 0.1572418212890625, 0.16464996337890625, 0.17205810546875, 0.17946624755859375, 0.1868743896484375, 0.19428253173828125, 0.201690673828125, 0.20909881591796875, 0.2165069580078125, 0.22391510009765625, 0.2313232421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 10.0, 8.0, 3.0, 10.0, 10.0, 5.0, 17.0, 19.0, 19.0, 23.0, 33.0, 26.0, 36.0, 28.0, 37.0, 25.0, 38.0, 42.0, 35.0, 33.0, 46.0, 43.0, 38.0, 39.0, 40.0, 38.0, 30.0, 31.0, 41.0, 36.0, 27.0, 21.0, 18.0, 10.0, 11.0, 16.0, 10.0, 9.0, 12.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.207275390625, -0.20090103149414062, -0.19452667236328125, -0.18815231323242188, -0.1817779541015625, -0.17540359497070312, -0.16902923583984375, -0.16265487670898438, -0.156280517578125, -0.14990615844726562, -0.14353179931640625, -0.13715744018554688, -0.1307830810546875, -0.12440872192382812, -0.11803436279296875, -0.11166000366210938, -0.10528564453125, -0.09891128540039062, -0.09253692626953125, -0.08616256713867188, -0.0797882080078125, -0.07341384887695312, -0.06703948974609375, -0.060665130615234375, -0.054290771484375, -0.047916412353515625, -0.04154205322265625, -0.035167694091796875, -0.0287933349609375, -0.022418975830078125, -0.01604461669921875, -0.009670257568359375, -0.0032958984375, 0.003078460693359375, 0.00945281982421875, 0.015827178955078125, 0.0222015380859375, 0.028575897216796875, 0.03495025634765625, 0.041324615478515625, 0.047698974609375, 0.054073333740234375, 0.06044769287109375, 0.06682205200195312, 0.0731964111328125, 0.07957077026367188, 0.08594512939453125, 0.09231948852539062, 0.09869384765625, 0.10506820678710938, 0.11144256591796875, 0.11781692504882812, 0.1241912841796875, 0.13056564331054688, 0.13694000244140625, 0.14331436157226562, 0.149688720703125, 0.15606307983398438, 0.16243743896484375, 0.16881179809570312, 0.1751861572265625, 0.18156051635742188, 0.18793487548828125, 0.19430923461914062, 0.20068359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 19.0, 40.0, 46.0, 78.0, 118.0, 182.0, 270.0, 371.0, 680.0, 973.0, 1593.0, 2530.0, 4053.0, 6536.0, 10889.0, 17893.0, 30498.0, 52181.0, 93137.0, 172829.0, 368105.0, 1023029.0, 1384606.0, 526130.0, 224366.0, 115497.0, 64120.0, 37195.0, 22207.0, 13082.0, 8085.0, 4723.0, 3058.0, 1812.0, 1176.0, 764.0, 471.0, 314.0, 205.0, 119.0, 91.0, 56.0, 46.0, 19.0, 16.0, 14.0, 10.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.242431640625, -0.23512649536132812, -0.22782135009765625, -0.22051620483398438, -0.2132110595703125, -0.20590591430664062, -0.19860076904296875, -0.19129562377929688, -0.183990478515625, -0.17668533325195312, -0.16938018798828125, -0.16207504272460938, -0.1547698974609375, -0.14746475219726562, -0.14015960693359375, -0.13285446166992188, -0.12554931640625, -0.11824417114257812, -0.11093902587890625, -0.10363388061523438, -0.0963287353515625, -0.08902359008789062, -0.08171844482421875, -0.07441329956054688, -0.067108154296875, -0.059803009033203125, -0.05249786376953125, -0.045192718505859375, -0.0378875732421875, -0.030582427978515625, -0.02327728271484375, -0.015972137451171875, -0.0086669921875, -0.001361846923828125, 0.00594329833984375, 0.013248443603515625, 0.0205535888671875, 0.027858734130859375, 0.03516387939453125, 0.042469024658203125, 0.049774169921875, 0.057079315185546875, 0.06438446044921875, 0.07168960571289062, 0.0789947509765625, 0.08629989624023438, 0.09360504150390625, 0.10091018676757812, 0.10821533203125, 0.11552047729492188, 0.12282562255859375, 0.13013076782226562, 0.1374359130859375, 0.14474105834960938, 0.15204620361328125, 0.15935134887695312, 0.166656494140625, 0.17396163940429688, 0.18126678466796875, 0.18857192993164062, 0.1958770751953125, 0.20318222045898438, 0.21048736572265625, 0.21779251098632812, 0.22509765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 12.0, 6.0, 13.0, 12.0, 18.0, 30.0, 35.0, 37.0, 56.0, 61.0, 86.0, 114.0, 155.0, 208.0, 321.0, 481.0, 626.0, 527.0, 350.0, 262.0, 141.0, 105.0, 88.0, 81.0, 46.0, 31.0, 32.0, 27.0, 21.0, 17.0, 12.0, 7.0, 9.0, 6.0, 6.0, 6.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.468017578125, -0.4555549621582031, -0.44309234619140625, -0.4306297302246094, -0.4181671142578125, -0.4057044982910156, -0.39324188232421875, -0.3807792663574219, -0.368316650390625, -0.3558540344238281, -0.34339141845703125, -0.3309288024902344, -0.3184661865234375, -0.3060035705566406, -0.29354095458984375, -0.2810783386230469, -0.26861572265625, -0.2561531066894531, -0.24369049072265625, -0.23122787475585938, -0.2187652587890625, -0.20630264282226562, -0.19384002685546875, -0.18137741088867188, -0.168914794921875, -0.15645217895507812, -0.14398956298828125, -0.13152694702148438, -0.1190643310546875, -0.10660171508789062, -0.09413909912109375, -0.08167648315429688, -0.0692138671875, -0.056751251220703125, -0.04428863525390625, -0.031826019287109375, -0.0193634033203125, -0.006900787353515625, 0.00556182861328125, 0.018024444580078125, 0.030487060546875, 0.042949676513671875, 0.05541229248046875, 0.06787490844726562, 0.0803375244140625, 0.09280014038085938, 0.10526275634765625, 0.11772537231445312, 0.13018798828125, 0.14265060424804688, 0.15511322021484375, 0.16757583618164062, 0.1800384521484375, 0.19250106811523438, 0.20496368408203125, 0.21742630004882812, 0.229888916015625, 0.24235153198242188, 0.25481414794921875, 0.2672767639160156, 0.2797393798828125, 0.2922019958496094, 0.30466461181640625, 0.3171272277832031, 0.32958984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 20.0, 38.0, 76.0, 111.0, 153.0, 178.0, 152.0, 125.0, 69.0, 30.0, 29.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.265247106552124, -2.149266242980957, -2.03328537940979, -1.9173043966293335, -1.8013235330581665, -1.6853426694869995, -1.569361686706543, -1.453380823135376, -1.337399959564209, -1.221419095993042, -1.105438232421875, -0.9894572496414185, -0.8734763860702515, -0.7574955224990845, -0.6415145993232727, -0.5255336761474609, -0.40955281257629395, -0.29357191920280457, -0.17759102582931519, -0.061610132455825806, 0.054370760917663574, 0.17035162448883057, 0.28633254766464233, 0.4023134708404541, 0.5182943344116211, 0.6342751979827881, 0.7502561211585999, 0.8662370443344116, 0.9822179079055786, 1.0981987714767456, 1.2141797542572021, 1.3301606178283691, 1.4461417198181152, 1.5621225833892822, 1.6781034469604492, 1.7940844297409058, 1.9100652933120728, 2.0260462760925293, 2.1420271396636963, 2.2580080032348633, 2.3739888668060303, 2.4899697303771973, 2.6059505939483643, 2.7219314575195312, 2.8379125595092773, 2.9538931846618652, 3.0698742866516113, 3.1858551502227783, 3.3018360137939453, 3.4178168773651123, 3.5337977409362793, 3.6497786045074463, 3.7657594680786133, 3.8817405700683594, 3.9977214336395264, 4.113702297210693, 4.229682922363281, 4.345664024353027, 4.461644649505615, 4.577625751495361, 4.693606376647949, 4.809587478637695, 4.925568103790283, 5.041549205780029, 5.157530307769775]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 5.0, 11.0, 14.0, 15.0, 13.0, 26.0, 22.0, 29.0, 22.0, 33.0, 31.0, 31.0, 25.0, 33.0, 36.0, 39.0, 34.0, 57.0, 38.0, 44.0, 32.0, 32.0, 29.0, 29.0, 29.0, 41.0, 29.0, 25.0, 19.0, 22.0, 26.0, 22.0, 18.0, 13.0, 13.0, 15.0, 5.0, 5.0, 5.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.2069120407104492, -1.1689149141311646, -1.1309177875518799, -1.0929205417633057, -1.054923415184021, -1.0169262886047363, -0.9789291620254517, -0.940932035446167, -0.9029348492622375, -0.8649377226829529, -0.8269405364990234, -0.7889434099197388, -0.7509462833404541, -0.7129490971565247, -0.67495197057724, -0.6369547843933105, -0.5989576578140259, -0.5609605312347412, -0.5229633450508118, -0.4849662184715271, -0.44696906208992004, -0.408971905708313, -0.3709747791290283, -0.33297762274742126, -0.2949804663658142, -0.25698330998420715, -0.2189861685037613, -0.18098902702331543, -0.14299187064170837, -0.10499471426010132, -0.06699757277965546, -0.029000431299209595, 0.008996844291687012, 0.04699399322271347, 0.08499114215373993, 0.12298829108476639, 0.16098544001579285, 0.1989825963973999, 0.23697973787784576, 0.2749768793582916, 0.3129740357398987, 0.35097119212150574, 0.3889683485031128, 0.42696547508239746, 0.4649626314640045, 0.5029597878456116, 0.5409569144248962, 0.5789541006088257, 0.6169512271881104, 0.654948353767395, 0.6929455399513245, 0.7309426665306091, 0.7689398527145386, 0.8069369792938232, 0.8449341058731079, 0.8829312324523926, 0.920928418636322, 0.9589255452156067, 0.9969227313995361, 1.0349198579788208, 1.0729169845581055, 1.1109142303466797, 1.1489113569259644, 1.186908483505249, 1.2249056100845337]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 7.0, 15.0, 30.0, 50.0, 64.0, 91.0, 128.0, 182.0, 262.0, 395.0, 542.0, 821.0, 1252.0, 1646.0, 2448.0, 3622.0, 5289.0, 8239.0, 13292.0, 23755.0, 44950.0, 90126.0, 176948.0, 253952.0, 197700.0, 103022.0, 51098.0, 26496.0, 14908.0, 8950.0, 5837.0, 3943.0, 2659.0, 1816.0, 1269.0, 851.0, 558.0, 428.0, 316.0, 191.0, 130.0, 92.0, 50.0, 50.0, 23.0, 12.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21484375, -0.20804405212402344, -0.20124435424804688, -0.1944446563720703, -0.18764495849609375, -0.1808452606201172, -0.17404556274414062, -0.16724586486816406, -0.1604461669921875, -0.15364646911621094, -0.14684677124023438, -0.1400470733642578, -0.13324737548828125, -0.1264476776123047, -0.11964797973632812, -0.11284828186035156, -0.106048583984375, -0.09924888610839844, -0.09244918823242188, -0.08564949035644531, -0.07884979248046875, -0.07205009460449219, -0.06525039672851562, -0.05845069885253906, -0.0516510009765625, -0.04485130310058594, -0.038051605224609375, -0.03125190734863281, -0.02445220947265625, -0.017652511596679688, -0.010852813720703125, -0.0040531158447265625, 0.00274658203125, 0.009546279907226562, 0.016345977783203125, 0.023145675659179688, 0.02994537353515625, 0.03674507141113281, 0.043544769287109375, 0.05034446716308594, 0.0571441650390625, 0.06394386291503906, 0.07074356079101562, 0.07754325866699219, 0.08434295654296875, 0.09114265441894531, 0.09794235229492188, 0.10474205017089844, 0.111541748046875, 0.11834144592285156, 0.12514114379882812, 0.1319408416748047, 0.13874053955078125, 0.1455402374267578, 0.15233993530273438, 0.15913963317871094, 0.1659393310546875, 0.17273902893066406, 0.17953872680664062, 0.1863384246826172, 0.19313812255859375, 0.1999378204345703, 0.20673751831054688, 0.21353721618652344, 0.2203369140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 10.0, 4.0, 9.0, 12.0, 14.0, 17.0, 15.0, 17.0, 24.0, 14.0, 26.0, 21.0, 27.0, 29.0, 35.0, 34.0, 33.0, 36.0, 47.0, 37.0, 43.0, 36.0, 33.0, 41.0, 37.0, 41.0, 32.0, 45.0, 31.0, 17.0, 23.0, 21.0, 17.0, 19.0, 18.0, 14.0, 14.0, 9.0, 13.0, 7.0, 0.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2117919921875, -0.20562171936035156, -0.19945144653320312, -0.1932811737060547, -0.18711090087890625, -0.1809406280517578, -0.17477035522460938, -0.16860008239746094, -0.1624298095703125, -0.15625953674316406, -0.15008926391601562, -0.1439189910888672, -0.13774871826171875, -0.1315784454345703, -0.12540817260742188, -0.11923789978027344, -0.113067626953125, -0.10689735412597656, -0.10072708129882812, -0.09455680847167969, -0.08838653564453125, -0.08221626281738281, -0.07604598999023438, -0.06987571716308594, -0.0637054443359375, -0.05753517150878906, -0.051364898681640625, -0.04519462585449219, -0.03902435302734375, -0.03285408020019531, -0.026683807373046875, -0.020513534545898438, -0.01434326171875, -0.008172988891601562, -0.002002716064453125, 0.0041675567626953125, 0.01033782958984375, 0.016508102416992188, 0.022678375244140625, 0.028848648071289062, 0.0350189208984375, 0.04118919372558594, 0.047359466552734375, 0.05352973937988281, 0.05970001220703125, 0.06587028503417969, 0.07204055786132812, 0.07821083068847656, 0.084381103515625, 0.09055137634277344, 0.09672164916992188, 0.10289192199707031, 0.10906219482421875, 0.11523246765136719, 0.12140274047851562, 0.12757301330566406, 0.1337432861328125, 0.13991355895996094, 0.14608383178710938, 0.1522541046142578, 0.15842437744140625, 0.1645946502685547, 0.17076492309570312, 0.17693519592285156, 0.18310546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 12.0, 8.0, 20.0, 18.0, 26.0, 39.0, 44.0, 103.0, 166.0, 254.0, 407.0, 747.0, 1230.0, 2326.0, 4317.0, 8260.0, 16756.0, 36492.0, 90519.0, 227858.0, 338905.0, 187338.0, 72749.0, 30231.0, 14261.0, 7063.0, 3691.0, 1969.0, 1137.0, 628.0, 369.0, 220.0, 128.0, 85.0, 43.0, 40.0, 23.0, 25.0, 9.0, 9.0, 5.0, 5.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.30078125, -0.2908821105957031, -0.28098297119140625, -0.2710838317871094, -0.2611846923828125, -0.2512855529785156, -0.24138641357421875, -0.23148727416992188, -0.221588134765625, -0.21168899536132812, -0.20178985595703125, -0.19189071655273438, -0.1819915771484375, -0.17209243774414062, -0.16219329833984375, -0.15229415893554688, -0.14239501953125, -0.13249588012695312, -0.12259674072265625, -0.11269760131835938, -0.1027984619140625, -0.09289932250976562, -0.08300018310546875, -0.07310104370117188, -0.063201904296875, -0.053302764892578125, -0.04340362548828125, -0.033504486083984375, -0.0236053466796875, -0.013706207275390625, -0.00380706787109375, 0.006092071533203125, 0.0159912109375, 0.025890350341796875, 0.03578948974609375, 0.045688629150390625, 0.0555877685546875, 0.06548690795898438, 0.07538604736328125, 0.08528518676757812, 0.095184326171875, 0.10508346557617188, 0.11498260498046875, 0.12488174438476562, 0.1347808837890625, 0.14468002319335938, 0.15457916259765625, 0.16447830200195312, 0.17437744140625, 0.18427658081054688, 0.19417572021484375, 0.20407485961914062, 0.2139739990234375, 0.22387313842773438, 0.23377227783203125, 0.24367141723632812, 0.253570556640625, 0.2634696960449219, 0.27336883544921875, 0.2832679748535156, 0.2931671142578125, 0.3030662536621094, 0.31296539306640625, 0.3228645324707031, 0.332763671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 9.0, 21.0, 11.0, 20.0, 23.0, 28.0, 22.0, 23.0, 27.0, 35.0, 40.0, 41.0, 37.0, 50.0, 39.0, 50.0, 48.0, 44.0, 32.0, 47.0, 47.0, 40.0, 37.0, 35.0, 25.0, 35.0, 27.0, 21.0, 17.0, 9.0, 10.0, 10.0, 5.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.603515625, -0.58416748046875, -0.5648193359375, -0.54547119140625, -0.526123046875, -0.50677490234375, -0.4874267578125, -0.46807861328125, -0.44873046875, -0.42938232421875, -0.4100341796875, -0.39068603515625, -0.371337890625, -0.35198974609375, -0.3326416015625, -0.31329345703125, -0.2939453125, -0.27459716796875, -0.2552490234375, -0.23590087890625, -0.216552734375, -0.19720458984375, -0.1778564453125, -0.15850830078125, -0.13916015625, -0.11981201171875, -0.1004638671875, -0.08111572265625, -0.061767578125, -0.04241943359375, -0.0230712890625, -0.00372314453125, 0.015625, 0.03497314453125, 0.0543212890625, 0.07366943359375, 0.093017578125, 0.11236572265625, 0.1317138671875, 0.15106201171875, 0.17041015625, 0.18975830078125, 0.2091064453125, 0.22845458984375, 0.247802734375, 0.26715087890625, 0.2864990234375, 0.30584716796875, 0.3251953125, 0.34454345703125, 0.3638916015625, 0.38323974609375, 0.402587890625, 0.42193603515625, 0.4412841796875, 0.46063232421875, 0.47998046875, 0.49932861328125, 0.5186767578125, 0.53802490234375, 0.557373046875, 0.57672119140625, 0.5960693359375, 0.61541748046875, 0.634765625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 8.0, 13.0, 11.0, 24.0, 52.0, 82.0, 146.0, 353.0, 830.0, 2155.0, 6619.0, 21822.0, 83261.0, 355013.0, 429173.0, 108445.0, 27885.0, 8214.0, 2644.0, 986.0, 409.0, 174.0, 100.0, 64.0, 34.0, 12.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.2243328094482422, -0.21734237670898438, -0.21035194396972656, -0.20336151123046875, -0.19637107849121094, -0.18938064575195312, -0.1823902130126953, -0.1753997802734375, -0.1684093475341797, -0.16141891479492188, -0.15442848205566406, -0.14743804931640625, -0.14044761657714844, -0.13345718383789062, -0.1264667510986328, -0.119476318359375, -0.11248588562011719, -0.10549545288085938, -0.09850502014160156, -0.09151458740234375, -0.08452415466308594, -0.07753372192382812, -0.07054328918457031, -0.0635528564453125, -0.05656242370605469, -0.049571990966796875, -0.04258155822753906, -0.03559112548828125, -0.028600692749023438, -0.021610260009765625, -0.014619827270507812, -0.00762939453125, -0.0006389617919921875, 0.006351470947265625, 0.013341903686523438, 0.02033233642578125, 0.027322769165039062, 0.034313201904296875, 0.04130363464355469, 0.0482940673828125, 0.05528450012207031, 0.062274932861328125, 0.06926536560058594, 0.07625579833984375, 0.08324623107910156, 0.09023666381835938, 0.09722709655761719, 0.104217529296875, 0.11120796203613281, 0.11819839477539062, 0.12518882751464844, 0.13217926025390625, 0.13916969299316406, 0.14616012573242188, 0.1531505584716797, 0.1601409912109375, 0.1671314239501953, 0.17412185668945312, 0.18111228942871094, 0.18810272216796875, 0.19509315490722656, 0.20208358764648438, 0.2090740203857422, 0.216064453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 12.0, 15.0, 10.0, 13.0, 22.0, 24.0, 36.0, 46.0, 65.0, 100.0, 108.0, 94.0, 101.0, 85.0, 72.0, 43.0, 31.0, 28.0, 20.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3795833587646484e-05, -3.264378756284714e-05, -3.149174153804779e-05, -3.0339695513248444e-05, -2.9187649488449097e-05, -2.803560346364975e-05, -2.6883557438850403e-05, -2.5731511414051056e-05, -2.457946538925171e-05, -2.3427419364452362e-05, -2.2275373339653015e-05, -2.1123327314853668e-05, -1.997128129005432e-05, -1.8819235265254974e-05, -1.7667189240455627e-05, -1.651514321565628e-05, -1.5363097190856934e-05, -1.4211051166057587e-05, -1.305900514125824e-05, -1.1906959116458893e-05, -1.0754913091659546e-05, -9.602867066860199e-06, -8.450821042060852e-06, -7.298775017261505e-06, -6.146728992462158e-06, -4.994682967662811e-06, -3.842636942863464e-06, -2.6905909180641174e-06, -1.5385448932647705e-06, -3.864988684654236e-07, 7.655471563339233e-07, 1.9175931811332703e-06, 3.069639205932617e-06, 4.221685230731964e-06, 5.373731255531311e-06, 6.525777280330658e-06, 7.677823305130005e-06, 8.829869329929352e-06, 9.981915354728699e-06, 1.1133961379528046e-05, 1.2286007404327393e-05, 1.343805342912674e-05, 1.4590099453926086e-05, 1.5742145478725433e-05, 1.689419150352478e-05, 1.8046237528324127e-05, 1.9198283553123474e-05, 2.035032957792282e-05, 2.1502375602722168e-05, 2.2654421627521515e-05, 2.3806467652320862e-05, 2.495851367712021e-05, 2.6110559701919556e-05, 2.7262605726718903e-05, 2.841465175151825e-05, 2.9566697776317596e-05, 3.071874380111694e-05, 3.187078982591629e-05, 3.302283585071564e-05, 3.4174881875514984e-05, 3.532692790031433e-05, 3.647897392511368e-05, 3.7631019949913025e-05, 3.878306597471237e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 15.0, 13.0, 17.0, 23.0, 33.0, 68.0, 101.0, 175.0, 293.0, 521.0, 1083.0, 2112.0, 4806.0, 12125.0, 32927.0, 95059.0, 262786.0, 367316.0, 173603.0, 59655.0, 21227.0, 8060.0, 3356.0, 1471.0, 773.0, 390.0, 182.0, 118.0, 72.0, 50.0, 52.0, 25.0, 17.0, 8.0, 7.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.147705078125, -0.14248275756835938, -0.13726043701171875, -0.13203811645507812, -0.1268157958984375, -0.12159347534179688, -0.11637115478515625, -0.11114883422851562, -0.105926513671875, -0.10070419311523438, -0.09548187255859375, -0.09025955200195312, -0.0850372314453125, -0.07981491088867188, -0.07459259033203125, -0.06937026977539062, -0.06414794921875, -0.058925628662109375, -0.05370330810546875, -0.048480987548828125, -0.0432586669921875, -0.038036346435546875, -0.03281402587890625, -0.027591705322265625, -0.022369384765625, -0.017147064208984375, -0.01192474365234375, -0.006702423095703125, -0.0014801025390625, 0.003742218017578125, 0.00896453857421875, 0.014186859130859375, 0.0194091796875, 0.024631500244140625, 0.02985382080078125, 0.035076141357421875, 0.0402984619140625, 0.045520782470703125, 0.05074310302734375, 0.055965423583984375, 0.061187744140625, 0.06641006469726562, 0.07163238525390625, 0.07685470581054688, 0.0820770263671875, 0.08729934692382812, 0.09252166748046875, 0.09774398803710938, 0.10296630859375, 0.10818862915039062, 0.11341094970703125, 0.11863327026367188, 0.1238555908203125, 0.12907791137695312, 0.13430023193359375, 0.13952255249023438, 0.144744873046875, 0.14996719360351562, 0.15518951416015625, 0.16041183471679688, 0.1656341552734375, 0.17085647583007812, 0.17607879638671875, 0.18130111694335938, 0.1865234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 9.0, 12.0, 13.0, 7.0, 19.0, 22.0, 20.0, 32.0, 46.0, 43.0, 63.0, 73.0, 73.0, 89.0, 72.0, 71.0, 72.0, 41.0, 45.0, 30.0, 29.0, 23.0, 20.0, 14.0, 12.0, 8.0, 6.0, 2.0, 6.0, 6.0, 5.0, 4.0, 0.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12167739868164062, -0.11652374267578125, -0.11137008666992188, -0.1062164306640625, -0.10106277465820312, -0.09590911865234375, -0.09075546264648438, -0.085601806640625, -0.08044815063476562, -0.07529449462890625, -0.07014083862304688, -0.0649871826171875, -0.059833526611328125, -0.05467987060546875, -0.049526214599609375, -0.04437255859375, -0.039218902587890625, -0.03406524658203125, -0.028911590576171875, -0.0237579345703125, -0.018604278564453125, -0.01345062255859375, -0.008296966552734375, -0.003143310546875, 0.002010345458984375, 0.00716400146484375, 0.012317657470703125, 0.0174713134765625, 0.022624969482421875, 0.02777862548828125, 0.032932281494140625, 0.0380859375, 0.043239593505859375, 0.04839324951171875, 0.053546905517578125, 0.0587005615234375, 0.06385421752929688, 0.06900787353515625, 0.07416152954101562, 0.079315185546875, 0.08446884155273438, 0.08962249755859375, 0.09477615356445312, 0.0999298095703125, 0.10508346557617188, 0.11023712158203125, 0.11539077758789062, 0.12054443359375, 0.12569808959960938, 0.13085174560546875, 0.13600540161132812, 0.1411590576171875, 0.14631271362304688, 0.15146636962890625, 0.15662002563476562, 0.161773681640625, 0.16692733764648438, 0.17208099365234375, 0.17723464965820312, 0.1823883056640625, 0.18754196166992188, 0.19269561767578125, 0.19784927368164062, 0.2030029296875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 14.0, 24.0, 37.0, 94.0, 134.0, 161.0, 159.0, 144.0, 93.0, 64.0, 40.0, 13.0, 9.0, 6.0, 1.0, 4.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5153822898864746, -2.4366567134857178, -2.357931137084961, -2.279205560684204, -2.2004799842834473, -2.1217546463012695, -2.0430290699005127, -1.9643034934997559, -1.885577917098999, -1.8068523406982422, -1.7281267642974854, -1.649401307106018, -1.5706757307052612, -1.4919501543045044, -1.413224697113037, -1.3344991207122803, -1.2557735443115234, -1.1770479679107666, -1.0983223915100098, -1.0195969343185425, -0.9408713579177856, -0.8621457815170288, -0.7834202647209167, -0.7046947479248047, -0.6259691715240479, -0.547243595123291, -0.46851807832717896, -0.3897925317287445, -0.31106698513031006, -0.2323414385318756, -0.15361589193344116, -0.0748903751373291, 0.0038352012634277344, 0.08256074786186218, 0.16128629446029663, 0.24001184105873108, 0.3187373876571655, 0.3974629342556, 0.4761884808540344, 0.5549139976501465, 0.6336395740509033, 0.7123651504516602, 0.7910906672477722, 0.8698161840438843, 0.9485417604446411, 1.027267336845398, 1.1059927940368652, 1.184718370437622, 1.263443946838379, 1.3421695232391357, 1.4208950996398926, 1.4996205568313599, 1.5783461332321167, 1.6570717096328735, 1.7357971668243408, 1.8145227432250977, 1.8932483196258545, 1.9719738960266113, 2.050699472427368, 2.129425048828125, 2.2081503868103027, 2.2868759632110596, 2.3656015396118164, 2.4443271160125732, 2.52305269241333]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 10.0, 12.0, 15.0, 10.0, 14.0, 14.0, 19.0, 16.0, 20.0, 24.0, 44.0, 29.0, 28.0, 32.0, 34.0, 43.0, 34.0, 32.0, 31.0, 47.0, 27.0, 48.0, 38.0, 42.0, 24.0, 26.0, 31.0, 30.0, 26.0, 21.0, 27.0, 19.0, 22.0, 19.0, 16.0, 11.0, 9.0, 6.0, 7.0, 8.0, 6.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.3916316032409668, -1.3497425317764282, -1.3078535795211792, -1.2659645080566406, -1.224075436592102, -1.182186484336853, -1.1402974128723145, -1.0984084606170654, -1.0565193891525269, -1.0146303176879883, -0.9727413058280945, -0.9308522939682007, -0.8889632821083069, -0.8470742702484131, -0.8051851987838745, -0.7632961869239807, -0.7214071154594421, -0.6795181035995483, -0.6376290321350098, -0.595740020275116, -0.5538510084152222, -0.5119619369506836, -0.4700729250907898, -0.428183913230896, -0.3862948715686798, -0.3444058299064636, -0.3025168180465698, -0.26062777638435364, -0.21873874962329865, -0.17684972286224365, -0.13496068120002747, -0.09307166934013367, -0.05118262767791748, -0.00929359719157219, 0.0325954332947731, 0.07448446750640869, 0.11637349426746368, 0.15826252102851868, 0.20015156269073486, 0.24204057455062866, 0.28392961621284485, 0.32581865787506104, 0.36770766973495483, 0.409596711397171, 0.4514857530593872, 0.493374764919281, 0.5352637767791748, 0.5771528482437134, 0.6190418601036072, 0.660930871963501, 0.7028199434280396, 0.7447089552879333, 0.7865979671478271, 0.8284870386123657, 0.8703760504722595, 0.9122650623321533, 0.9541541337966919, 0.9960431456565857, 1.0379321575164795, 1.079821228981018, 1.1217103004455566, 1.1635992527008057, 1.2054883241653442, 1.2473773956298828, 1.2892663478851318]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 8.0, 5.0, 13.0, 11.0, 18.0, 26.0, 31.0, 50.0, 101.0, 157.0, 276.0, 541.0, 953.0, 2025.0, 4021.0, 8592.0, 18406.0, 41505.0, 98964.0, 271433.0, 937431.0, 1780271.0, 680126.0, 208386.0, 79200.0, 33472.0, 14715.0, 6788.0, 3233.0, 1628.0, 801.0, 448.0, 250.0, 142.0, 94.0, 45.0, 48.0, 22.0, 15.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28841400146484375, -0.2792205810546875, -0.27002716064453125, -0.260833740234375, -0.25164031982421875, -0.2424468994140625, -0.23325347900390625, -0.22406005859375, -0.21486663818359375, -0.2056732177734375, -0.19647979736328125, -0.187286376953125, -0.17809295654296875, -0.1688995361328125, -0.15970611572265625, -0.1505126953125, -0.14131927490234375, -0.1321258544921875, -0.12293243408203125, -0.113739013671875, -0.10454559326171875, -0.0953521728515625, -0.08615875244140625, -0.07696533203125, -0.06777191162109375, -0.0585784912109375, -0.04938507080078125, -0.040191650390625, -0.03099822998046875, -0.0218048095703125, -0.01261138916015625, -0.00341796875, 0.00577545166015625, 0.0149688720703125, 0.02416229248046875, 0.033355712890625, 0.04254913330078125, 0.0517425537109375, 0.06093597412109375, 0.07012939453125, 0.07932281494140625, 0.0885162353515625, 0.09770965576171875, 0.106903076171875, 0.11609649658203125, 0.1252899169921875, 0.13448333740234375, 0.1436767578125, 0.15287017822265625, 0.1620635986328125, 0.17125701904296875, 0.180450439453125, 0.18964385986328125, 0.1988372802734375, 0.20803070068359375, 0.21722412109375, 0.22641754150390625, 0.2356109619140625, 0.24480438232421875, 0.253997802734375, 0.26319122314453125, 0.2723846435546875, 0.28157806396484375, 0.290771484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 1.0, 5.0, 4.0, 5.0, 8.0, 3.0, 6.0, 13.0, 14.0, 14.0, 12.0, 23.0, 20.0, 22.0, 31.0, 38.0, 28.0, 13.0, 34.0, 35.0, 32.0, 43.0, 41.0, 34.0, 43.0, 49.0, 40.0, 37.0, 41.0, 40.0, 34.0, 30.0, 26.0, 27.0, 20.0, 15.0, 23.0, 12.0, 17.0, 15.0, 11.0, 7.0, 5.0, 7.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.19580078125, -0.18971633911132812, -0.18363189697265625, -0.17754745483398438, -0.1714630126953125, -0.16537857055664062, -0.15929412841796875, -0.15320968627929688, -0.147125244140625, -0.14104080200195312, -0.13495635986328125, -0.12887191772460938, -0.1227874755859375, -0.11670303344726562, -0.11061859130859375, -0.10453414916992188, -0.09844970703125, -0.09236526489257812, -0.08628082275390625, -0.08019638061523438, -0.0741119384765625, -0.06802749633789062, -0.06194305419921875, -0.055858612060546875, -0.049774169921875, -0.043689727783203125, -0.03760528564453125, -0.031520843505859375, -0.0254364013671875, -0.019351959228515625, -0.01326751708984375, -0.007183074951171875, -0.0010986328125, 0.004985809326171875, 0.01107025146484375, 0.017154693603515625, 0.0232391357421875, 0.029323577880859375, 0.03540802001953125, 0.041492462158203125, 0.047576904296875, 0.053661346435546875, 0.05974578857421875, 0.06583023071289062, 0.0719146728515625, 0.07799911499023438, 0.08408355712890625, 0.09016799926757812, 0.09625244140625, 0.10233688354492188, 0.10842132568359375, 0.11450576782226562, 0.1205902099609375, 0.12667465209960938, 0.13275909423828125, 0.13884353637695312, 0.144927978515625, 0.15101242065429688, 0.15709686279296875, 0.16318130493164062, 0.1692657470703125, 0.17535018920898438, 0.18143463134765625, 0.18751907348632812, 0.193603515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 17.0, 28.0, 34.0, 52.0, 72.0, 106.0, 182.0, 279.0, 452.0, 688.0, 1256.0, 2259.0, 3956.0, 7229.0, 13575.0, 26076.0, 50996.0, 106618.0, 240051.0, 667001.0, 1700238.0, 844365.0, 284393.0, 123656.0, 58403.0, 29152.0, 15126.0, 7986.0, 4274.0, 2287.0, 1384.0, 786.0, 482.0, 292.0, 184.0, 106.0, 74.0, 52.0, 32.0, 24.0, 12.0, 14.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.25537109375, -0.2470245361328125, -0.238677978515625, -0.2303314208984375, -0.22198486328125, -0.2136383056640625, -0.205291748046875, -0.1969451904296875, -0.1885986328125, -0.1802520751953125, -0.171905517578125, -0.1635589599609375, -0.15521240234375, -0.1468658447265625, -0.138519287109375, -0.1301727294921875, -0.121826171875, -0.1134796142578125, -0.105133056640625, -0.0967864990234375, -0.08843994140625, -0.0800933837890625, -0.071746826171875, -0.0634002685546875, -0.0550537109375, -0.0467071533203125, -0.038360595703125, -0.0300140380859375, -0.02166748046875, -0.0133209228515625, -0.004974365234375, 0.0033721923828125, 0.01171875, 0.0200653076171875, 0.028411865234375, 0.0367584228515625, 0.04510498046875, 0.0534515380859375, 0.061798095703125, 0.0701446533203125, 0.0784912109375, 0.0868377685546875, 0.095184326171875, 0.1035308837890625, 0.11187744140625, 0.1202239990234375, 0.128570556640625, 0.1369171142578125, 0.145263671875, 0.1536102294921875, 0.161956787109375, 0.1703033447265625, 0.17864990234375, 0.1869964599609375, 0.195343017578125, 0.2036895751953125, 0.2120361328125, 0.2203826904296875, 0.228729248046875, 0.2370758056640625, 0.24542236328125, 0.2537689208984375, 0.262115478515625, 0.2704620361328125, 0.27880859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 4.0, 7.0, 14.0, 7.0, 11.0, 21.0, 33.0, 30.0, 45.0, 57.0, 51.0, 84.0, 84.0, 120.0, 175.0, 230.0, 307.0, 430.0, 491.0, 488.0, 366.0, 237.0, 193.0, 129.0, 93.0, 75.0, 52.0, 45.0, 32.0, 43.0, 27.0, 15.0, 17.0, 14.0, 5.0, 8.0, 3.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.42626953125, -0.414337158203125, -0.40240478515625, -0.390472412109375, -0.3785400390625, -0.366607666015625, -0.35467529296875, -0.342742919921875, -0.330810546875, -0.318878173828125, -0.30694580078125, -0.295013427734375, -0.2830810546875, -0.271148681640625, -0.25921630859375, -0.247283935546875, -0.2353515625, -0.223419189453125, -0.21148681640625, -0.199554443359375, -0.1876220703125, -0.175689697265625, -0.16375732421875, -0.151824951171875, -0.139892578125, -0.127960205078125, -0.11602783203125, -0.104095458984375, -0.0921630859375, -0.080230712890625, -0.06829833984375, -0.056365966796875, -0.04443359375, -0.032501220703125, -0.02056884765625, -0.008636474609375, 0.0032958984375, 0.015228271484375, 0.02716064453125, 0.039093017578125, 0.051025390625, 0.062957763671875, 0.07489013671875, 0.086822509765625, 0.0987548828125, 0.110687255859375, 0.12261962890625, 0.134552001953125, 0.146484375, 0.158416748046875, 0.17034912109375, 0.182281494140625, 0.1942138671875, 0.206146240234375, 0.21807861328125, 0.230010986328125, 0.241943359375, 0.253875732421875, 0.26580810546875, 0.277740478515625, 0.2896728515625, 0.301605224609375, 0.31353759765625, 0.325469970703125, 0.33740234375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 16.0, 20.0, 23.0, 32.0, 49.0, 62.0, 96.0, 87.0, 108.0, 101.0, 93.0, 72.0, 66.0, 43.0, 36.0, 30.0, 18.0, 5.0, 11.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.531419038772583, -2.465644598007202, -2.399869918823242, -2.3340954780578613, -2.2683210372924805, -2.2025465965270996, -2.1367721557617188, -2.070997476577759, -2.005223035812378, -1.939448595046997, -1.8736740350723267, -1.8078994750976562, -1.7421250343322754, -1.6763505935668945, -1.6105760335922241, -1.5448014736175537, -1.4790270328521729, -1.413252592086792, -1.3474780321121216, -1.2817034721374512, -1.2159290313720703, -1.1501545906066895, -1.084380030632019, -1.0186054706573486, -0.9528310298919678, -0.8870565295219421, -0.8212820291519165, -0.7555075287818909, -0.6897330284118652, -0.6239585280418396, -0.558184027671814, -0.49240952730178833, -0.4266350269317627, -0.36086052656173706, -0.2950860261917114, -0.2293115258216858, -0.16353702545166016, -0.09776252508163452, -0.03198802471160889, 0.03378647565841675, 0.09956097602844238, 0.16533547639846802, 0.23110997676849365, 0.2968844771385193, 0.3626589775085449, 0.42843347787857056, 0.4942079782485962, 0.5599824786186218, 0.6257569789886475, 0.6915314793586731, 0.7573059797286987, 0.8230804800987244, 0.88885498046875, 0.9546294808387756, 1.0204039812088013, 1.0861785411834717, 1.1519529819488525, 1.2177274227142334, 1.2835019826889038, 1.3492765426635742, 1.415050983428955, 1.480825424194336, 1.5465999841690063, 1.6123745441436768, 1.6781489849090576]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 4.0, 8.0, 7.0, 12.0, 6.0, 12.0, 5.0, 11.0, 24.0, 14.0, 23.0, 27.0, 31.0, 28.0, 20.0, 28.0, 23.0, 34.0, 43.0, 47.0, 29.0, 38.0, 37.0, 42.0, 38.0, 34.0, 34.0, 39.0, 23.0, 33.0, 33.0, 24.0, 31.0, 21.0, 13.0, 24.0, 17.0, 18.0, 12.0, 4.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2270749807357788, -1.1858819723129272, -1.1446889638900757, -1.1034959554672241, -1.0623029470443726, -1.021109938621521, -0.9799169898033142, -0.9387239813804626, -0.8975309729576111, -0.8563379645347595, -0.815144956111908, -0.7739519476890564, -0.7327589988708496, -0.691565990447998, -0.6503729820251465, -0.6091799736022949, -0.5679869651794434, -0.5267939567565918, -0.48560094833374023, -0.44440796971321106, -0.4032149612903595, -0.36202195286750793, -0.32082897424697876, -0.2796359658241272, -0.23844295740127563, -0.19724994897842407, -0.1560569554567337, -0.11486395448446274, -0.07367095351219177, -0.03247794508934021, 0.008715048432350159, 0.04990804195404053, 0.09110116958618164, 0.1322941780090332, 0.17348717153072357, 0.21468016505241394, 0.2558731734752655, 0.29706618189811707, 0.33825916051864624, 0.3794521689414978, 0.42064517736434937, 0.4618381857872009, 0.5030311942100525, 0.544224202632904, 0.5854171514511108, 0.6266101598739624, 0.667803168296814, 0.7089961767196655, 0.7501891851425171, 0.7913821935653687, 0.8325752019882202, 0.8737682104110718, 0.9149612188339233, 0.9561542272567749, 0.9973471760749817, 1.0385401248931885, 1.07973313331604, 1.1209261417388916, 1.1621191501617432, 1.2033121585845947, 1.2445051670074463, 1.2856981754302979, 1.3268911838531494, 1.368084192276001, 1.4092772006988525]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 17.0, 16.0, 35.0, 46.0, 69.0, 130.0, 178.0, 272.0, 385.0, 582.0, 834.0, 1220.0, 1820.0, 2692.0, 3862.0, 5601.0, 8376.0, 12793.0, 21410.0, 42164.0, 114587.0, 313505.0, 307170.0, 110726.0, 40973.0, 20718.0, 12505.0, 8226.0, 5491.0, 3832.0, 2695.0, 1805.0, 1259.0, 796.0, 612.0, 385.0, 257.0, 180.0, 107.0, 75.0, 45.0, 31.0, 21.0, 15.0, 10.0, 5.0, 5.0, 3.0, 4.0], "bins": [-0.38134765625, -0.3710365295410156, -0.36072540283203125, -0.3504142761230469, -0.3401031494140625, -0.3297920227050781, -0.31948089599609375, -0.3091697692871094, -0.298858642578125, -0.2885475158691406, -0.27823638916015625, -0.2679252624511719, -0.2576141357421875, -0.24730300903320312, -0.23699188232421875, -0.22668075561523438, -0.21636962890625, -0.20605850219726562, -0.19574737548828125, -0.18543624877929688, -0.1751251220703125, -0.16481399536132812, -0.15450286865234375, -0.14419174194335938, -0.133880615234375, -0.12356948852539062, -0.11325836181640625, -0.10294723510742188, -0.0926361083984375, -0.08232498168945312, -0.07201385498046875, -0.061702728271484375, -0.0513916015625, -0.041080474853515625, -0.03076934814453125, -0.020458221435546875, -0.0101470947265625, 0.000164031982421875, 0.01047515869140625, 0.020786285400390625, 0.031097412109375, 0.041408538818359375, 0.05171966552734375, 0.062030792236328125, 0.0723419189453125, 0.08265304565429688, 0.09296417236328125, 0.10327529907226562, 0.11358642578125, 0.12389755249023438, 0.13420867919921875, 0.14451980590820312, 0.1548309326171875, 0.16514205932617188, 0.17545318603515625, 0.18576431274414062, 0.196075439453125, 0.20638656616210938, 0.21669769287109375, 0.22700881958007812, 0.2373199462890625, 0.24763107299804688, 0.25794219970703125, 0.2682533264160156, 0.278564453125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 6.0, 6.0, 9.0, 13.0, 13.0, 19.0, 17.0, 18.0, 18.0, 24.0, 33.0, 33.0, 22.0, 36.0, 38.0, 43.0, 42.0, 41.0, 47.0, 54.0, 31.0, 46.0, 38.0, 44.0, 23.0, 49.0, 30.0, 29.0, 22.0, 17.0, 24.0, 17.0, 13.0, 12.0, 11.0, 9.0, 8.0, 4.0, 10.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.19287109375, -0.1864147186279297, -0.17995834350585938, -0.17350196838378906, -0.16704559326171875, -0.16058921813964844, -0.15413284301757812, -0.1476764678955078, -0.1412200927734375, -0.1347637176513672, -0.12830734252929688, -0.12185096740722656, -0.11539459228515625, -0.10893821716308594, -0.10248184204101562, -0.09602546691894531, -0.089569091796875, -0.08311271667480469, -0.07665634155273438, -0.07019996643066406, -0.06374359130859375, -0.05728721618652344, -0.050830841064453125, -0.04437446594238281, -0.0379180908203125, -0.03146171569824219, -0.025005340576171875, -0.018548965454101562, -0.01209259033203125, -0.0056362152099609375, 0.000820159912109375, 0.0072765350341796875, 0.01373291015625, 0.020189285278320312, 0.026645660400390625, 0.03310203552246094, 0.03955841064453125, 0.04601478576660156, 0.052471160888671875, 0.05892753601074219, 0.0653839111328125, 0.07184028625488281, 0.07829666137695312, 0.08475303649902344, 0.09120941162109375, 0.09766578674316406, 0.10412216186523438, 0.11057853698730469, 0.117034912109375, 0.12349128723144531, 0.12994766235351562, 0.13640403747558594, 0.14286041259765625, 0.14931678771972656, 0.15577316284179688, 0.1622295379638672, 0.1686859130859375, 0.1751422882080078, 0.18159866333007812, 0.18805503845214844, 0.19451141357421875, 0.20096778869628906, 0.20742416381835938, 0.2138805389404297, 0.2203369140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 13.0, 16.0, 25.0, 26.0, 71.0, 99.0, 153.0, 293.0, 646.0, 1376.0, 3429.0, 9889.0, 30628.0, 118171.0, 585835.0, 228245.0, 46696.0, 14600.0, 4857.0, 1747.0, 791.0, 405.0, 216.0, 119.0, 69.0, 55.0, 20.0, 17.0, 11.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.7713470458984375, -0.749725341796875, -0.7281036376953125, -0.70648193359375, -0.6848602294921875, -0.663238525390625, -0.6416168212890625, -0.6199951171875, -0.5983734130859375, -0.576751708984375, -0.5551300048828125, -0.53350830078125, -0.5118865966796875, -0.490264892578125, -0.4686431884765625, -0.447021484375, -0.4253997802734375, -0.403778076171875, -0.3821563720703125, -0.36053466796875, -0.3389129638671875, -0.317291259765625, -0.2956695556640625, -0.2740478515625, -0.2524261474609375, -0.230804443359375, -0.2091827392578125, -0.18756103515625, -0.1659393310546875, -0.144317626953125, -0.1226959228515625, -0.10107421875, -0.0794525146484375, -0.057830810546875, -0.0362091064453125, -0.01458740234375, 0.0070343017578125, 0.028656005859375, 0.0502777099609375, 0.0718994140625, 0.0935211181640625, 0.115142822265625, 0.1367645263671875, 0.15838623046875, 0.1800079345703125, 0.201629638671875, 0.2232513427734375, 0.244873046875, 0.2664947509765625, 0.288116455078125, 0.3097381591796875, 0.33135986328125, 0.3529815673828125, 0.374603271484375, 0.3962249755859375, 0.4178466796875, 0.4394683837890625, 0.461090087890625, 0.4827117919921875, 0.50433349609375, 0.5259552001953125, 0.547576904296875, 0.5691986083984375, 0.5908203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 3.0, 10.0, 3.0, 8.0, 6.0, 13.0, 13.0, 15.0, 15.0, 27.0, 26.0, 23.0, 33.0, 35.0, 33.0, 40.0, 57.0, 51.0, 49.0, 50.0, 47.0, 45.0, 39.0, 35.0, 36.0, 43.0, 36.0, 30.0, 26.0, 35.0, 25.0, 11.0, 14.0, 15.0, 5.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6295700073242188, -0.6097259521484375, -0.5898818969726562, -0.570037841796875, -0.5501937866210938, -0.5303497314453125, -0.5105056762695312, -0.49066162109375, -0.47081756591796875, -0.4509735107421875, -0.43112945556640625, -0.411285400390625, -0.39144134521484375, -0.3715972900390625, -0.35175323486328125, -0.3319091796875, -0.31206512451171875, -0.2922210693359375, -0.27237701416015625, -0.252532958984375, -0.23268890380859375, -0.2128448486328125, -0.19300079345703125, -0.17315673828125, -0.15331268310546875, -0.1334686279296875, -0.11362457275390625, -0.093780517578125, -0.07393646240234375, -0.0540924072265625, -0.03424835205078125, -0.014404296875, 0.00543975830078125, 0.0252838134765625, 0.04512786865234375, 0.064971923828125, 0.08481597900390625, 0.1046600341796875, 0.12450408935546875, 0.14434814453125, 0.16419219970703125, 0.1840362548828125, 0.20388031005859375, 0.223724365234375, 0.24356842041015625, 0.2634124755859375, 0.28325653076171875, 0.3031005859375, 0.32294464111328125, 0.3427886962890625, 0.36263275146484375, 0.382476806640625, 0.40232086181640625, 0.4221649169921875, 0.44200897216796875, 0.46185302734375, 0.48169708251953125, 0.5015411376953125, 0.5213851928710938, 0.541229248046875, 0.5610733032226562, 0.5809173583984375, 0.6007614135742188, 0.62060546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 10.0, 6.0, 16.0, 20.0, 23.0, 42.0, 48.0, 68.0, 107.0, 175.0, 259.0, 418.0, 628.0, 964.0, 1570.0, 2568.0, 4377.0, 8299.0, 17082.0, 44070.0, 136544.0, 366386.0, 301746.0, 99394.0, 33373.0, 13801.0, 6787.0, 3735.0, 2243.0, 1368.0, 853.0, 542.0, 337.0, 235.0, 154.0, 92.0, 72.0, 46.0, 26.0, 20.0, 17.0, 13.0, 8.0, 8.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1427001953125, -0.13822174072265625, -0.1337432861328125, -0.12926483154296875, -0.124786376953125, -0.12030792236328125, -0.1158294677734375, -0.11135101318359375, -0.10687255859375, -0.10239410400390625, -0.0979156494140625, -0.09343719482421875, -0.088958740234375, -0.08448028564453125, -0.0800018310546875, -0.07552337646484375, -0.071044921875, -0.06656646728515625, -0.0620880126953125, -0.05760955810546875, -0.053131103515625, -0.04865264892578125, -0.0441741943359375, -0.03969573974609375, -0.03521728515625, -0.03073883056640625, -0.0262603759765625, -0.02178192138671875, -0.017303466796875, -0.01282501220703125, -0.0083465576171875, -0.00386810302734375, 0.0006103515625, 0.00508880615234375, 0.0095672607421875, 0.01404571533203125, 0.018524169921875, 0.02300262451171875, 0.0274810791015625, 0.03195953369140625, 0.03643798828125, 0.04091644287109375, 0.0453948974609375, 0.04987335205078125, 0.054351806640625, 0.05883026123046875, 0.0633087158203125, 0.06778717041015625, 0.072265625, 0.07674407958984375, 0.0812225341796875, 0.08570098876953125, 0.090179443359375, 0.09465789794921875, 0.0991363525390625, 0.10361480712890625, 0.10809326171875, 0.11257171630859375, 0.1170501708984375, 0.12152862548828125, 0.126007080078125, 0.13048553466796875, 0.1349639892578125, 0.13944244384765625, 0.1439208984375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 10.0, 11.0, 8.0, 20.0, 29.0, 81.0, 206.0, 288.0, 184.0, 74.0, 30.0, 16.0, 13.0, 13.0, 12.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011712312698364258, -0.00011381600052118301, -0.00011050887405872345, -0.00010720174759626389, -0.00010389462113380432, -0.00010058749467134476, -9.728036820888519e-05, -9.397324174642563e-05, -9.066611528396606e-05, -8.73589888215065e-05, -8.405186235904694e-05, -8.074473589658737e-05, -7.743760943412781e-05, -7.413048297166824e-05, -7.082335650920868e-05, -6.751623004674911e-05, -6.420910358428955e-05, -6.0901977121829987e-05, -5.759485065937042e-05, -5.428772419691086e-05, -5.0980597734451294e-05, -4.767347127199173e-05, -4.4366344809532166e-05, -4.10592183470726e-05, -3.775209188461304e-05, -3.444496542215347e-05, -3.113783895969391e-05, -2.7830712497234344e-05, -2.452358603477478e-05, -2.1216459572315216e-05, -1.7909333109855652e-05, -1.4602206647396088e-05, -1.1295080184936523e-05, -7.98795372247696e-06, -4.680827260017395e-06, -1.3737007975578308e-06, 1.9334256649017334e-06, 5.240552127361298e-06, 8.547678589820862e-06, 1.1854805052280426e-05, 1.516193151473999e-05, 1.8469057977199554e-05, 2.177618443965912e-05, 2.5083310902118683e-05, 2.8390437364578247e-05, 3.169756382703781e-05, 3.5004690289497375e-05, 3.831181675195694e-05, 4.1618943214416504e-05, 4.492606967687607e-05, 4.823319613933563e-05, 5.1540322601795197e-05, 5.484744906425476e-05, 5.8154575526714325e-05, 6.146170198917389e-05, 6.476882845163345e-05, 6.807595491409302e-05, 7.138308137655258e-05, 7.469020783901215e-05, 7.799733430147171e-05, 8.130446076393127e-05, 8.461158722639084e-05, 8.79187136888504e-05, 9.122584015130997e-05, 9.453296661376953e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 14.0, 10.0, 20.0, 15.0, 35.0, 47.0, 78.0, 101.0, 225.0, 305.0, 556.0, 1057.0, 2032.0, 4114.0, 8655.0, 20115.0, 53294.0, 155028.0, 332752.0, 287060.0, 113676.0, 39857.0, 15522.0, 6963.0, 3280.0, 1611.0, 955.0, 436.0, 257.0, 160.0, 108.0, 72.0, 35.0, 30.0, 32.0, 13.0, 15.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.13623046875, -0.13208389282226562, -0.12793731689453125, -0.12379074096679688, -0.1196441650390625, -0.11549758911132812, -0.11135101318359375, -0.10720443725585938, -0.103057861328125, -0.09891128540039062, -0.09476470947265625, -0.09061813354492188, -0.0864715576171875, -0.08232498168945312, -0.07817840576171875, -0.07403182983398438, -0.06988525390625, -0.06573867797851562, -0.06159210205078125, -0.057445526123046875, -0.0532989501953125, -0.049152374267578125, -0.04500579833984375, -0.040859222412109375, -0.036712646484375, -0.032566070556640625, -0.02841949462890625, -0.024272918701171875, -0.0201263427734375, -0.015979766845703125, -0.01183319091796875, -0.007686614990234375, -0.0035400390625, 0.000606536865234375, 0.00475311279296875, 0.008899688720703125, 0.0130462646484375, 0.017192840576171875, 0.02133941650390625, 0.025485992431640625, 0.029632568359375, 0.033779144287109375, 0.03792572021484375, 0.042072296142578125, 0.0462188720703125, 0.050365447998046875, 0.05451202392578125, 0.058658599853515625, 0.06280517578125, 0.06695175170898438, 0.07109832763671875, 0.07524490356445312, 0.0793914794921875, 0.08353805541992188, 0.08768463134765625, 0.09183120727539062, 0.095977783203125, 0.10012435913085938, 0.10427093505859375, 0.10841751098632812, 0.1125640869140625, 0.11671066284179688, 0.12085723876953125, 0.12500381469726562, 0.129150390625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 10.0, 14.0, 14.0, 19.0, 19.0, 14.0, 39.0, 37.0, 52.0, 55.0, 57.0, 76.0, 82.0, 64.0, 58.0, 55.0, 55.0, 47.0, 56.0, 27.0, 36.0, 25.0, 12.0, 16.0, 9.0, 6.0, 3.0, 3.0, 9.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11749267578125, -0.1131582260131836, -0.10882377624511719, -0.10448932647705078, -0.10015487670898438, -0.09582042694091797, -0.09148597717285156, -0.08715152740478516, -0.08281707763671875, -0.07848262786865234, -0.07414817810058594, -0.06981372833251953, -0.06547927856445312, -0.06114482879638672, -0.05681037902832031, -0.052475929260253906, -0.0481414794921875, -0.043807029724121094, -0.03947257995605469, -0.03513813018798828, -0.030803680419921875, -0.02646923065185547, -0.022134780883789062, -0.017800331115722656, -0.01346588134765625, -0.009131431579589844, -0.0047969818115234375, -0.00046253204345703125, 0.003871917724609375, 0.008206367492675781, 0.012540817260742188, 0.016875267028808594, 0.021209716796875, 0.025544166564941406, 0.029878616333007812, 0.03421306610107422, 0.038547515869140625, 0.04288196563720703, 0.04721641540527344, 0.051550865173339844, 0.05588531494140625, 0.060219764709472656, 0.06455421447753906, 0.06888866424560547, 0.07322311401367188, 0.07755756378173828, 0.08189201354980469, 0.0862264633178711, 0.0905609130859375, 0.0948953628540039, 0.09922981262207031, 0.10356426239013672, 0.10789871215820312, 0.11223316192626953, 0.11656761169433594, 0.12090206146240234, 0.12523651123046875, 0.12957096099853516, 0.13390541076660156, 0.13823986053466797, 0.14257431030273438, 0.14690876007080078, 0.1512432098388672, 0.1555776596069336, 0.159912109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 20.0, 56.0, 115.0, 197.0, 215.0, 184.0, 99.0, 73.0, 22.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.959807395935059, -5.839235782623291, -5.718664169311523, -5.598092079162598, -5.47752046585083, -5.3569488525390625, -5.236377239227295, -5.115805625915527, -4.995233535766602, -4.874661922454834, -4.754090309143066, -4.633518218994141, -4.512946605682373, -4.3923749923706055, -4.271803379058838, -4.15123176574707, -4.030660152435303, -3.910088539123535, -3.7895166873931885, -3.668945074081421, -3.548373222351074, -3.4278016090393066, -3.307229995727539, -3.1866581439971924, -3.0660862922668457, -2.945514678955078, -2.8249428272247314, -2.704371213912964, -2.583799362182617, -2.4632277488708496, -2.342656135559082, -2.2220842838287354, -2.1015126705169678, -1.9809409379959106, -1.8603692054748535, -1.739797592163086, -1.6192258596420288, -1.4986541271209717, -1.3780823945999146, -1.2575106620788574, -1.1369390487670898, -1.0163673162460327, -0.8957956433296204, -0.7752239108085632, -0.6546522378921509, -0.5340805053710938, -0.4135087728500366, -0.29293709993362427, -0.17236530780792236, -0.051793597638607025, 0.06877811253070831, 0.18934983015060425, 0.309921532869339, 0.43049323558807373, 0.5510649681091309, 0.6716366410255432, 0.7922083735466003, 0.9127801060676575, 1.0333517789840698, 1.153923511505127, 1.274495244026184, 1.3950669765472412, 1.5156385898590088, 1.636210322380066, 1.756782054901123]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 8.0, 5.0, 10.0, 13.0, 20.0, 12.0, 12.0, 23.0, 21.0, 22.0, 33.0, 33.0, 40.0, 38.0, 24.0, 34.0, 31.0, 37.0, 46.0, 47.0, 54.0, 39.0, 37.0, 32.0, 31.0, 33.0, 32.0, 32.0, 34.0, 29.0, 27.0, 15.0, 14.0, 12.0, 12.0, 6.0, 6.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.550621509552002, -1.50503408908844, -1.459446668624878, -1.4138593673706055, -1.3682719469070435, -1.3226845264434814, -1.277097225189209, -1.231509804725647, -1.185922384262085, -1.140334963798523, -1.094747543334961, -1.0491602420806885, -1.0035728216171265, -0.9579854011535645, -0.9123980402946472, -0.86681067943573, -0.821223258972168, -0.775635838508606, -0.7300484776496887, -0.6844611167907715, -0.6388736963272095, -0.5932862758636475, -0.5476989150047302, -0.502111554145813, -0.456524133682251, -0.41093674302101135, -0.36534935235977173, -0.3197619616985321, -0.2741745710372925, -0.22858718037605286, -0.18299978971481323, -0.1374123990535736, -0.09182500839233398, -0.04623761773109436, -0.0006502270698547363, 0.04493716359138489, 0.09052455425262451, 0.13611194491386414, 0.18169933557510376, 0.22728672623634338, 0.272874116897583, 0.31846150755882263, 0.36404889822006226, 0.4096362888813019, 0.4552236795425415, 0.5008111000061035, 0.5463984608650208, 0.591985821723938, 0.6375732421875, 0.683160662651062, 0.7287480235099792, 0.7743353843688965, 0.8199228048324585, 0.8655102252960205, 0.9110975861549377, 0.956684947013855, 1.002272367477417, 1.047859787940979, 1.093447208404541, 1.1390345096588135, 1.1846219301223755, 1.2302093505859375, 1.27579665184021, 1.321384072303772, 1.366971492767334]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 12.0, 10.0, 22.0, 28.0, 26.0, 48.0, 74.0, 146.0, 253.0, 476.0, 984.0, 2027.0, 3999.0, 8564.0, 19121.0, 44256.0, 116359.0, 392472.0, 1397838.0, 1533388.0, 457284.0, 131453.0, 47862.0, 20036.0, 9250.0, 4142.0, 1932.0, 996.0, 470.0, 301.0, 163.0, 90.0, 56.0, 32.0, 22.0, 28.0, 20.0, 7.0, 11.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3046875, -0.2951812744140625, -0.285675048828125, -0.2761688232421875, -0.26666259765625, -0.2571563720703125, -0.247650146484375, -0.2381439208984375, -0.2286376953125, -0.2191314697265625, -0.209625244140625, -0.2001190185546875, -0.19061279296875, -0.1811065673828125, -0.171600341796875, -0.1620941162109375, -0.152587890625, -0.1430816650390625, -0.133575439453125, -0.1240692138671875, -0.11456298828125, -0.1050567626953125, -0.095550537109375, -0.0860443115234375, -0.0765380859375, -0.0670318603515625, -0.057525634765625, -0.0480194091796875, -0.03851318359375, -0.0290069580078125, -0.019500732421875, -0.0099945068359375, -0.00048828125, 0.0090179443359375, 0.018524169921875, 0.0280303955078125, 0.03753662109375, 0.0470428466796875, 0.056549072265625, 0.0660552978515625, 0.0755615234375, 0.0850677490234375, 0.094573974609375, 0.1040802001953125, 0.11358642578125, 0.1230926513671875, 0.132598876953125, 0.1421051025390625, 0.151611328125, 0.1611175537109375, 0.170623779296875, 0.1801300048828125, 0.18963623046875, 0.1991424560546875, 0.208648681640625, 0.2181549072265625, 0.2276611328125, 0.2371673583984375, 0.246673583984375, 0.2561798095703125, 0.26568603515625, 0.2751922607421875, 0.284698486328125, 0.2942047119140625, 0.3037109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 7.0, 6.0, 10.0, 10.0, 13.0, 16.0, 15.0, 17.0, 32.0, 21.0, 31.0, 29.0, 37.0, 38.0, 38.0, 42.0, 40.0, 38.0, 48.0, 69.0, 45.0, 44.0, 42.0, 42.0, 36.0, 35.0, 36.0, 28.0, 22.0, 16.0, 20.0, 11.0, 10.0, 14.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24279022216796875, -0.2350921630859375, -0.22739410400390625, -0.219696044921875, -0.21199798583984375, -0.2042999267578125, -0.19660186767578125, -0.18890380859375, -0.18120574951171875, -0.1735076904296875, -0.16580963134765625, -0.158111572265625, -0.15041351318359375, -0.1427154541015625, -0.13501739501953125, -0.1273193359375, -0.11962127685546875, -0.1119232177734375, -0.10422515869140625, -0.096527099609375, -0.08882904052734375, -0.0811309814453125, -0.07343292236328125, -0.06573486328125, -0.05803680419921875, -0.0503387451171875, -0.04264068603515625, -0.034942626953125, -0.02724456787109375, -0.0195465087890625, -0.01184844970703125, -0.004150390625, 0.00354766845703125, 0.0112457275390625, 0.01894378662109375, 0.026641845703125, 0.03433990478515625, 0.0420379638671875, 0.04973602294921875, 0.05743408203125, 0.06513214111328125, 0.0728302001953125, 0.08052825927734375, 0.088226318359375, 0.09592437744140625, 0.1036224365234375, 0.11132049560546875, 0.1190185546875, 0.12671661376953125, 0.1344146728515625, 0.14211273193359375, 0.149810791015625, 0.15750885009765625, 0.1652069091796875, 0.17290496826171875, 0.18060302734375, 0.18830108642578125, 0.1959991455078125, 0.20369720458984375, 0.211395263671875, 0.21909332275390625, 0.2267913818359375, 0.23448944091796875, 0.2421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 11.0, 10.0, 11.0, 14.0, 26.0, 50.0, 51.0, 70.0, 109.0, 149.0, 196.0, 406.0, 625.0, 1069.0, 2122.0, 3879.0, 7742.0, 16714.0, 36338.0, 83315.0, 214384.0, 724219.0, 2001211.0, 732909.0, 216672.0, 83592.0, 36013.0, 16197.0, 7678.0, 3832.0, 1947.0, 1047.0, 602.0, 333.0, 229.0, 160.0, 110.0, 70.0, 45.0, 30.0, 17.0, 22.0, 12.0, 10.0, 9.0, 7.0, 8.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.3130607604980469, -0.30312347412109375, -0.2931861877441406, -0.2832489013671875, -0.2733116149902344, -0.26337432861328125, -0.2534370422363281, -0.243499755859375, -0.23356246948242188, -0.22362518310546875, -0.21368789672851562, -0.2037506103515625, -0.19381332397460938, -0.18387603759765625, -0.17393875122070312, -0.16400146484375, -0.15406417846679688, -0.14412689208984375, -0.13418960571289062, -0.1242523193359375, -0.11431503295898438, -0.10437774658203125, -0.09444046020507812, -0.084503173828125, -0.07456588745117188, -0.06462860107421875, -0.054691314697265625, -0.0447540283203125, -0.034816741943359375, -0.02487945556640625, -0.014942169189453125, -0.0050048828125, 0.004932403564453125, 0.01486968994140625, 0.024806976318359375, 0.0347442626953125, 0.044681549072265625, 0.05461883544921875, 0.06455612182617188, 0.074493408203125, 0.08443069458007812, 0.09436798095703125, 0.10430526733398438, 0.1142425537109375, 0.12417984008789062, 0.13411712646484375, 0.14405441284179688, 0.15399169921875, 0.16392898559570312, 0.17386627197265625, 0.18380355834960938, 0.1937408447265625, 0.20367813110351562, 0.21361541748046875, 0.22355270385742188, 0.233489990234375, 0.24342727661132812, 0.25336456298828125, 0.2633018493652344, 0.2732391357421875, 0.2831764221191406, 0.29311370849609375, 0.3030509948730469, 0.31298828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 8.0, 8.0, 11.0, 16.0, 23.0, 30.0, 33.0, 62.0, 82.0, 89.0, 112.0, 160.0, 250.0, 341.0, 549.0, 620.0, 489.0, 339.0, 238.0, 165.0, 109.0, 74.0, 66.0, 40.0, 36.0, 25.0, 15.0, 18.0, 10.0, 10.0, 5.0, 6.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.57373046875, -0.5591773986816406, -0.5446243286132812, -0.5300712585449219, -0.5155181884765625, -0.5009651184082031, -0.48641204833984375, -0.4718589782714844, -0.457305908203125, -0.4427528381347656, -0.42819976806640625, -0.4136466979980469, -0.3990936279296875, -0.3845405578613281, -0.36998748779296875, -0.3554344177246094, -0.34088134765625, -0.3263282775878906, -0.31177520751953125, -0.2972221374511719, -0.2826690673828125, -0.2681159973144531, -0.25356292724609375, -0.23900985717773438, -0.224456787109375, -0.20990371704101562, -0.19535064697265625, -0.18079757690429688, -0.1662445068359375, -0.15169143676757812, -0.13713836669921875, -0.12258529663085938, -0.1080322265625, -0.09347915649414062, -0.07892608642578125, -0.06437301635742188, -0.0498199462890625, -0.035266876220703125, -0.02071380615234375, -0.006160736083984375, 0.008392333984375, 0.022945404052734375, 0.03749847412109375, 0.052051544189453125, 0.0666046142578125, 0.08115768432617188, 0.09571075439453125, 0.11026382446289062, 0.12481689453125, 0.13936996459960938, 0.15392303466796875, 0.16847610473632812, 0.1830291748046875, 0.19758224487304688, 0.21213531494140625, 0.22668838500976562, 0.241241455078125, 0.2557945251464844, 0.27034759521484375, 0.2849006652832031, 0.2994537353515625, 0.3140068054199219, 0.32855987548828125, 0.3431129455566406, 0.357666015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 8.0, 11.0, 35.0, 64.0, 91.0, 134.0, 163.0, 159.0, 135.0, 92.0, 64.0, 24.0, 13.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4740829467773438, -3.3548779487609863, -3.235672950744629, -3.1164677143096924, -2.997262716293335, -2.8780577182769775, -2.758852481842041, -2.6396474838256836, -2.520442485809326, -2.4012374877929688, -2.2820324897766113, -2.162827253341675, -2.0436222553253174, -1.92441725730896, -1.805212140083313, -1.686007022857666, -1.5668020248413086, -1.4475970268249512, -1.3283919095993042, -1.2091867923736572, -1.0899817943572998, -0.9707767367362976, -0.8515716791152954, -0.7323666214942932, -0.613161563873291, -0.4939565062522888, -0.3747514486312866, -0.2555463910102844, -0.13634133338928223, -0.01713627576828003, 0.10206878185272217, 0.22127383947372437, 0.34047889709472656, 0.45968395471572876, 0.578889012336731, 0.6980940699577332, 0.8172991275787354, 0.9365041851997375, 1.0557092428207397, 1.1749143600463867, 1.2941193580627441, 1.4133243560791016, 1.5325294733047485, 1.6517345905303955, 1.770939588546753, 1.8901445865631104, 2.009349822998047, 2.1285548210144043, 2.2477598190307617, 2.366964817047119, 2.4861698150634766, 2.605375051498413, 2.7245800495147705, 2.843785047531128, 2.9629902839660645, 3.082195281982422, 3.2014002799987793, 3.3206052780151367, 3.439810276031494, 3.5590155124664307, 3.678220510482788, 3.7974255084991455, 3.916630744934082, 4.0358357429504395, 4.155040740966797]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 7.0, 7.0, 10.0, 6.0, 14.0, 15.0, 16.0, 17.0, 22.0, 20.0, 34.0, 33.0, 36.0, 34.0, 32.0, 45.0, 50.0, 53.0, 45.0, 39.0, 50.0, 45.0, 34.0, 39.0, 39.0, 36.0, 26.0, 25.0, 23.0, 27.0, 22.0, 20.0, 15.0, 18.0, 7.0, 9.0, 3.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8102275133132935, -1.7579783201217651, -1.7057290077209473, -1.653479814529419, -1.6012306213378906, -1.5489814281463623, -1.496732234954834, -1.4444829225540161, -1.3922337293624878, -1.3399845361709595, -1.2877352237701416, -1.2354860305786133, -1.183236837387085, -1.1309876441955566, -1.0787384510040283, -1.0264891386032104, -0.9742399454116821, -0.9219907522201538, -0.8697414994239807, -0.8174922466278076, -0.7652430534362793, -0.712993860244751, -0.6607446074485779, -0.6084953546524048, -0.5562461614608765, -0.5039969682693481, -0.45174771547317505, -0.39949849247932434, -0.34724926948547363, -0.2950000464916229, -0.24275082349777222, -0.1905016005039215, -0.13825225830078125, -0.08600303530693054, -0.033753812313079834, 0.018495410680770874, 0.07074463367462158, 0.12299385666847229, 0.175243079662323, 0.2274923026561737, 0.2797415256500244, 0.3319907486438751, 0.38423997163772583, 0.43648919463157654, 0.48873841762542725, 0.5409876108169556, 0.5932368636131287, 0.6454861164093018, 0.6977353096008301, 0.7499845027923584, 0.8022337555885315, 0.8544830083847046, 0.9067322015762329, 0.9589813947677612, 1.011230707168579, 1.0634799003601074, 1.1157290935516357, 1.167978286743164, 1.2202274799346924, 1.2724767923355103, 1.3247259855270386, 1.376975178718567, 1.4292244911193848, 1.481473684310913, 1.5337228775024414]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 9.0, 28.0, 43.0, 51.0, 85.0, 147.0, 229.0, 394.0, 681.0, 1185.0, 1962.0, 3113.0, 5023.0, 8551.0, 13467.0, 22953.0, 44262.0, 118051.0, 314865.0, 303271.0, 111470.0, 42385.0, 21919.0, 13294.0, 8231.0, 5163.0, 2994.0, 1909.0, 1107.0, 681.0, 408.0, 245.0, 138.0, 90.0, 59.0, 25.0, 22.0, 17.0, 4.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.32118988037109375, -0.3101043701171875, -0.29901885986328125, -0.287933349609375, -0.27684783935546875, -0.2657623291015625, -0.25467681884765625, -0.24359130859375, -0.23250579833984375, -0.2214202880859375, -0.21033477783203125, -0.199249267578125, -0.18816375732421875, -0.1770782470703125, -0.16599273681640625, -0.1549072265625, -0.14382171630859375, -0.1327362060546875, -0.12165069580078125, -0.110565185546875, -0.09947967529296875, -0.0883941650390625, -0.07730865478515625, -0.06622314453125, -0.05513763427734375, -0.0440521240234375, -0.03296661376953125, -0.021881103515625, -0.01079559326171875, 0.0002899169921875, 0.01137542724609375, 0.0224609375, 0.03354644775390625, 0.0446319580078125, 0.05571746826171875, 0.066802978515625, 0.07788848876953125, 0.0889739990234375, 0.10005950927734375, 0.11114501953125, 0.12223052978515625, 0.1333160400390625, 0.14440155029296875, 0.155487060546875, 0.16657257080078125, 0.1776580810546875, 0.18874359130859375, 0.1998291015625, 0.21091461181640625, 0.2220001220703125, 0.23308563232421875, 0.244171142578125, 0.25525665283203125, 0.2663421630859375, 0.27742767333984375, 0.28851318359375, 0.29959869384765625, 0.3106842041015625, 0.32176971435546875, 0.332855224609375, 0.34394073486328125, 0.3550262451171875, 0.36611175537109375, 0.377197265625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 12.0, 12.0, 11.0, 14.0, 22.0, 20.0, 25.0, 23.0, 35.0, 25.0, 43.0, 43.0, 41.0, 37.0, 47.0, 34.0, 53.0, 44.0, 42.0, 47.0, 42.0, 42.0, 42.0, 35.0, 24.0, 36.0, 23.0, 24.0, 16.0, 12.0, 15.0, 15.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.265869140625, -0.25786590576171875, -0.2498626708984375, -0.24185943603515625, -0.233856201171875, -0.22585296630859375, -0.2178497314453125, -0.20984649658203125, -0.20184326171875, -0.19384002685546875, -0.1858367919921875, -0.17783355712890625, -0.169830322265625, -0.16182708740234375, -0.1538238525390625, -0.14582061767578125, -0.1378173828125, -0.12981414794921875, -0.1218109130859375, -0.11380767822265625, -0.105804443359375, -0.09780120849609375, -0.0897979736328125, -0.08179473876953125, -0.07379150390625, -0.06578826904296875, -0.0577850341796875, -0.04978179931640625, -0.041778564453125, -0.03377532958984375, -0.0257720947265625, -0.01776885986328125, -0.009765625, -0.00176239013671875, 0.0062408447265625, 0.01424407958984375, 0.022247314453125, 0.03025054931640625, 0.0382537841796875, 0.04625701904296875, 0.05426025390625, 0.06226348876953125, 0.0702667236328125, 0.07826995849609375, 0.086273193359375, 0.09427642822265625, 0.1022796630859375, 0.11028289794921875, 0.1182861328125, 0.12628936767578125, 0.1342926025390625, 0.14229583740234375, 0.150299072265625, 0.15830230712890625, 0.1663055419921875, 0.17430877685546875, 0.18231201171875, 0.19031524658203125, 0.1983184814453125, 0.20632171630859375, 0.214324951171875, 0.22232818603515625, 0.2303314208984375, 0.23833465576171875, 0.246337890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 8.0, 10.0, 13.0, 11.0, 32.0, 41.0, 80.0, 107.0, 175.0, 270.0, 500.0, 855.0, 1724.0, 4243.0, 11446.0, 35310.0, 158584.0, 613381.0, 165258.0, 36466.0, 11724.0, 4362.0, 1865.0, 852.0, 480.0, 281.0, 172.0, 90.0, 54.0, 57.0, 30.0, 21.0, 8.0, 12.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79052734375, -0.766937255859375, -0.74334716796875, -0.719757080078125, -0.6961669921875, -0.672576904296875, -0.64898681640625, -0.625396728515625, -0.601806640625, -0.578216552734375, -0.55462646484375, -0.531036376953125, -0.5074462890625, -0.483856201171875, -0.46026611328125, -0.436676025390625, -0.4130859375, -0.389495849609375, -0.36590576171875, -0.342315673828125, -0.3187255859375, -0.295135498046875, -0.27154541015625, -0.247955322265625, -0.224365234375, -0.200775146484375, -0.17718505859375, -0.153594970703125, -0.1300048828125, -0.106414794921875, -0.08282470703125, -0.059234619140625, -0.03564453125, -0.012054443359375, 0.01153564453125, 0.035125732421875, 0.0587158203125, 0.082305908203125, 0.10589599609375, 0.129486083984375, 0.153076171875, 0.176666259765625, 0.20025634765625, 0.223846435546875, 0.2474365234375, 0.271026611328125, 0.29461669921875, 0.318206787109375, 0.341796875, 0.365386962890625, 0.38897705078125, 0.412567138671875, 0.4361572265625, 0.459747314453125, 0.48333740234375, 0.506927490234375, 0.530517578125, 0.554107666015625, 0.57769775390625, 0.601287841796875, 0.6248779296875, 0.648468017578125, 0.67205810546875, 0.695648193359375, 0.71923828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 8.0, 8.0, 12.0, 17.0, 18.0, 27.0, 32.0, 25.0, 45.0, 33.0, 38.0, 45.0, 52.0, 51.0, 49.0, 65.0, 49.0, 40.0, 61.0, 42.0, 41.0, 35.0, 31.0, 38.0, 23.0, 18.0, 15.0, 13.0, 10.0, 8.0, 8.0, 10.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-1.08984375, -1.0627212524414062, -1.0355987548828125, -1.0084762573242188, -0.981353759765625, -0.9542312622070312, -0.9271087646484375, -0.8999862670898438, -0.87286376953125, -0.8457412719726562, -0.8186187744140625, -0.7914962768554688, -0.764373779296875, -0.7372512817382812, -0.7101287841796875, -0.6830062866210938, -0.6558837890625, -0.6287612915039062, -0.6016387939453125, -0.5745162963867188, -0.547393798828125, -0.5202713012695312, -0.4931488037109375, -0.46602630615234375, -0.43890380859375, -0.41178131103515625, -0.3846588134765625, -0.35753631591796875, -0.330413818359375, -0.30329132080078125, -0.2761688232421875, -0.24904632568359375, -0.221923828125, -0.19480133056640625, -0.1676788330078125, -0.14055633544921875, -0.113433837890625, -0.08631134033203125, -0.0591888427734375, -0.03206634521484375, -0.00494384765625, 0.02217864990234375, 0.0493011474609375, 0.07642364501953125, 0.103546142578125, 0.13066864013671875, 0.1577911376953125, 0.18491363525390625, 0.2120361328125, 0.23915863037109375, 0.2662811279296875, 0.29340362548828125, 0.320526123046875, 0.34764862060546875, 0.3747711181640625, 0.40189361572265625, 0.42901611328125, 0.45613861083984375, 0.4832611083984375, 0.5103836059570312, 0.537506103515625, 0.5646286010742188, 0.5917510986328125, 0.6188735961914062, 0.64599609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 3.0, 6.0, 12.0, 10.0, 15.0, 18.0, 26.0, 46.0, 67.0, 85.0, 164.0, 237.0, 410.0, 673.0, 1178.0, 2103.0, 3779.0, 6978.0, 13065.0, 25269.0, 52340.0, 123406.0, 301854.0, 293479.0, 119680.0, 50950.0, 24517.0, 12651.0, 6720.0, 3868.0, 2028.0, 1106.0, 696.0, 405.0, 243.0, 138.0, 98.0, 72.0, 47.0, 27.0, 17.0, 16.0, 17.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.1353759765625, -0.1312713623046875, -0.127166748046875, -0.1230621337890625, -0.11895751953125, -0.1148529052734375, -0.110748291015625, -0.1066436767578125, -0.1025390625, -0.0984344482421875, -0.094329833984375, -0.0902252197265625, -0.08612060546875, -0.0820159912109375, -0.077911376953125, -0.0738067626953125, -0.0697021484375, -0.0655975341796875, -0.061492919921875, -0.0573883056640625, -0.05328369140625, -0.0491790771484375, -0.045074462890625, -0.0409698486328125, -0.036865234375, -0.0327606201171875, -0.028656005859375, -0.0245513916015625, -0.02044677734375, -0.0163421630859375, -0.012237548828125, -0.0081329345703125, -0.0040283203125, 7.62939453125e-05, 0.004180908203125, 0.0082855224609375, 0.01239013671875, 0.0164947509765625, 0.020599365234375, 0.0247039794921875, 0.02880859375, 0.0329132080078125, 0.037017822265625, 0.0411224365234375, 0.04522705078125, 0.0493316650390625, 0.053436279296875, 0.0575408935546875, 0.0616455078125, 0.0657501220703125, 0.069854736328125, 0.0739593505859375, 0.07806396484375, 0.0821685791015625, 0.086273193359375, 0.0903778076171875, 0.094482421875, 0.0985870361328125, 0.102691650390625, 0.1067962646484375, 0.11090087890625, 0.1150054931640625, 0.119110107421875, 0.1232147216796875, 0.1273193359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 5.0, 4.0, 2.0, 5.0, 4.0, 11.0, 13.0, 11.0, 19.0, 14.0, 31.0, 45.0, 63.0, 79.0, 95.0, 114.0, 120.0, 81.0, 72.0, 58.0, 39.0, 21.0, 21.0, 14.0, 8.0, 7.0, 6.0, 3.0, 1.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2378902435302734e-05, -4.0901824831962585e-05, -3.9424747228622437e-05, -3.794766962528229e-05, -3.647059202194214e-05, -3.499351441860199e-05, -3.351643681526184e-05, -3.203935921192169e-05, -3.056228160858154e-05, -2.9085204005241394e-05, -2.7608126401901245e-05, -2.6131048798561096e-05, -2.4653971195220947e-05, -2.31768935918808e-05, -2.169981598854065e-05, -2.02227383852005e-05, -1.874566078186035e-05, -1.7268583178520203e-05, -1.5791505575180054e-05, -1.4314427971839905e-05, -1.2837350368499756e-05, -1.1360272765159607e-05, -9.883195161819458e-06, -8.406117558479309e-06, -6.92903995513916e-06, -5.451962351799011e-06, -3.974884748458862e-06, -2.4978071451187134e-06, -1.0207295417785645e-06, 4.5634806156158447e-07, 1.9334256649017334e-06, 3.4105032682418823e-06, 4.887580871582031e-06, 6.36465847492218e-06, 7.841736078262329e-06, 9.318813681602478e-06, 1.0795891284942627e-05, 1.2272968888282776e-05, 1.3750046491622925e-05, 1.5227124094963074e-05, 1.6704201698303223e-05, 1.818127930164337e-05, 1.965835690498352e-05, 2.113543450832367e-05, 2.261251211166382e-05, 2.4089589715003967e-05, 2.5566667318344116e-05, 2.7043744921684265e-05, 2.8520822525024414e-05, 2.9997900128364563e-05, 3.147497773170471e-05, 3.295205533504486e-05, 3.442913293838501e-05, 3.590621054172516e-05, 3.738328814506531e-05, 3.8860365748405457e-05, 4.0337443351745605e-05, 4.1814520955085754e-05, 4.32915985584259e-05, 4.476867616176605e-05, 4.62457537651062e-05, 4.772283136844635e-05, 4.91999089717865e-05, 5.067698657512665e-05, 5.21540641784668e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 14.0, 13.0, 18.0, 26.0, 24.0, 40.0, 83.0, 96.0, 131.0, 177.0, 209.0, 341.0, 501.0, 874.0, 1560.0, 2862.0, 5661.0, 11688.0, 23857.0, 49499.0, 115147.0, 272076.0, 307448.0, 140763.0, 59651.0, 27874.0, 13433.0, 6579.0, 3285.0, 1782.0, 978.0, 595.0, 373.0, 240.0, 177.0, 120.0, 94.0, 69.0, 57.0, 37.0, 35.0, 22.0, 10.0, 7.0, 11.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.124755859375, -0.12087059020996094, -0.11698532104492188, -0.11310005187988281, -0.10921478271484375, -0.10532951354980469, -0.10144424438476562, -0.09755897521972656, -0.0936737060546875, -0.08978843688964844, -0.08590316772460938, -0.08201789855957031, -0.07813262939453125, -0.07424736022949219, -0.07036209106445312, -0.06647682189941406, -0.062591552734375, -0.05870628356933594, -0.054821014404296875, -0.05093574523925781, -0.04705047607421875, -0.04316520690917969, -0.039279937744140625, -0.03539466857910156, -0.0315093994140625, -0.027624130249023438, -0.023738861083984375, -0.019853591918945312, -0.01596832275390625, -0.012083053588867188, -0.008197784423828125, -0.0043125152587890625, -0.00042724609375, 0.0034580230712890625, 0.007343292236328125, 0.011228561401367188, 0.01511383056640625, 0.018999099731445312, 0.022884368896484375, 0.026769638061523438, 0.0306549072265625, 0.03454017639160156, 0.038425445556640625, 0.04231071472167969, 0.04619598388671875, 0.05008125305175781, 0.053966522216796875, 0.05785179138183594, 0.061737060546875, 0.06562232971191406, 0.06950759887695312, 0.07339286804199219, 0.07727813720703125, 0.08116340637207031, 0.08504867553710938, 0.08893394470214844, 0.0928192138671875, 0.09670448303222656, 0.10058975219726562, 0.10447502136230469, 0.10836029052734375, 0.11224555969238281, 0.11613082885742188, 0.12001609802246094, 0.1239013671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 3.0, 6.0, 10.0, 10.0, 13.0, 20.0, 18.0, 29.0, 22.0, 46.0, 47.0, 64.0, 71.0, 65.0, 68.0, 55.0, 58.0, 58.0, 58.0, 42.0, 35.0, 27.0, 19.0, 24.0, 22.0, 15.0, 17.0, 6.0, 4.0, 14.0, 6.0, 6.0, 5.0, 5.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.13665008544921875, -0.1319427490234375, -0.12723541259765625, -0.122528076171875, -0.11782073974609375, -0.1131134033203125, -0.10840606689453125, -0.10369873046875, -0.09899139404296875, -0.0942840576171875, -0.08957672119140625, -0.084869384765625, -0.08016204833984375, -0.0754547119140625, -0.07074737548828125, -0.0660400390625, -0.06133270263671875, -0.0566253662109375, -0.05191802978515625, -0.047210693359375, -0.04250335693359375, -0.0377960205078125, -0.03308868408203125, -0.02838134765625, -0.02367401123046875, -0.0189666748046875, -0.01425933837890625, -0.009552001953125, -0.00484466552734375, -0.0001373291015625, 0.00457000732421875, 0.00927734375, 0.01398468017578125, 0.0186920166015625, 0.02339935302734375, 0.028106689453125, 0.03281402587890625, 0.0375213623046875, 0.04222869873046875, 0.04693603515625, 0.05164337158203125, 0.0563507080078125, 0.06105804443359375, 0.065765380859375, 0.07047271728515625, 0.0751800537109375, 0.07988739013671875, 0.0845947265625, 0.08930206298828125, 0.0940093994140625, 0.09871673583984375, 0.103424072265625, 0.10813140869140625, 0.1128387451171875, 0.11754608154296875, 0.12225341796875, 0.12696075439453125, 0.1316680908203125, 0.13637542724609375, 0.141082763671875, 0.14579010009765625, 0.1504974365234375, 0.15520477294921875, 0.159912109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 13.0, 77.0, 323.0, 416.0, 134.0, 28.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.496549606323242, -13.22790241241455, -12.95925521850586, -12.690608024597168, -12.421960830688477, -12.153313636779785, -11.884666442871094, -11.616019248962402, -11.347372055053711, -11.07872486114502, -10.810077667236328, -10.541430473327637, -10.272783279418945, -10.004136085510254, -9.735488891601562, -9.466841697692871, -9.19819450378418, -8.929547309875488, -8.660900115966797, -8.392252922058105, -8.123605728149414, -7.854958534240723, -7.586311340332031, -7.31766414642334, -7.049015998840332, -6.780368804931641, -6.511721611022949, -6.243074417114258, -5.974427223205566, -5.705780029296875, -5.437132835388184, -5.168485641479492, -4.899839401245117, -4.631192207336426, -4.362545013427734, -4.093897819519043, -3.8252506256103516, -3.55660343170166, -3.2879559993743896, -3.0193088054656982, -2.7506613731384277, -2.4820141792297363, -2.213366985321045, -1.944719672203064, -1.6760724782943726, -1.4074252843856812, -1.1387779712677002, -0.8701307773590088, -0.6014835834503174, -0.3328363597393036, -0.0641891360282898, 0.2044581174850464, 0.4731053113937378, 0.7417525053024292, 1.0103998184204102, 1.2790470123291016, 1.547694206237793, 1.8163414001464844, 2.084988594055176, 2.353635787963867, 2.6222829818725586, 2.89093017578125, 3.1595776081085205, 3.428224802017212, 3.6968719959259033]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 4.0, 11.0, 10.0, 15.0, 13.0, 13.0, 19.0, 18.0, 22.0, 26.0, 36.0, 29.0, 34.0, 32.0, 36.0, 45.0, 37.0, 33.0, 40.0, 53.0, 27.0, 36.0, 45.0, 39.0, 44.0, 36.0, 40.0, 37.0, 18.0, 24.0, 23.0, 18.0, 16.0, 18.0, 7.0, 10.0, 5.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7047542333602905, -1.6506109237670898, -1.5964676141738892, -1.5423243045806885, -1.4881809949874878, -1.434037685394287, -1.3798943758010864, -1.3257510662078857, -1.271607756614685, -1.2174644470214844, -1.1633211374282837, -1.109177827835083, -1.0550345182418823, -1.0008912086486816, -0.946747899055481, -0.8926045894622803, -0.8384612798690796, -0.7843179702758789, -0.7301746606826782, -0.6760313510894775, -0.6218880414962769, -0.5677447319030762, -0.5136014223098755, -0.4594581127166748, -0.4053148031234741, -0.35117149353027344, -0.29702818393707275, -0.24288487434387207, -0.1887415647506714, -0.1345982551574707, -0.08045494556427002, -0.026311635971069336, 0.027831554412841797, 0.08197486400604248, 0.13611817359924316, 0.19026148319244385, 0.24440479278564453, 0.2985481023788452, 0.3526914119720459, 0.4068347215652466, 0.46097803115844727, 0.515121340751648, 0.5692646503448486, 0.6234079599380493, 0.67755126953125, 0.7316945791244507, 0.7858378887176514, 0.839981198310852, 0.8941245079040527, 0.9482678174972534, 1.002411127090454, 1.0565544366836548, 1.1106977462768555, 1.1648410558700562, 1.2189843654632568, 1.2731276750564575, 1.3272709846496582, 1.3814142942428589, 1.4355576038360596, 1.4897009134292603, 1.543844223022461, 1.5979875326156616, 1.6521308422088623, 1.706274151802063, 1.7604174613952637]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 12.0, 16.0, 29.0, 30.0, 30.0, 66.0, 89.0, 135.0, 185.0, 311.0, 498.0, 797.0, 1279.0, 1988.0, 3345.0, 5381.0, 8862.0, 15423.0, 27632.0, 51004.0, 102358.0, 222347.0, 496111.0, 916970.0, 1050525.0, 664787.0, 320273.0, 147051.0, 71003.0, 36612.0, 20160.0, 11658.0, 6857.0, 4112.0, 2370.0, 1418.0, 927.0, 606.0, 321.0, 230.0, 148.0, 92.0, 72.0, 53.0, 45.0, 26.0, 18.0, 11.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1798095703125, -0.1738605499267578, -0.16791152954101562, -0.16196250915527344, -0.15601348876953125, -0.15006446838378906, -0.14411544799804688, -0.1381664276123047, -0.1322174072265625, -0.1262683868408203, -0.12031936645507812, -0.11437034606933594, -0.10842132568359375, -0.10247230529785156, -0.09652328491210938, -0.09057426452636719, -0.084625244140625, -0.07867622375488281, -0.07272720336914062, -0.06677818298339844, -0.06082916259765625, -0.05488014221191406, -0.048931121826171875, -0.04298210144042969, -0.0370330810546875, -0.031084060668945312, -0.025135040283203125, -0.019186019897460938, -0.01323699951171875, -0.0072879791259765625, -0.001338958740234375, 0.0046100616455078125, 0.01055908203125, 0.016508102416992188, 0.022457122802734375, 0.028406143188476562, 0.03435516357421875, 0.04030418395996094, 0.046253204345703125, 0.05220222473144531, 0.0581512451171875, 0.06410026550292969, 0.07004928588867188, 0.07599830627441406, 0.08194732666015625, 0.08789634704589844, 0.09384536743164062, 0.09979438781738281, 0.105743408203125, 0.11169242858886719, 0.11764144897460938, 0.12359046936035156, 0.12953948974609375, 0.13548851013183594, 0.14143753051757812, 0.1473865509033203, 0.1533355712890625, 0.1592845916748047, 0.16523361206054688, 0.17118263244628906, 0.17713165283203125, 0.18308067321777344, 0.18902969360351562, 0.1949787139892578, 0.200927734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 1.0, 8.0, 3.0, 5.0, 8.0, 15.0, 17.0, 16.0, 14.0, 8.0, 19.0, 20.0, 37.0, 28.0, 20.0, 29.0, 36.0, 42.0, 36.0, 32.0, 44.0, 34.0, 41.0, 37.0, 38.0, 46.0, 31.0, 41.0, 31.0, 35.0, 25.0, 31.0, 22.0, 34.0, 20.0, 14.0, 13.0, 12.0, 8.0, 10.0, 7.0, 3.0, 12.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2333984375, -0.22637367248535156, -0.21934890747070312, -0.2123241424560547, -0.20529937744140625, -0.1982746124267578, -0.19124984741210938, -0.18422508239746094, -0.1772003173828125, -0.17017555236816406, -0.16315078735351562, -0.1561260223388672, -0.14910125732421875, -0.1420764923095703, -0.13505172729492188, -0.12802696228027344, -0.121002197265625, -0.11397743225097656, -0.10695266723632812, -0.09992790222167969, -0.09290313720703125, -0.08587837219238281, -0.07885360717773438, -0.07182884216308594, -0.0648040771484375, -0.05777931213378906, -0.050754547119140625, -0.04372978210449219, -0.03670501708984375, -0.029680252075195312, -0.022655487060546875, -0.015630722045898438, -0.00860595703125, -0.0015811920166015625, 0.005443572998046875, 0.012468338012695312, 0.01949310302734375, 0.026517868041992188, 0.033542633056640625, 0.04056739807128906, 0.0475921630859375, 0.05461692810058594, 0.061641693115234375, 0.06866645812988281, 0.07569122314453125, 0.08271598815917969, 0.08974075317382812, 0.09676551818847656, 0.103790283203125, 0.11081504821777344, 0.11783981323242188, 0.12486457824707031, 0.13188934326171875, 0.1389141082763672, 0.14593887329101562, 0.15296363830566406, 0.1599884033203125, 0.16701316833496094, 0.17403793334960938, 0.1810626983642578, 0.18808746337890625, 0.1951122283935547, 0.20213699340820312, 0.20916175842285156, 0.2161865234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 12.0, 7.0, 21.0, 31.0, 44.0, 74.0, 90.0, 181.0, 261.0, 535.0, 879.0, 1860.0, 5038.0, 18176.0, 89999.0, 627141.0, 2897018.0, 459104.0, 70875.0, 14918.0, 4286.0, 1730.0, 832.0, 454.0, 266.0, 159.0, 104.0, 63.0, 45.0, 26.0, 15.0, 12.0, 9.0, 3.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.81396484375, -0.79278564453125, -0.7716064453125, -0.75042724609375, -0.729248046875, -0.70806884765625, -0.6868896484375, -0.66571044921875, -0.64453125, -0.62335205078125, -0.6021728515625, -0.58099365234375, -0.559814453125, -0.53863525390625, -0.5174560546875, -0.49627685546875, -0.47509765625, -0.45391845703125, -0.4327392578125, -0.41156005859375, -0.390380859375, -0.36920166015625, -0.3480224609375, -0.32684326171875, -0.3056640625, -0.28448486328125, -0.2633056640625, -0.24212646484375, -0.220947265625, -0.19976806640625, -0.1785888671875, -0.15740966796875, -0.13623046875, -0.11505126953125, -0.0938720703125, -0.07269287109375, -0.051513671875, -0.03033447265625, -0.0091552734375, 0.01202392578125, 0.033203125, 0.05438232421875, 0.0755615234375, 0.09674072265625, 0.117919921875, 0.13909912109375, 0.1602783203125, 0.18145751953125, 0.20263671875, 0.22381591796875, 0.2449951171875, 0.26617431640625, 0.287353515625, 0.30853271484375, 0.3297119140625, 0.35089111328125, 0.3720703125, 0.39324951171875, 0.4144287109375, 0.43560791015625, 0.456787109375, 0.47796630859375, 0.4991455078125, 0.52032470703125, 0.54150390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 15.0, 26.0, 39.0, 49.0, 83.0, 109.0, 145.0, 254.0, 440.0, 698.0, 714.0, 580.0, 307.0, 211.0, 133.0, 78.0, 45.0, 41.0, 22.0, 16.0, 11.0, 12.0, 11.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5888900756835938, -0.5664520263671875, -0.5440139770507812, -0.521575927734375, -0.49913787841796875, -0.4766998291015625, -0.45426177978515625, -0.43182373046875, -0.40938568115234375, -0.3869476318359375, -0.36450958251953125, -0.342071533203125, -0.31963348388671875, -0.2971954345703125, -0.27475738525390625, -0.2523193359375, -0.22988128662109375, -0.2074432373046875, -0.18500518798828125, -0.162567138671875, -0.14012908935546875, -0.1176910400390625, -0.09525299072265625, -0.07281494140625, -0.05037689208984375, -0.0279388427734375, -0.00550079345703125, 0.016937255859375, 0.03937530517578125, 0.0618133544921875, 0.08425140380859375, 0.106689453125, 0.12912750244140625, 0.1515655517578125, 0.17400360107421875, 0.196441650390625, 0.21887969970703125, 0.2413177490234375, 0.26375579833984375, 0.28619384765625, 0.30863189697265625, 0.3310699462890625, 0.35350799560546875, 0.375946044921875, 0.39838409423828125, 0.4208221435546875, 0.44326019287109375, 0.4656982421875, 0.48813629150390625, 0.5105743408203125, 0.5330123901367188, 0.555450439453125, 0.5778884887695312, 0.6003265380859375, 0.6227645874023438, 0.64520263671875, 0.6676406860351562, 0.6900787353515625, 0.7125167846679688, 0.734954833984375, 0.7573928833007812, 0.7798309326171875, 0.8022689819335938, 0.82470703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 19.0, 61.0, 146.0, 213.0, 210.0, 163.0, 102.0, 44.0, 18.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.847646713256836, -4.670276641845703, -4.49290657043457, -4.3155364990234375, -4.138166427612305, -3.960796356201172, -3.78342604637146, -3.606055974960327, -3.4286859035491943, -3.2513158321380615, -3.0739457607269287, -2.896575450897217, -2.719205379486084, -2.541835308074951, -2.3644652366638184, -2.1870951652526855, -2.0097250938415527, -1.83235502243042, -1.654984951019287, -1.4776147603988647, -1.300244688987732, -1.1228746175765991, -0.9455044269561768, -0.768134355545044, -0.5907642841339111, -0.41339418292045593, -0.23602408170700073, -0.058653950691223145, 0.11871612071990967, 0.2960861921310425, 0.47345638275146484, 0.6508264541625977, 0.8281960487365723, 1.005566120147705, 1.182936191558838, 1.3603063821792603, 1.537676453590393, 1.7150465250015259, 1.8924167156219482, 2.069786787033081, 2.247156858444214, 2.4245269298553467, 2.6018970012664795, 2.7792673110961914, 2.956637382507324, 3.134007453918457, 3.31137752532959, 3.4887475967407227, 3.6661176681518555, 3.8434877395629883, 4.020857810974121, 4.198227882385254, 4.375597953796387, 4.5529680252075195, 4.730338096618652, 4.907708168029785, 5.085078239440918, 5.262448310852051, 5.439818382263184, 5.617188453674316, 5.794558525085449, 5.971928596496582, 6.149298667907715, 6.326668739318848, 6.504039287567139]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 4.0, 9.0, 6.0, 5.0, 12.0, 17.0, 13.0, 23.0, 20.0, 23.0, 33.0, 27.0, 32.0, 31.0, 41.0, 31.0, 34.0, 51.0, 44.0, 52.0, 41.0, 43.0, 45.0, 46.0, 41.0, 38.0, 33.0, 35.0, 23.0, 22.0, 21.0, 20.0, 15.0, 14.0, 9.0, 9.0, 3.0, 6.0, 7.0, 7.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.784436821937561, -1.7271194458007812, -1.6698020696640015, -1.6124846935272217, -1.555167317390442, -1.497849941253662, -1.4405324459075928, -1.383215069770813, -1.3258976936340332, -1.2685803174972534, -1.2112629413604736, -1.1539455652236938, -1.096628189086914, -1.0393106937408447, -0.9819933772087097, -0.9246759414672852, -0.8673586249351501, -0.8100412487983704, -0.7527238726615906, -0.695406436920166, -0.6380890607833862, -0.5807716846466064, -0.5234543085098267, -0.4661369025707245, -0.4088195264339447, -0.3515021502971649, -0.29418474435806274, -0.23686736822128296, -0.17954997718334198, -0.122232586145401, -0.06491521000862122, -0.007597804069519043, 0.04971957206726074, 0.10703696310520172, 0.1643543541431427, 0.22167173027992249, 0.27898913621902466, 0.33630651235580444, 0.39362388849258423, 0.4509412944316864, 0.5082587003707886, 0.5655760765075684, 0.6228934526443481, 0.6802108287811279, 0.7375282645225525, 0.7948456406593323, 0.8521630167961121, 0.9094804525375366, 0.9667977690696716, 1.0241152048110962, 1.081432580947876, 1.1387499570846558, 1.1960673332214355, 1.2533847093582153, 1.3107020854949951, 1.368019461631775, 1.4253368377685547, 1.4826542139053345, 1.5399715900421143, 1.597288966178894, 1.6546063423156738, 1.7119238376617432, 1.7692410945892334, 1.8265585899353027, 1.8838759660720825]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 4.0, 9.0, 10.0, 15.0, 34.0, 59.0, 62.0, 96.0, 175.0, 238.0, 357.0, 562.0, 835.0, 1413.0, 2341.0, 4030.0, 6762.0, 11925.0, 20478.0, 39142.0, 85908.0, 213923.0, 327483.0, 181067.0, 72899.0, 34328.0, 18395.0, 10776.0, 6062.0, 3515.0, 2187.0, 1303.0, 746.0, 494.0, 304.0, 183.0, 140.0, 83.0, 61.0, 37.0, 34.0, 18.0, 12.0, 17.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.332763671875, -0.3218193054199219, -0.31087493896484375, -0.2999305725097656, -0.2889862060546875, -0.2780418395996094, -0.26709747314453125, -0.2561531066894531, -0.245208740234375, -0.23426437377929688, -0.22332000732421875, -0.21237564086914062, -0.2014312744140625, -0.19048690795898438, -0.17954254150390625, -0.16859817504882812, -0.15765380859375, -0.14670944213867188, -0.13576507568359375, -0.12482070922851562, -0.1138763427734375, -0.10293197631835938, -0.09198760986328125, -0.08104324340820312, -0.070098876953125, -0.059154510498046875, -0.04821014404296875, -0.037265777587890625, -0.0263214111328125, -0.015377044677734375, -0.00443267822265625, 0.006511688232421875, 0.0174560546875, 0.028400421142578125, 0.03934478759765625, 0.050289154052734375, 0.0612335205078125, 0.07217788696289062, 0.08312225341796875, 0.09406661987304688, 0.105010986328125, 0.11595535278320312, 0.12689971923828125, 0.13784408569335938, 0.1487884521484375, 0.15973281860351562, 0.17067718505859375, 0.18162155151367188, 0.19256591796875, 0.20351028442382812, 0.21445465087890625, 0.22539901733398438, 0.2363433837890625, 0.24728775024414062, 0.25823211669921875, 0.2691764831542969, 0.280120849609375, 0.2910652160644531, 0.30200958251953125, 0.3129539489746094, 0.3238983154296875, 0.3348426818847656, 0.34578704833984375, 0.3567314147949219, 0.36767578125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 10.0, 4.0, 10.0, 8.0, 18.0, 11.0, 25.0, 24.0, 17.0, 17.0, 25.0, 31.0, 25.0, 27.0, 29.0, 40.0, 46.0, 45.0, 35.0, 32.0, 46.0, 43.0, 38.0, 41.0, 38.0, 31.0, 46.0, 28.0, 23.0, 25.0, 18.0, 26.0, 17.0, 15.0, 16.0, 10.0, 9.0, 7.0, 7.0, 3.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2291259765625, -0.2218608856201172, -0.21459579467773438, -0.20733070373535156, -0.20006561279296875, -0.19280052185058594, -0.18553543090820312, -0.1782703399658203, -0.1710052490234375, -0.1637401580810547, -0.15647506713867188, -0.14920997619628906, -0.14194488525390625, -0.13467979431152344, -0.12741470336914062, -0.12014961242675781, -0.112884521484375, -0.10561943054199219, -0.09835433959960938, -0.09108924865722656, -0.08382415771484375, -0.07655906677246094, -0.06929397583007812, -0.06202888488769531, -0.0547637939453125, -0.04749870300292969, -0.040233612060546875, -0.03296852111816406, -0.02570343017578125, -0.018438339233398438, -0.011173248291015625, -0.0039081573486328125, 0.00335693359375, 0.010622024536132812, 0.017887115478515625, 0.025152206420898438, 0.03241729736328125, 0.03968238830566406, 0.046947479248046875, 0.05421257019042969, 0.0614776611328125, 0.06874275207519531, 0.07600784301757812, 0.08327293395996094, 0.09053802490234375, 0.09780311584472656, 0.10506820678710938, 0.11233329772949219, 0.119598388671875, 0.1268634796142578, 0.13412857055664062, 0.14139366149902344, 0.14865875244140625, 0.15592384338378906, 0.16318893432617188, 0.1704540252685547, 0.1777191162109375, 0.1849842071533203, 0.19224929809570312, 0.19951438903808594, 0.20677947998046875, 0.21404457092285156, 0.22130966186523438, 0.2285747528076172, 0.23583984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 2.0, 11.0, 14.0, 20.0, 23.0, 43.0, 82.0, 104.0, 160.0, 293.0, 527.0, 1027.0, 2399.0, 6449.0, 21942.0, 93720.0, 528412.0, 316231.0, 54700.0, 14170.0, 4569.0, 1781.0, 852.0, 420.0, 232.0, 131.0, 91.0, 50.0, 32.0, 16.0, 13.0, 7.0, 7.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7919921875, -0.7645187377929688, -0.7370452880859375, -0.7095718383789062, -0.682098388671875, -0.6546249389648438, -0.6271514892578125, -0.5996780395507812, -0.57220458984375, -0.5447311401367188, -0.5172576904296875, -0.48978424072265625, -0.462310791015625, -0.43483734130859375, -0.4073638916015625, -0.37989044189453125, -0.3524169921875, -0.32494354248046875, -0.2974700927734375, -0.26999664306640625, -0.242523193359375, -0.21504974365234375, -0.1875762939453125, -0.16010284423828125, -0.13262939453125, -0.10515594482421875, -0.0776824951171875, -0.05020904541015625, -0.022735595703125, 0.00473785400390625, 0.0322113037109375, 0.05968475341796875, 0.087158203125, 0.11463165283203125, 0.1421051025390625, 0.16957855224609375, 0.197052001953125, 0.22452545166015625, 0.2519989013671875, 0.27947235107421875, 0.30694580078125, 0.33441925048828125, 0.3618927001953125, 0.38936614990234375, 0.416839599609375, 0.44431304931640625, 0.4717864990234375, 0.49925994873046875, 0.5267333984375, 0.5542068481445312, 0.5816802978515625, 0.6091537475585938, 0.636627197265625, 0.6641006469726562, 0.6915740966796875, 0.7190475463867188, 0.74652099609375, 0.7739944458007812, 0.8014678955078125, 0.8289413452148438, 0.856414794921875, 0.8838882446289062, 0.9113616943359375, 0.9388351440429688, 0.96630859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 5.0, 8.0, 5.0, 11.0, 13.0, 19.0, 19.0, 27.0, 32.0, 35.0, 26.0, 42.0, 45.0, 49.0, 63.0, 62.0, 66.0, 56.0, 53.0, 39.0, 38.0, 40.0, 44.0, 38.0, 24.0, 27.0, 20.0, 17.0, 15.0, 9.0, 10.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.017578125, -0.9888839721679688, -0.9601898193359375, -0.9314956665039062, -0.902801513671875, -0.8741073608398438, -0.8454132080078125, -0.8167190551757812, -0.78802490234375, -0.7593307495117188, -0.7306365966796875, -0.7019424438476562, -0.673248291015625, -0.6445541381835938, -0.6158599853515625, -0.5871658325195312, -0.5584716796875, -0.5297775268554688, -0.5010833740234375, -0.47238922119140625, -0.443695068359375, -0.41500091552734375, -0.3863067626953125, -0.35761260986328125, -0.32891845703125, -0.30022430419921875, -0.2715301513671875, -0.24283599853515625, -0.214141845703125, -0.18544769287109375, -0.1567535400390625, -0.12805938720703125, -0.099365234375, -0.07067108154296875, -0.0419769287109375, -0.01328277587890625, 0.015411376953125, 0.04410552978515625, 0.0727996826171875, 0.10149383544921875, 0.13018798828125, 0.15888214111328125, 0.1875762939453125, 0.21627044677734375, 0.244964599609375, 0.27365875244140625, 0.3023529052734375, 0.33104705810546875, 0.3597412109375, 0.38843536376953125, 0.4171295166015625, 0.44582366943359375, 0.474517822265625, 0.5032119750976562, 0.5319061279296875, 0.5606002807617188, 0.58929443359375, 0.6179885864257812, 0.6466827392578125, 0.6753768920898438, 0.704071044921875, 0.7327651977539062, 0.7614593505859375, 0.7901535034179688, 0.81884765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 4.0, 12.0, 26.0, 25.0, 39.0, 64.0, 100.0, 133.0, 269.0, 407.0, 711.0, 1204.0, 2136.0, 3632.0, 6692.0, 12480.0, 24918.0, 53865.0, 134649.0, 318392.0, 283220.0, 112843.0, 45892.0, 21658.0, 11122.0, 6062.0, 3371.0, 1941.0, 1053.0, 617.0, 387.0, 252.0, 119.0, 71.0, 51.0, 29.0, 25.0, 13.0, 16.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12758255004882812, -0.12284088134765625, -0.11809921264648438, -0.1133575439453125, -0.10861587524414062, -0.10387420654296875, -0.09913253784179688, -0.094390869140625, -0.08964920043945312, -0.08490753173828125, -0.08016586303710938, -0.0754241943359375, -0.07068252563476562, -0.06594085693359375, -0.061199188232421875, -0.05645751953125, -0.051715850830078125, -0.04697418212890625, -0.042232513427734375, -0.0374908447265625, -0.032749176025390625, -0.02800750732421875, -0.023265838623046875, -0.018524169921875, -0.013782501220703125, -0.00904083251953125, -0.004299163818359375, 0.0004425048828125, 0.005184173583984375, 0.00992584228515625, 0.014667510986328125, 0.0194091796875, 0.024150848388671875, 0.02889251708984375, 0.033634185791015625, 0.0383758544921875, 0.043117523193359375, 0.04785919189453125, 0.052600860595703125, 0.057342529296875, 0.062084197998046875, 0.06682586669921875, 0.07156753540039062, 0.0763092041015625, 0.08105087280273438, 0.08579254150390625, 0.09053421020507812, 0.09527587890625, 0.10001754760742188, 0.10475921630859375, 0.10950088500976562, 0.1142425537109375, 0.11898422241210938, 0.12372589111328125, 0.12846755981445312, 0.133209228515625, 0.13795089721679688, 0.14269256591796875, 0.14743423461914062, 0.1521759033203125, 0.15691757202148438, 0.16165924072265625, 0.16640090942382812, 0.171142578125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 8.0, 7.0, 13.0, 28.0, 22.0, 29.0, 41.0, 54.0, 79.0, 106.0, 118.0, 115.0, 67.0, 71.0, 36.0, 40.0, 18.0, 21.0, 25.0, 11.0, 11.0, 8.0, 10.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.435943603515625e-05, -5.2745454013347626e-05, -5.1131471991539e-05, -4.951748996973038e-05, -4.790350794792175e-05, -4.628952592611313e-05, -4.4675543904304504e-05, -4.306156188249588e-05, -4.1447579860687256e-05, -3.983359783887863e-05, -3.821961581707001e-05, -3.660563379526138e-05, -3.499165177345276e-05, -3.3377669751644135e-05, -3.176368772983551e-05, -3.0149705708026886e-05, -2.8535723686218262e-05, -2.6921741664409637e-05, -2.5307759642601013e-05, -2.369377762079239e-05, -2.2079795598983765e-05, -2.046581357717514e-05, -1.8851831555366516e-05, -1.7237849533557892e-05, -1.5623867511749268e-05, -1.4009885489940643e-05, -1.2395903468132019e-05, -1.0781921446323395e-05, -9.16793942451477e-06, -7.553957402706146e-06, -5.939975380897522e-06, -4.325993359088898e-06, -2.7120113372802734e-06, -1.0980293154716492e-06, 5.159527063369751e-07, 2.1299347281455994e-06, 3.7439167499542236e-06, 5.357898771762848e-06, 6.971880793571472e-06, 8.585862815380096e-06, 1.019984483718872e-05, 1.1813826858997345e-05, 1.342780888080597e-05, 1.5041790902614594e-05, 1.6655772924423218e-05, 1.8269754946231842e-05, 1.9883736968040466e-05, 2.149771898984909e-05, 2.3111701011657715e-05, 2.472568303346634e-05, 2.6339665055274963e-05, 2.7953647077083588e-05, 2.9567629098892212e-05, 3.1181611120700836e-05, 3.279559314250946e-05, 3.4409575164318085e-05, 3.602355718612671e-05, 3.763753920793533e-05, 3.925152122974396e-05, 4.086550325155258e-05, 4.2479485273361206e-05, 4.409346729516983e-05, 4.5707449316978455e-05, 4.732143133878708e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 15.0, 26.0, 28.0, 49.0, 83.0, 184.0, 320.0, 746.0, 1667.0, 4879.0, 18355.0, 97942.0, 523426.0, 332200.0, 52059.0, 10959.0, 3209.0, 1235.0, 541.0, 275.0, 129.0, 87.0, 59.0, 21.0, 15.0, 5.0, 6.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.254638671875, -0.24548721313476562, -0.23633575439453125, -0.22718429565429688, -0.2180328369140625, -0.20888137817382812, -0.19972991943359375, -0.19057846069335938, -0.181427001953125, -0.17227554321289062, -0.16312408447265625, -0.15397262573242188, -0.1448211669921875, -0.13566970825195312, -0.12651824951171875, -0.11736679077148438, -0.10821533203125, -0.09906387329101562, -0.08991241455078125, -0.08076095581054688, -0.0716094970703125, -0.062458038330078125, -0.05330657958984375, -0.044155120849609375, -0.035003662109375, -0.025852203369140625, -0.01670074462890625, -0.007549285888671875, 0.0016021728515625, 0.010753631591796875, 0.01990509033203125, 0.029056549072265625, 0.0382080078125, 0.047359466552734375, 0.05651092529296875, 0.06566238403320312, 0.0748138427734375, 0.08396530151367188, 0.09311676025390625, 0.10226821899414062, 0.111419677734375, 0.12057113647460938, 0.12972259521484375, 0.13887405395507812, 0.1480255126953125, 0.15717697143554688, 0.16632843017578125, 0.17547988891601562, 0.18463134765625, 0.19378280639648438, 0.20293426513671875, 0.21208572387695312, 0.2212371826171875, 0.23038864135742188, 0.23954010009765625, 0.24869155883789062, 0.257843017578125, 0.2669944763183594, 0.27614593505859375, 0.2852973937988281, 0.2944488525390625, 0.3036003112792969, 0.31275177001953125, 0.3219032287597656, 0.3310546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 2.0, 10.0, 14.0, 17.0, 24.0, 25.0, 31.0, 57.0, 56.0, 70.0, 109.0, 98.0, 93.0, 90.0, 66.0, 53.0, 38.0, 29.0, 20.0, 22.0, 12.0, 9.0, 10.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1761474609375, -0.1687145233154297, -0.16128158569335938, -0.15384864807128906, -0.14641571044921875, -0.13898277282714844, -0.13154983520507812, -0.12411689758300781, -0.1166839599609375, -0.10925102233886719, -0.10181808471679688, -0.09438514709472656, -0.08695220947265625, -0.07951927185058594, -0.07208633422851562, -0.06465339660644531, -0.057220458984375, -0.04978752136230469, -0.042354583740234375, -0.03492164611816406, -0.02748870849609375, -0.020055770874023438, -0.012622833251953125, -0.0051898956298828125, 0.0022430419921875, 0.009675979614257812, 0.017108917236328125, 0.024541854858398438, 0.03197479248046875, 0.03940773010253906, 0.046840667724609375, 0.05427360534667969, 0.06170654296875, 0.06913948059082031, 0.07657241821289062, 0.08400535583496094, 0.09143829345703125, 0.09887123107910156, 0.10630416870117188, 0.11373710632324219, 0.1211700439453125, 0.1286029815673828, 0.13603591918945312, 0.14346885681152344, 0.15090179443359375, 0.15833473205566406, 0.16576766967773438, 0.1732006072998047, 0.180633544921875, 0.1880664825439453, 0.19549942016601562, 0.20293235778808594, 0.21036529541015625, 0.21779823303222656, 0.22523117065429688, 0.2326641082763672, 0.2400970458984375, 0.2475299835205078, 0.2549629211425781, 0.26239585876464844, 0.26982879638671875, 0.27726173400878906, 0.2846946716308594, 0.2921276092529297, 0.299560546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 21.0, 50.0, 86.0, 143.0, 163.0, 171.0, 159.0, 90.0, 50.0, 21.0, 13.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.850337982177734, -4.73552131652832, -4.6207051277160645, -4.50588846206665, -4.3910722732543945, -4.2762556076049805, -4.161438941955566, -4.0466227531433105, -3.9318060874938965, -3.8169896602630615, -3.7021732330322266, -3.5873565673828125, -3.4725401401519775, -3.3577237129211426, -3.2429072856903076, -3.1280908584594727, -3.0132744312286377, -2.8984580039978027, -2.7836415767669678, -2.668825149536133, -2.5540084838867188, -2.439192056655884, -2.324375629425049, -2.209559202194214, -2.094742774963379, -1.979926347732544, -1.8651098012924194, -1.7502933740615845, -1.63547682762146, -1.520660400390625, -1.40584397315979, -1.291027545928955, -1.176210641860962, -1.061394214630127, -0.9465776681900024, -0.8317612409591675, -0.7169447541236877, -0.602128267288208, -0.48731184005737305, -0.3724953532218933, -0.2576788663864136, -0.14286239445209503, -0.02804592251777649, 0.08677053451538086, 0.2015870213508606, 0.31640350818634033, 0.4312199354171753, 0.546036422252655, 0.6608529090881348, 0.7756693959236145, 0.8904858827590942, 1.0053023099899292, 1.1201188564300537, 1.2349352836608887, 1.3497517108917236, 1.4645681381225586, 1.579384684562683, 1.694201111793518, 1.8090176582336426, 1.9238340854644775, 2.0386505126953125, 2.1534671783447266, 2.2682833671569824, 2.3831000328063965, 2.4979164600372314]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 11.0, 9.0, 7.0, 10.0, 10.0, 18.0, 16.0, 15.0, 24.0, 22.0, 18.0, 41.0, 39.0, 43.0, 27.0, 41.0, 46.0, 40.0, 52.0, 38.0, 28.0, 40.0, 43.0, 38.0, 33.0, 37.0, 28.0, 30.0, 25.0, 25.0, 21.0, 16.0, 26.0, 15.0, 16.0, 9.0, 11.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.1224443912506104, -2.06425142288208, -2.00605845451355, -1.947865605354309, -1.8896727561950684, -1.831479787826538, -1.7732868194580078, -1.7150938510894775, -1.6569010019302368, -1.5987080335617065, -1.5405151844024658, -1.4823222160339355, -1.4241292476654053, -1.3659363985061646, -1.3077434301376343, -1.2495505809783936, -1.1913576126098633, -1.133164644241333, -1.0749717950820923, -1.016778826713562, -0.9585859179496765, -0.900393009185791, -0.8422000408172607, -0.7840071320533752, -0.7258142232894897, -0.6676213145256042, -0.6094284057617188, -0.5512354373931885, -0.493042528629303, -0.4348496198654175, -0.3766566812992096, -0.3184637427330017, -0.2602708339691162, -0.20207791030406952, -0.14388498663902283, -0.08569206297397614, -0.027499139308929443, 0.030693769454956055, 0.08888670802116394, 0.14707964658737183, 0.20527255535125732, 0.2634654641151428, 0.3216584026813507, 0.3798513412475586, 0.4380442500114441, 0.4962371587753296, 0.5544301271438599, 0.6126230359077454, 0.6708159446716309, 0.7290088534355164, 0.7872017621994019, 0.8453947305679321, 0.9035876393318176, 0.9617805480957031, 1.0199735164642334, 1.0781664848327637, 1.1363593339920044, 1.1945523023605347, 1.2527451515197754, 1.3109381198883057, 1.369131088256836, 1.4273239374160767, 1.485516905784607, 1.5437097549438477, 1.601902723312378]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 20.0, 21.0, 43.0, 68.0, 101.0, 168.0, 278.0, 491.0, 980.0, 1847.0, 3674.0, 7673.0, 16368.0, 38138.0, 103168.0, 320208.0, 955024.0, 1499753.0, 823007.0, 273107.0, 89290.0, 33157.0, 14056.0, 6750.0, 3168.0, 1647.0, 906.0, 452.0, 264.0, 171.0, 90.0, 61.0, 42.0, 30.0, 16.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.268310546875, -0.259490966796875, -0.25067138671875, -0.241851806640625, -0.2330322265625, -0.224212646484375, -0.21539306640625, -0.206573486328125, -0.19775390625, -0.188934326171875, -0.18011474609375, -0.171295166015625, -0.1624755859375, -0.153656005859375, -0.14483642578125, -0.136016845703125, -0.127197265625, -0.118377685546875, -0.10955810546875, -0.100738525390625, -0.0919189453125, -0.083099365234375, -0.07427978515625, -0.065460205078125, -0.056640625, -0.047821044921875, -0.03900146484375, -0.030181884765625, -0.0213623046875, -0.012542724609375, -0.00372314453125, 0.005096435546875, 0.013916015625, 0.022735595703125, 0.03155517578125, 0.040374755859375, 0.0491943359375, 0.058013916015625, 0.06683349609375, 0.075653076171875, 0.08447265625, 0.093292236328125, 0.10211181640625, 0.110931396484375, 0.1197509765625, 0.128570556640625, 0.13739013671875, 0.146209716796875, 0.155029296875, 0.163848876953125, 0.17266845703125, 0.181488037109375, 0.1903076171875, 0.199127197265625, 0.20794677734375, 0.216766357421875, 0.2255859375, 0.234405517578125, 0.24322509765625, 0.252044677734375, 0.2608642578125, 0.269683837890625, 0.27850341796875, 0.287322998046875, 0.296142578125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 1.0, 7.0, 8.0, 10.0, 10.0, 5.0, 14.0, 18.0, 15.0, 11.0, 22.0, 22.0, 29.0, 40.0, 37.0, 39.0, 55.0, 43.0, 40.0, 55.0, 43.0, 44.0, 54.0, 43.0, 29.0, 42.0, 41.0, 35.0, 36.0, 26.0, 21.0, 26.0, 7.0, 15.0, 8.0, 11.0, 12.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.273681640625, -0.2649574279785156, -0.25623321533203125, -0.24750900268554688, -0.2387847900390625, -0.23006057739257812, -0.22133636474609375, -0.21261215209960938, -0.203887939453125, -0.19516372680664062, -0.18643951416015625, -0.17771530151367188, -0.1689910888671875, -0.16026687622070312, -0.15154266357421875, -0.14281845092773438, -0.13409423828125, -0.12537002563476562, -0.11664581298828125, -0.10792160034179688, -0.0991973876953125, -0.09047317504882812, -0.08174896240234375, -0.07302474975585938, -0.064300537109375, -0.055576324462890625, -0.04685211181640625, -0.038127899169921875, -0.0294036865234375, -0.020679473876953125, -0.01195526123046875, -0.003231048583984375, 0.0054931640625, 0.014217376708984375, 0.02294158935546875, 0.031665802001953125, 0.0403900146484375, 0.049114227294921875, 0.05783843994140625, 0.06656265258789062, 0.075286865234375, 0.08401107788085938, 0.09273529052734375, 0.10145950317382812, 0.1101837158203125, 0.11890792846679688, 0.12763214111328125, 0.13635635375976562, 0.14508056640625, 0.15380477905273438, 0.16252899169921875, 0.17125320434570312, 0.1799774169921875, 0.18870162963867188, 0.19742584228515625, 0.20615005493164062, 0.214874267578125, 0.22359848022460938, 0.23232269287109375, 0.24104690551757812, 0.2497711181640625, 0.2584953308105469, 0.26721954345703125, 0.2759437561035156, 0.28466796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 8.0, 9.0, 21.0, 32.0, 43.0, 69.0, 126.0, 216.0, 377.0, 783.0, 1700.0, 4572.0, 15863.0, 76785.0, 552122.0, 2970068.0, 477508.0, 70983.0, 15287.0, 4420.0, 1718.0, 714.0, 377.0, 203.0, 95.0, 59.0, 33.0, 29.0, 24.0, 12.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5771484375, -0.5553436279296875, -0.533538818359375, -0.5117340087890625, -0.48992919921875, -0.4681243896484375, -0.446319580078125, -0.4245147705078125, -0.4027099609375, -0.3809051513671875, -0.359100341796875, -0.3372955322265625, -0.31549072265625, -0.2936859130859375, -0.271881103515625, -0.2500762939453125, -0.228271484375, -0.2064666748046875, -0.184661865234375, -0.1628570556640625, -0.14105224609375, -0.1192474365234375, -0.097442626953125, -0.0756378173828125, -0.0538330078125, -0.0320281982421875, -0.010223388671875, 0.0115814208984375, 0.03338623046875, 0.0551910400390625, 0.076995849609375, 0.0988006591796875, 0.12060546875, 0.1424102783203125, 0.164215087890625, 0.1860198974609375, 0.20782470703125, 0.2296295166015625, 0.251434326171875, 0.2732391357421875, 0.2950439453125, 0.3168487548828125, 0.338653564453125, 0.3604583740234375, 0.38226318359375, 0.4040679931640625, 0.425872802734375, 0.4476776123046875, 0.469482421875, 0.4912872314453125, 0.513092041015625, 0.5348968505859375, 0.55670166015625, 0.5785064697265625, 0.600311279296875, 0.6221160888671875, 0.6439208984375, 0.6657257080078125, 0.687530517578125, 0.7093353271484375, 0.73114013671875, 0.7529449462890625, 0.774749755859375, 0.7965545654296875, 0.818359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 12.0, 24.0, 22.0, 42.0, 55.0, 68.0, 110.0, 157.0, 261.0, 511.0, 653.0, 646.0, 519.0, 312.0, 220.0, 129.0, 94.0, 66.0, 38.0, 32.0, 30.0, 23.0, 12.0, 11.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8173828125, -0.796478271484375, -0.77557373046875, -0.754669189453125, -0.7337646484375, -0.712860107421875, -0.69195556640625, -0.671051025390625, -0.650146484375, -0.629241943359375, -0.60833740234375, -0.587432861328125, -0.5665283203125, -0.545623779296875, -0.52471923828125, -0.503814697265625, -0.48291015625, -0.462005615234375, -0.44110107421875, -0.420196533203125, -0.3992919921875, -0.378387451171875, -0.35748291015625, -0.336578369140625, -0.315673828125, -0.294769287109375, -0.27386474609375, -0.252960205078125, -0.2320556640625, -0.211151123046875, -0.19024658203125, -0.169342041015625, -0.1484375, -0.127532958984375, -0.10662841796875, -0.085723876953125, -0.0648193359375, -0.043914794921875, -0.02301025390625, -0.002105712890625, 0.018798828125, 0.039703369140625, 0.06060791015625, 0.081512451171875, 0.1024169921875, 0.123321533203125, 0.14422607421875, 0.165130615234375, 0.18603515625, 0.206939697265625, 0.22784423828125, 0.248748779296875, 0.2696533203125, 0.290557861328125, 0.31146240234375, 0.332366943359375, 0.353271484375, 0.374176025390625, 0.39508056640625, 0.415985107421875, 0.4368896484375, 0.457794189453125, 0.47869873046875, 0.499603271484375, 0.5205078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 24.0, 89.0, 224.0, 330.0, 217.0, 62.0, 30.0, 11.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.941411972045898, -5.68803071975708, -5.43464994430542, -5.181268692016602, -4.927887916564941, -4.674506664276123, -4.421125411987305, -4.1677446365356445, -3.914363384246826, -3.660982370376587, -3.4076013565063477, -3.1542201042175293, -2.90083909034729, -2.647458076477051, -2.3940768241882324, -2.140695810317993, -1.887314796447754, -1.6339337825775146, -1.3805526494979858, -1.127171516418457, -0.8737905025482178, -0.6204094886779785, -0.3670283555984497, -0.1136472225189209, 0.13973379135131836, 0.3931148648262024, 0.6464959383010864, 0.8998770117759705, 1.1532580852508545, 1.4066390991210938, 1.6600202322006226, 1.9134013652801514, 2.166783332824707, 2.4201643466949463, 2.6735453605651855, 2.926926612854004, 3.180307626724243, 3.4336886405944824, 3.687069892883301, 3.94045090675354, 4.193831920623779, 4.447213172912598, 4.700593948364258, 4.953975200653076, 5.2073564529418945, 5.460737228393555, 5.714118480682373, 5.967499732971191, 6.220880508422852, 6.47426176071167, 6.72764253616333, 6.981023788452148, 7.234404563903809, 7.487785816192627, 7.741167068481445, 7.9945478439331055, 8.247928619384766, 8.501309394836426, 8.754691123962402, 9.008071899414062, 9.261452674865723, 9.514833450317383, 9.76821517944336, 10.02159595489502, 10.274977684020996]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 12.0, 13.0, 11.0, 14.0, 14.0, 20.0, 18.0, 16.0, 17.0, 28.0, 35.0, 32.0, 42.0, 44.0, 44.0, 56.0, 43.0, 46.0, 57.0, 52.0, 26.0, 37.0, 27.0, 30.0, 33.0, 35.0, 26.0, 26.0, 27.0, 21.0, 17.0, 10.0, 17.0, 12.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5471638441085815, -1.4908968210220337, -1.4346296787261963, -1.3783626556396484, -1.3220956325531006, -1.2658284902572632, -1.2095614671707153, -1.153294324874878, -1.09702730178833, -1.0407602787017822, -0.9844931364059448, -0.928226113319397, -0.8719590306282043, -0.8156919479370117, -0.7594249248504639, -0.7031578421592712, -0.6468907594680786, -0.590623676776886, -0.5343565940856934, -0.4780895709991455, -0.4218224883079529, -0.36555540561676025, -0.30928835272789, -0.2530212998390198, -0.19675421714782715, -0.14048714935779572, -0.08422008156776428, -0.02795301377773285, 0.028314054012298584, 0.08458113670349121, 0.14084818959236145, 0.1971152424812317, 0.25338244438171387, 0.3096495270729065, 0.36591657996177673, 0.422183632850647, 0.4784507155418396, 0.5347177982330322, 0.5909848213195801, 0.6472519040107727, 0.7035189867019653, 0.759786069393158, 0.8160531520843506, 0.8723201751708984, 0.9285872578620911, 0.9848543405532837, 1.0411213636398315, 1.097388505935669, 1.1536555290222168, 1.2099225521087646, 1.266189694404602, 1.32245671749115, 1.3787238597869873, 1.4349908828735352, 1.491257905960083, 1.5475249290466309, 1.6037920713424683, 1.6600590944290161, 1.7163262367248535, 1.7725932598114014, 1.8288602828979492, 1.8851274251937866, 1.9413944482803345, 1.9976615905761719, 2.0539286136627197]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 8.0, 16.0, 23.0, 24.0, 34.0, 53.0, 71.0, 121.0, 167.0, 298.0, 443.0, 774.0, 1257.0, 2219.0, 3903.0, 7051.0, 12894.0, 24227.0, 46164.0, 83646.0, 136361.0, 185403.0, 190831.0, 147035.0, 92604.0, 51884.0, 27881.0, 14771.0, 7842.0, 4390.0, 2578.0, 1385.0, 785.0, 509.0, 299.0, 202.0, 137.0, 90.0, 53.0, 26.0, 27.0, 16.0, 10.0, 15.0, 8.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1976318359375, -0.19147491455078125, -0.1853179931640625, -0.17916107177734375, -0.173004150390625, -0.16684722900390625, -0.1606903076171875, -0.15453338623046875, -0.14837646484375, -0.14221954345703125, -0.1360626220703125, -0.12990570068359375, -0.123748779296875, -0.11759185791015625, -0.1114349365234375, -0.10527801513671875, -0.09912109375, -0.09296417236328125, -0.0868072509765625, -0.08065032958984375, -0.074493408203125, -0.06833648681640625, -0.0621795654296875, -0.05602264404296875, -0.04986572265625, -0.04370880126953125, -0.0375518798828125, -0.03139495849609375, -0.025238037109375, -0.01908111572265625, -0.0129241943359375, -0.00676727294921875, -0.0006103515625, 0.00554656982421875, 0.0117034912109375, 0.01786041259765625, 0.024017333984375, 0.03017425537109375, 0.0363311767578125, 0.04248809814453125, 0.04864501953125, 0.05480194091796875, 0.0609588623046875, 0.06711578369140625, 0.073272705078125, 0.07942962646484375, 0.0855865478515625, 0.09174346923828125, 0.097900390625, 0.10405731201171875, 0.1102142333984375, 0.11637115478515625, 0.122528076171875, 0.12868499755859375, 0.1348419189453125, 0.14099884033203125, 0.14715576171875, 0.15331268310546875, 0.1594696044921875, 0.16562652587890625, 0.171783447265625, 0.17794036865234375, 0.1840972900390625, 0.19025421142578125, 0.1964111328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 17.0, 16.0, 15.0, 19.0, 21.0, 17.0, 22.0, 45.0, 25.0, 26.0, 37.0, 43.0, 36.0, 33.0, 51.0, 42.0, 43.0, 44.0, 38.0, 37.0, 37.0, 29.0, 31.0, 35.0, 28.0, 31.0, 26.0, 32.0, 14.0, 17.0, 16.0, 12.0, 6.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.22265625, -0.215240478515625, -0.20782470703125, -0.200408935546875, -0.1929931640625, -0.185577392578125, -0.17816162109375, -0.170745849609375, -0.163330078125, -0.155914306640625, -0.14849853515625, -0.141082763671875, -0.1336669921875, -0.126251220703125, -0.11883544921875, -0.111419677734375, -0.10400390625, -0.096588134765625, -0.08917236328125, -0.081756591796875, -0.0743408203125, -0.066925048828125, -0.05950927734375, -0.052093505859375, -0.044677734375, -0.037261962890625, -0.02984619140625, -0.022430419921875, -0.0150146484375, -0.007598876953125, -0.00018310546875, 0.007232666015625, 0.0146484375, 0.022064208984375, 0.02947998046875, 0.036895751953125, 0.0443115234375, 0.051727294921875, 0.05914306640625, 0.066558837890625, 0.073974609375, 0.081390380859375, 0.08880615234375, 0.096221923828125, 0.1036376953125, 0.111053466796875, 0.11846923828125, 0.125885009765625, 0.13330078125, 0.140716552734375, 0.14813232421875, 0.155548095703125, 0.1629638671875, 0.170379638671875, 0.17779541015625, 0.185211181640625, 0.192626953125, 0.200042724609375, 0.20745849609375, 0.214874267578125, 0.2222900390625, 0.229705810546875, 0.23712158203125, 0.244537353515625, 0.251953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 4.0, 7.0, 16.0, 17.0, 23.0, 36.0, 53.0, 85.0, 100.0, 144.0, 261.0, 392.0, 634.0, 1224.0, 2270.0, 4739.0, 10126.0, 23046.0, 54012.0, 125704.0, 245870.0, 278889.0, 168015.0, 74440.0, 31467.0, 13954.0, 6294.0, 3060.0, 1532.0, 792.0, 463.0, 285.0, 188.0, 127.0, 85.0, 56.0, 40.0, 33.0, 14.0, 13.0, 10.0, 6.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.308837890625, -0.2989349365234375, -0.289031982421875, -0.2791290283203125, -0.26922607421875, -0.2593231201171875, -0.249420166015625, -0.2395172119140625, -0.2296142578125, -0.2197113037109375, -0.209808349609375, -0.1999053955078125, -0.19000244140625, -0.1800994873046875, -0.170196533203125, -0.1602935791015625, -0.150390625, -0.1404876708984375, -0.130584716796875, -0.1206817626953125, -0.11077880859375, -0.1008758544921875, -0.090972900390625, -0.0810699462890625, -0.0711669921875, -0.0612640380859375, -0.051361083984375, -0.0414581298828125, -0.03155517578125, -0.0216522216796875, -0.011749267578125, -0.0018463134765625, 0.008056640625, 0.0179595947265625, 0.027862548828125, 0.0377655029296875, 0.04766845703125, 0.0575714111328125, 0.067474365234375, 0.0773773193359375, 0.0872802734375, 0.0971832275390625, 0.107086181640625, 0.1169891357421875, 0.12689208984375, 0.1367950439453125, 0.146697998046875, 0.1566009521484375, 0.16650390625, 0.1764068603515625, 0.186309814453125, 0.1962127685546875, 0.20611572265625, 0.2160186767578125, 0.225921630859375, 0.2358245849609375, 0.2457275390625, 0.2556304931640625, 0.265533447265625, 0.2754364013671875, 0.28533935546875, 0.2952423095703125, 0.305145263671875, 0.3150482177734375, 0.324951171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 18.0, 12.0, 7.0, 16.0, 28.0, 19.0, 29.0, 32.0, 37.0, 35.0, 48.0, 41.0, 40.0, 49.0, 53.0, 55.0, 45.0, 48.0, 54.0, 42.0, 42.0, 33.0, 39.0, 30.0, 25.0, 17.0, 15.0, 20.0, 19.0, 10.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76318359375, -0.737335205078125, -0.71148681640625, -0.685638427734375, -0.6597900390625, -0.633941650390625, -0.60809326171875, -0.582244873046875, -0.556396484375, -0.530548095703125, -0.50469970703125, -0.478851318359375, -0.4530029296875, -0.427154541015625, -0.40130615234375, -0.375457763671875, -0.349609375, -0.323760986328125, -0.29791259765625, -0.272064208984375, -0.2462158203125, -0.220367431640625, -0.19451904296875, -0.168670654296875, -0.142822265625, -0.116973876953125, -0.09112548828125, -0.065277099609375, -0.0394287109375, -0.013580322265625, 0.01226806640625, 0.038116455078125, 0.06396484375, 0.089813232421875, 0.11566162109375, 0.141510009765625, 0.1673583984375, 0.193206787109375, 0.21905517578125, 0.244903564453125, 0.270751953125, 0.296600341796875, 0.32244873046875, 0.348297119140625, 0.3741455078125, 0.399993896484375, 0.42584228515625, 0.451690673828125, 0.4775390625, 0.503387451171875, 0.52923583984375, 0.555084228515625, 0.5809326171875, 0.606781005859375, 0.63262939453125, 0.658477783203125, 0.684326171875, 0.710174560546875, 0.73602294921875, 0.761871337890625, 0.7877197265625, 0.813568115234375, 0.83941650390625, 0.865264892578125, 0.89111328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 16.0, 17.0, 33.0, 51.0, 90.0, 158.0, 222.0, 438.0, 844.0, 1974.0, 4247.0, 10461.0, 25417.0, 62406.0, 142083.0, 257774.0, 268910.0, 155470.0, 68935.0, 28285.0, 11800.0, 4805.0, 2014.0, 945.0, 518.0, 253.0, 140.0, 87.0, 51.0, 30.0, 21.0, 19.0, 12.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12524032592773438, -0.12120819091796875, -0.11717605590820312, -0.1131439208984375, -0.10911178588867188, -0.10507965087890625, -0.10104751586914062, -0.097015380859375, -0.09298324584960938, -0.08895111083984375, -0.08491897583007812, -0.0808868408203125, -0.07685470581054688, -0.07282257080078125, -0.06879043579101562, -0.06475830078125, -0.060726165771484375, -0.05669403076171875, -0.052661895751953125, -0.0486297607421875, -0.044597625732421875, -0.04056549072265625, -0.036533355712890625, -0.032501220703125, -0.028469085693359375, -0.02443695068359375, -0.020404815673828125, -0.0163726806640625, -0.012340545654296875, -0.00830841064453125, -0.004276275634765625, -0.000244140625, 0.003787994384765625, 0.00782012939453125, 0.011852264404296875, 0.0158843994140625, 0.019916534423828125, 0.02394866943359375, 0.027980804443359375, 0.032012939453125, 0.036045074462890625, 0.04007720947265625, 0.044109344482421875, 0.0481414794921875, 0.052173614501953125, 0.05620574951171875, 0.060237884521484375, 0.06427001953125, 0.06830215454101562, 0.07233428955078125, 0.07636642456054688, 0.0803985595703125, 0.08443069458007812, 0.08846282958984375, 0.09249496459960938, 0.096527099609375, 0.10055923461914062, 0.10459136962890625, 0.10862350463867188, 0.1126556396484375, 0.11668777465820312, 0.12071990966796875, 0.12475204467773438, 0.1287841796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 11.0, 15.0, 16.0, 19.0, 26.0, 22.0, 22.0, 27.0, 35.0, 44.0, 43.0, 62.0, 68.0, 65.0, 58.0, 63.0, 59.0, 43.0, 39.0, 33.0, 29.0, 29.0, 21.0, 17.0, 25.0, 17.0, 15.0, 10.0, 6.0, 4.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.24249267578125e-05, -3.149546682834625e-05, -3.0566006898880005e-05, -2.9636546969413757e-05, -2.870708703994751e-05, -2.7777627110481262e-05, -2.6848167181015015e-05, -2.5918707251548767e-05, -2.498924732208252e-05, -2.4059787392616272e-05, -2.3130327463150024e-05, -2.2200867533683777e-05, -2.127140760421753e-05, -2.0341947674751282e-05, -1.9412487745285034e-05, -1.8483027815818787e-05, -1.755356788635254e-05, -1.662410795688629e-05, -1.5694648027420044e-05, -1.4765188097953796e-05, -1.3835728168487549e-05, -1.2906268239021301e-05, -1.1976808309555054e-05, -1.1047348380088806e-05, -1.0117888450622559e-05, -9.188428521156311e-06, -8.258968591690063e-06, -7.329508662223816e-06, -6.400048732757568e-06, -5.470588803291321e-06, -4.541128873825073e-06, -3.6116689443588257e-06, -2.682209014892578e-06, -1.7527490854263306e-06, -8.23289155960083e-07, 1.0617077350616455e-07, 1.0356307029724121e-06, 1.9650906324386597e-06, 2.8945505619049072e-06, 3.824010491371155e-06, 4.753470420837402e-06, 5.68293035030365e-06, 6.6123902797698975e-06, 7.541850209236145e-06, 8.471310138702393e-06, 9.40077006816864e-06, 1.0330229997634888e-05, 1.1259689927101135e-05, 1.2189149856567383e-05, 1.311860978603363e-05, 1.4048069715499878e-05, 1.4977529644966125e-05, 1.5906989574432373e-05, 1.683644950389862e-05, 1.7765909433364868e-05, 1.8695369362831116e-05, 1.9624829292297363e-05, 2.055428922176361e-05, 2.148374915122986e-05, 2.2413209080696106e-05, 2.3342669010162354e-05, 2.42721289396286e-05, 2.520158886909485e-05, 2.6131048798561096e-05, 2.7060508728027344e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 12.0, 13.0, 20.0, 27.0, 46.0, 71.0, 102.0, 175.0, 290.0, 500.0, 837.0, 1574.0, 2860.0, 6267.0, 13975.0, 31620.0, 68701.0, 140288.0, 224693.0, 238841.0, 162201.0, 84044.0, 38735.0, 16966.0, 7840.0, 3716.0, 1782.0, 994.0, 491.0, 341.0, 178.0, 96.0, 68.0, 55.0, 42.0, 25.0, 18.0, 15.0, 9.0, 8.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10321044921875, -0.09978485107421875, -0.0963592529296875, -0.09293365478515625, -0.089508056640625, -0.08608245849609375, -0.0826568603515625, -0.07923126220703125, -0.0758056640625, -0.07238006591796875, -0.0689544677734375, -0.06552886962890625, -0.062103271484375, -0.05867767333984375, -0.0552520751953125, -0.05182647705078125, -0.04840087890625, -0.04497528076171875, -0.0415496826171875, -0.03812408447265625, -0.034698486328125, -0.03127288818359375, -0.0278472900390625, -0.02442169189453125, -0.02099609375, -0.01757049560546875, -0.0141448974609375, -0.01071929931640625, -0.007293701171875, -0.00386810302734375, -0.0004425048828125, 0.00298309326171875, 0.00640869140625, 0.00983428955078125, 0.0132598876953125, 0.01668548583984375, 0.020111083984375, 0.02353668212890625, 0.0269622802734375, 0.03038787841796875, 0.0338134765625, 0.03723907470703125, 0.0406646728515625, 0.04409027099609375, 0.047515869140625, 0.05094146728515625, 0.0543670654296875, 0.05779266357421875, 0.06121826171875, 0.06464385986328125, 0.0680694580078125, 0.07149505615234375, 0.074920654296875, 0.07834625244140625, 0.0817718505859375, 0.08519744873046875, 0.088623046875, 0.09204864501953125, 0.0954742431640625, 0.09889984130859375, 0.102325439453125, 0.10575103759765625, 0.1091766357421875, 0.11260223388671875, 0.11602783203125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 13.0, 11.0, 13.0, 28.0, 30.0, 33.0, 28.0, 37.0, 41.0, 61.0, 79.0, 56.0, 75.0, 60.0, 60.0, 61.0, 47.0, 57.0, 37.0, 26.0, 24.0, 28.0, 19.0, 14.0, 13.0, 13.0, 11.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11631488800048828, -0.11184120178222656, -0.10736751556396484, -0.10289382934570312, -0.0984201431274414, -0.09394645690917969, -0.08947277069091797, -0.08499908447265625, -0.08052539825439453, -0.07605171203613281, -0.0715780258178711, -0.06710433959960938, -0.06263065338134766, -0.05815696716308594, -0.05368328094482422, -0.0492095947265625, -0.04473590850830078, -0.04026222229003906, -0.035788536071777344, -0.031314849853515625, -0.026841163635253906, -0.022367477416992188, -0.01789379119873047, -0.01342010498046875, -0.008946418762207031, -0.0044727325439453125, 9.5367431640625e-07, 0.004474639892578125, 0.008948326110839844, 0.013422012329101562, 0.01789569854736328, 0.022369384765625, 0.02684307098388672, 0.03131675720214844, 0.035790443420410156, 0.040264129638671875, 0.044737815856933594, 0.04921150207519531, 0.05368518829345703, 0.05815887451171875, 0.06263256072998047, 0.06710624694824219, 0.0715799331665039, 0.07605361938476562, 0.08052730560302734, 0.08500099182128906, 0.08947467803955078, 0.0939483642578125, 0.09842205047607422, 0.10289573669433594, 0.10736942291259766, 0.11184310913085938, 0.1163167953491211, 0.12079048156738281, 0.12526416778564453, 0.12973785400390625, 0.13421154022216797, 0.1386852264404297, 0.1431589126586914, 0.14763259887695312, 0.15210628509521484, 0.15657997131347656, 0.16105365753173828, 0.16552734375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 24.0, 116.0, 307.0, 379.0, 121.0, 36.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.563634872436523, -9.376860618591309, -9.190086364746094, -9.003311157226562, -8.816536903381348, -8.629762649536133, -8.442988395690918, -8.256214141845703, -8.069439888000488, -7.882665634155273, -7.6958909034729, -7.5091166496276855, -7.322342395782471, -7.135567665100098, -6.948793411254883, -6.762019157409668, -6.575244426727295, -6.38847017288208, -6.201695442199707, -6.014921188354492, -5.828146934509277, -5.6413726806640625, -5.4545979499816895, -5.267823696136475, -5.081048965454102, -4.894274711608887, -4.707499980926514, -4.520725727081299, -4.333951473236084, -4.147176742553711, -3.960402488708496, -3.7736282348632812, -3.586853504180908, -3.4000790119171143, -3.2133047580718994, -3.0265302658081055, -2.8397560119628906, -2.6529815196990967, -2.4662070274353027, -2.279432773590088, -2.092658281326294, -1.9058839082717896, -1.7191095352172852, -1.5323350429534912, -1.3455606698989868, -1.1587862968444824, -0.9720118045806885, -0.7852374315261841, -0.5984630584716797, -0.4116886556148529, -0.22491425275802612, -0.03813982009887695, 0.14863455295562744, 0.33540892601013184, 0.5221834182739258, 0.7089577913284302, 0.8957321643829346, 1.082506537437439, 1.2692809104919434, 1.4560554027557373, 1.6428297758102417, 1.829604148864746, 2.01637864112854, 2.203153133392334, 2.389927387237549]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 8.0, 1.0, 8.0, 4.0, 7.0, 5.0, 8.0, 16.0, 13.0, 12.0, 20.0, 16.0, 24.0, 34.0, 32.0, 25.0, 46.0, 38.0, 36.0, 50.0, 31.0, 36.0, 35.0, 38.0, 45.0, 46.0, 40.0, 43.0, 30.0, 29.0, 23.0, 26.0, 31.0, 32.0, 8.0, 16.0, 15.0, 13.0, 6.0, 13.0, 11.0, 5.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7588622570037842, -1.7036851644515991, -1.648508071899414, -1.593330979347229, -1.538153886795044, -1.4829769134521484, -1.4277997016906738, -1.3726227283477783, -1.3174456357955933, -1.2622685432434082, -1.2070914506912231, -1.151914358139038, -1.096737265586853, -1.041560173034668, -0.9863831400871277, -0.9312061071395874, -0.8760289549827576, -0.8208518624305725, -0.7656747698783875, -0.7104977369308472, -0.6553206443786621, -0.600143551826477, -0.544966459274292, -0.4897893965244293, -0.43461230397224426, -0.3794352114200592, -0.32425814867019653, -0.2690810561180115, -0.2139039784669876, -0.15872690081596375, -0.10354980826377869, -0.048372745513916016, 0.006804347038269043, 0.061981428414583206, 0.11715850979089737, 0.17233559489250183, 0.2275126725435257, 0.28268975019454956, 0.3378668427467346, 0.3930439054965973, 0.44822099804878235, 0.503398060798645, 0.5585751533508301, 0.6137522459030151, 0.6689293384552002, 0.7241064310073853, 0.7792835235595703, 0.8344605565071106, 0.8896376490592957, 0.9448147416114807, 0.9999918341636658, 1.055168867111206, 1.1103459596633911, 1.1655230522155762, 1.2207001447677612, 1.2758772373199463, 1.3310543298721313, 1.3862314224243164, 1.4414085149765015, 1.4965856075286865, 1.5517627000808716, 1.6069397926330566, 1.6621167659759521, 1.7172938585281372, 1.7724709510803223]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 3.0, 13.0, 18.0, 27.0, 40.0, 59.0, 65.0, 129.0, 206.0, 355.0, 550.0, 960.0, 1633.0, 3062.0, 6122.0, 13583.0, 34543.0, 105549.0, 342657.0, 949761.0, 1439213.0, 848264.0, 298064.0, 93071.0, 31694.0, 12226.0, 5613.0, 2916.0, 1594.0, 859.0, 520.0, 301.0, 208.0, 120.0, 86.0, 68.0, 32.0, 30.0, 23.0, 15.0, 11.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2452392578125, -0.2371807098388672, -0.22912216186523438, -0.22106361389160156, -0.21300506591796875, -0.20494651794433594, -0.19688796997070312, -0.1888294219970703, -0.1807708740234375, -0.1727123260498047, -0.16465377807617188, -0.15659523010253906, -0.14853668212890625, -0.14047813415527344, -0.13241958618164062, -0.12436103820800781, -0.116302490234375, -0.10824394226074219, -0.10018539428710938, -0.09212684631347656, -0.08406829833984375, -0.07600975036621094, -0.06795120239257812, -0.05989265441894531, -0.0518341064453125, -0.04377555847167969, -0.035717010498046875, -0.027658462524414062, -0.01959991455078125, -0.011541366577148438, -0.003482818603515625, 0.0045757293701171875, 0.01263427734375, 0.020692825317382812, 0.028751373291015625, 0.03680992126464844, 0.04486846923828125, 0.05292701721191406, 0.060985565185546875, 0.06904411315917969, 0.0771026611328125, 0.08516120910644531, 0.09321975708007812, 0.10127830505371094, 0.10933685302734375, 0.11739540100097656, 0.12545394897460938, 0.1335124969482422, 0.141571044921875, 0.1496295928955078, 0.15768814086914062, 0.16574668884277344, 0.17380523681640625, 0.18186378479003906, 0.18992233276367188, 0.1979808807373047, 0.2060394287109375, 0.2140979766845703, 0.22215652465820312, 0.23021507263183594, 0.23827362060546875, 0.24633216857910156, 0.2543907165527344, 0.2624492645263672, 0.2705078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 6.0, 6.0, 9.0, 14.0, 17.0, 13.0, 15.0, 25.0, 28.0, 24.0, 29.0, 32.0, 29.0, 36.0, 38.0, 34.0, 41.0, 30.0, 49.0, 47.0, 40.0, 49.0, 46.0, 38.0, 29.0, 47.0, 39.0, 16.0, 27.0, 29.0, 20.0, 14.0, 15.0, 12.0, 12.0, 6.0, 8.0, 5.0, 5.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2762947082519531, -0.26767730712890625, -0.2590599060058594, -0.2504425048828125, -0.24182510375976562, -0.23320770263671875, -0.22459030151367188, -0.215972900390625, -0.20735549926757812, -0.19873809814453125, -0.19012069702148438, -0.1815032958984375, -0.17288589477539062, -0.16426849365234375, -0.15565109252929688, -0.14703369140625, -0.13841629028320312, -0.12979888916015625, -0.12118148803710938, -0.1125640869140625, -0.10394668579101562, -0.09532928466796875, -0.08671188354492188, -0.078094482421875, -0.06947708129882812, -0.06085968017578125, -0.052242279052734375, -0.0436248779296875, -0.035007476806640625, -0.02639007568359375, -0.017772674560546875, -0.0091552734375, -0.000537872314453125, 0.00807952880859375, 0.016696929931640625, 0.0253143310546875, 0.033931732177734375, 0.04254913330078125, 0.051166534423828125, 0.059783935546875, 0.06840133666992188, 0.07701873779296875, 0.08563613891601562, 0.0942535400390625, 0.10287094116210938, 0.11148834228515625, 0.12010574340820312, 0.12872314453125, 0.13734054565429688, 0.14595794677734375, 0.15457534790039062, 0.1631927490234375, 0.17181015014648438, 0.18042755126953125, 0.18904495239257812, 0.197662353515625, 0.20627975463867188, 0.21489715576171875, 0.22351455688476562, 0.2321319580078125, 0.24074935913085938, 0.24936676025390625, 0.2579841613769531, 0.2666015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 12.0, 27.0, 29.0, 36.0, 77.0, 116.0, 200.0, 348.0, 696.0, 1380.0, 3128.0, 8312.0, 25421.0, 96514.0, 541629.0, 2671361.0, 685869.0, 113715.0, 29281.0, 9300.0, 3552.0, 1507.0, 740.0, 392.0, 255.0, 112.0, 101.0, 59.0, 31.0, 21.0, 14.0, 12.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488037109375, -0.47304534912109375, -0.4580535888671875, -0.44306182861328125, -0.428070068359375, -0.41307830810546875, -0.3980865478515625, -0.38309478759765625, -0.36810302734375, -0.35311126708984375, -0.3381195068359375, -0.32312774658203125, -0.308135986328125, -0.29314422607421875, -0.2781524658203125, -0.26316070556640625, -0.2481689453125, -0.23317718505859375, -0.2181854248046875, -0.20319366455078125, -0.188201904296875, -0.17321014404296875, -0.1582183837890625, -0.14322662353515625, -0.12823486328125, -0.11324310302734375, -0.0982513427734375, -0.08325958251953125, -0.068267822265625, -0.05327606201171875, -0.0382843017578125, -0.02329254150390625, -0.00830078125, 0.00669097900390625, 0.0216827392578125, 0.03667449951171875, 0.051666259765625, 0.06665802001953125, 0.0816497802734375, 0.09664154052734375, 0.11163330078125, 0.12662506103515625, 0.1416168212890625, 0.15660858154296875, 0.171600341796875, 0.18659210205078125, 0.2015838623046875, 0.21657562255859375, 0.2315673828125, 0.24655914306640625, 0.2615509033203125, 0.27654266357421875, 0.291534423828125, 0.30652618408203125, 0.3215179443359375, 0.33650970458984375, 0.35150146484375, 0.36649322509765625, 0.3814849853515625, 0.39647674560546875, 0.411468505859375, 0.42646026611328125, 0.4414520263671875, 0.45644378662109375, 0.471435546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 8.0, 8.0, 16.0, 15.0, 16.0, 32.0, 32.0, 50.0, 82.0, 85.0, 160.0, 234.0, 370.0, 495.0, 574.0, 499.0, 446.0, 258.0, 172.0, 136.0, 104.0, 62.0, 44.0, 50.0, 24.0, 19.0, 16.0, 12.0, 11.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42724609375, -0.412872314453125, -0.39849853515625, -0.384124755859375, -0.3697509765625, -0.355377197265625, -0.34100341796875, -0.326629638671875, -0.312255859375, -0.297882080078125, -0.28350830078125, -0.269134521484375, -0.2547607421875, -0.240386962890625, -0.22601318359375, -0.211639404296875, -0.197265625, -0.182891845703125, -0.16851806640625, -0.154144287109375, -0.1397705078125, -0.125396728515625, -0.11102294921875, -0.096649169921875, -0.082275390625, -0.067901611328125, -0.05352783203125, -0.039154052734375, -0.0247802734375, -0.010406494140625, 0.00396728515625, 0.018341064453125, 0.03271484375, 0.047088623046875, 0.06146240234375, 0.075836181640625, 0.0902099609375, 0.104583740234375, 0.11895751953125, 0.133331298828125, 0.147705078125, 0.162078857421875, 0.17645263671875, 0.190826416015625, 0.2052001953125, 0.219573974609375, 0.23394775390625, 0.248321533203125, 0.2626953125, 0.277069091796875, 0.29144287109375, 0.305816650390625, 0.3201904296875, 0.334564208984375, 0.34893798828125, 0.363311767578125, 0.377685546875, 0.392059326171875, 0.40643310546875, 0.420806884765625, 0.4351806640625, 0.449554443359375, 0.46392822265625, 0.478302001953125, 0.49267578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 20.0, 38.0, 70.0, 75.0, 122.0, 149.0, 151.0, 134.0, 86.0, 56.0, 36.0, 22.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.725496292114258, -3.6404967308044434, -3.555497169494629, -3.4704978466033936, -3.385498285293579, -3.3004987239837646, -3.21549916267395, -3.130499839782715, -3.0455002784729004, -2.960500717163086, -2.8755011558532715, -2.790501832962036, -2.7055022716522217, -2.6205027103424072, -2.5355031490325928, -2.4505038261413574, -2.365504264831543, -2.2805047035217285, -2.195505142211914, -2.1105058193206787, -2.0255062580108643, -1.9405066967010498, -1.8555071353912354, -1.7705076932907104, -1.6855080127716064, -1.600508451461792, -1.515509009361267, -1.4305094480514526, -1.3455100059509277, -1.2605104446411133, -1.1755108833312988, -1.090511441230774, -1.0055121183395386, -0.9205126166343689, -0.8355131149291992, -0.7505135536193848, -0.6655141115188599, -0.5805145502090454, -0.49551504850387573, -0.41051554679870605, -0.3255160450935364, -0.2405165433883667, -0.15551702678203583, -0.07051751017570496, 0.014481991529464722, 0.0994814932346344, 0.18448102474212646, 0.26948052644729614, 0.3544800281524658, 0.4394795298576355, 0.5244790315628052, 0.6094785928726196, 0.6944780349731445, 0.779477596282959, 0.8644770979881287, 0.9494765996932983, 1.0344760417938232, 1.1194756031036377, 1.2044750452041626, 1.289474606513977, 1.374474048614502, 1.4594736099243164, 1.5444731712341309, 1.6294726133346558, 1.7144721746444702]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 0.0, 9.0, 6.0, 16.0, 10.0, 14.0, 16.0, 23.0, 26.0, 23.0, 34.0, 29.0, 31.0, 28.0, 43.0, 33.0, 49.0, 40.0, 34.0, 47.0, 44.0, 27.0, 40.0, 37.0, 44.0, 38.0, 40.0, 19.0, 29.0, 23.0, 18.0, 25.0, 11.0, 14.0, 17.0, 12.0, 8.0, 10.0, 8.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3053736686706543, -1.2651443481445312, -1.2249149084091187, -1.1846855878829956, -1.1444562673568726, -1.10422682762146, -1.063997507095337, -1.0237681865692139, -0.9835387468338013, -0.9433093667030334, -0.9030800461769104, -0.8628506660461426, -0.8226212859153748, -0.7823919057846069, -0.7421625852584839, -0.7019332051277161, -0.661703884601593, -0.6214745044708252, -0.5812451839447021, -0.5410158038139343, -0.5007864236831665, -0.46055707335472107, -0.42032772302627563, -0.3800983428955078, -0.3398689925670624, -0.29963964223861694, -0.2594102621078491, -0.2191809117794037, -0.17895154654979706, -0.13872218132019043, -0.098492830991745, -0.05826345086097717, -0.01803410053253174, 0.02219526097178459, 0.06242462247610092, 0.10265398025512695, 0.14288334548473358, 0.1831127107143402, 0.22334206104278564, 0.26357144117355347, 0.3038007915019989, 0.34403014183044434, 0.38425952196121216, 0.4244888722896576, 0.464718222618103, 0.5049476027488708, 0.5451769828796387, 0.5854063034057617, 0.6256356835365295, 0.6658650636672974, 0.7060943841934204, 0.7463237643241882, 0.786553144454956, 0.8267824649810791, 0.8670118451118469, 0.9072412252426147, 0.9474705457687378, 0.9876999258995056, 1.0279293060302734, 1.0681586265563965, 1.1083879470825195, 1.1486173868179321, 1.1888467073440552, 1.2290761470794678, 1.2693054676055908]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 8.0, 21.0, 27.0, 49.0, 59.0, 106.0, 149.0, 206.0, 324.0, 496.0, 934.0, 1834.0, 3876.0, 8474.0, 21606.0, 67148.0, 241870.0, 428299.0, 188699.0, 52147.0, 17692.0, 7428.0, 3289.0, 1627.0, 856.0, 465.0, 318.0, 165.0, 134.0, 75.0, 51.0, 41.0, 30.0, 19.0, 11.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.5791015625, -0.5644035339355469, -0.5497055053710938, -0.5350074768066406, -0.5203094482421875, -0.5056114196777344, -0.49091339111328125, -0.4762153625488281, -0.461517333984375, -0.4468193054199219, -0.43212127685546875, -0.4174232482910156, -0.4027252197265625, -0.3880271911621094, -0.37332916259765625, -0.3586311340332031, -0.34393310546875, -0.3292350769042969, -0.31453704833984375, -0.2998390197753906, -0.2851409912109375, -0.2704429626464844, -0.25574493408203125, -0.24104690551757812, -0.226348876953125, -0.21165084838867188, -0.19695281982421875, -0.18225479125976562, -0.1675567626953125, -0.15285873413085938, -0.13816070556640625, -0.12346267700195312, -0.1087646484375, -0.09406661987304688, -0.07936859130859375, -0.06467056274414062, -0.0499725341796875, -0.035274505615234375, -0.02057647705078125, -0.005878448486328125, 0.008819580078125, 0.023517608642578125, 0.03821563720703125, 0.052913665771484375, 0.0676116943359375, 0.08230972290039062, 0.09700775146484375, 0.11170578002929688, 0.12640380859375, 0.14110183715820312, 0.15579986572265625, 0.17049789428710938, 0.1851959228515625, 0.19989395141601562, 0.21459197998046875, 0.22929000854492188, 0.243988037109375, 0.2586860656738281, 0.27338409423828125, 0.2880821228027344, 0.3027801513671875, 0.3174781799316406, 0.33217620849609375, 0.3468742370605469, 0.361572265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 10.0, 10.0, 11.0, 10.0, 7.0, 18.0, 12.0, 24.0, 23.0, 23.0, 23.0, 23.0, 20.0, 24.0, 39.0, 38.0, 44.0, 38.0, 40.0, 35.0, 32.0, 42.0, 44.0, 33.0, 34.0, 34.0, 35.0, 26.0, 32.0, 37.0, 18.0, 26.0, 14.0, 28.0, 16.0, 22.0, 6.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2308349609375, -0.2233562469482422, -0.21587753295898438, -0.20839881896972656, -0.20092010498046875, -0.19344139099121094, -0.18596267700195312, -0.1784839630126953, -0.1710052490234375, -0.1635265350341797, -0.15604782104492188, -0.14856910705566406, -0.14109039306640625, -0.13361167907714844, -0.12613296508789062, -0.11865425109863281, -0.111175537109375, -0.10369682312011719, -0.09621810913085938, -0.08873939514160156, -0.08126068115234375, -0.07378196716308594, -0.06630325317382812, -0.05882453918457031, -0.0513458251953125, -0.04386711120605469, -0.036388397216796875, -0.028909683227539062, -0.02143096923828125, -0.013952255249023438, -0.006473541259765625, 0.0010051727294921875, 0.00848388671875, 0.015962600708007812, 0.023441314697265625, 0.030920028686523438, 0.03839874267578125, 0.04587745666503906, 0.053356170654296875, 0.06083488464355469, 0.0683135986328125, 0.07579231262207031, 0.08327102661132812, 0.09074974060058594, 0.09822845458984375, 0.10570716857910156, 0.11318588256835938, 0.12066459655761719, 0.128143310546875, 0.1356220245361328, 0.14310073852539062, 0.15057945251464844, 0.15805816650390625, 0.16553688049316406, 0.17301559448242188, 0.1804943084716797, 0.1879730224609375, 0.1954517364501953, 0.20293045043945312, 0.21040916442871094, 0.21788787841796875, 0.22536659240722656, 0.23284530639648438, 0.2403240203857422, 0.247802734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 15.0, 9.0, 16.0, 14.0, 35.0, 56.0, 75.0, 125.0, 250.0, 423.0, 683.0, 1268.0, 2459.0, 4833.0, 10712.0, 28981.0, 107107.0, 416693.0, 348623.0, 83968.0, 24001.0, 9123.0, 4186.0, 2118.0, 1158.0, 640.0, 348.0, 231.0, 123.0, 84.0, 59.0, 38.0, 31.0, 17.0, 22.0, 11.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62890625, -0.6108932495117188, -0.5928802490234375, -0.5748672485351562, -0.556854248046875, -0.5388412475585938, -0.5208282470703125, -0.5028152465820312, -0.48480224609375, -0.46678924560546875, -0.4487762451171875, -0.43076324462890625, -0.412750244140625, -0.39473724365234375, -0.3767242431640625, -0.35871124267578125, -0.3406982421875, -0.32268524169921875, -0.3046722412109375, -0.28665924072265625, -0.268646240234375, -0.25063323974609375, -0.2326202392578125, -0.21460723876953125, -0.19659423828125, -0.17858123779296875, -0.1605682373046875, -0.14255523681640625, -0.124542236328125, -0.10652923583984375, -0.0885162353515625, -0.07050323486328125, -0.052490234375, -0.03447723388671875, -0.0164642333984375, 0.00154876708984375, 0.019561767578125, 0.03757476806640625, 0.0555877685546875, 0.07360076904296875, 0.09161376953125, 0.10962677001953125, 0.1276397705078125, 0.14565277099609375, 0.163665771484375, 0.18167877197265625, 0.1996917724609375, 0.21770477294921875, 0.2357177734375, 0.25373077392578125, 0.2717437744140625, 0.28975677490234375, 0.307769775390625, 0.32578277587890625, 0.3437957763671875, 0.36180877685546875, 0.37982177734375, 0.39783477783203125, 0.4158477783203125, 0.43386077880859375, 0.451873779296875, 0.46988677978515625, 0.4878997802734375, 0.5059127807617188, 0.52392578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 12.0, 28.0, 20.0, 28.0, 26.0, 25.0, 34.0, 44.0, 41.0, 52.0, 50.0, 57.0, 47.0, 59.0, 49.0, 54.0, 38.0, 42.0, 42.0, 39.0, 34.0, 28.0, 32.0, 27.0, 18.0, 16.0, 8.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0419921875, -1.012664794921875, -0.98333740234375, -0.954010009765625, -0.9246826171875, -0.895355224609375, -0.86602783203125, -0.836700439453125, -0.807373046875, -0.778045654296875, -0.74871826171875, -0.719390869140625, -0.6900634765625, -0.660736083984375, -0.63140869140625, -0.602081298828125, -0.57275390625, -0.543426513671875, -0.51409912109375, -0.484771728515625, -0.4554443359375, -0.426116943359375, -0.39678955078125, -0.367462158203125, -0.338134765625, -0.308807373046875, -0.27947998046875, -0.250152587890625, -0.2208251953125, -0.191497802734375, -0.16217041015625, -0.132843017578125, -0.103515625, -0.074188232421875, -0.04486083984375, -0.015533447265625, 0.0137939453125, 0.043121337890625, 0.07244873046875, 0.101776123046875, 0.131103515625, 0.160430908203125, 0.18975830078125, 0.219085693359375, 0.2484130859375, 0.277740478515625, 0.30706787109375, 0.336395263671875, 0.36572265625, 0.395050048828125, 0.42437744140625, 0.453704833984375, 0.4830322265625, 0.512359619140625, 0.54168701171875, 0.571014404296875, 0.600341796875, 0.629669189453125, 0.65899658203125, 0.688323974609375, 0.7176513671875, 0.746978759765625, 0.77630615234375, 0.805633544921875, 0.8349609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 13.0, 7.0, 9.0, 22.0, 33.0, 46.0, 75.0, 105.0, 174.0, 306.0, 484.0, 884.0, 1636.0, 3017.0, 6218.0, 13556.0, 34665.0, 112850.0, 357830.0, 348662.0, 108576.0, 33529.0, 13066.0, 6021.0, 2993.0, 1626.0, 889.0, 510.0, 279.0, 159.0, 119.0, 85.0, 36.0, 24.0, 18.0, 11.0, 11.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16064453125, -0.1552867889404297, -0.14992904663085938, -0.14457130432128906, -0.13921356201171875, -0.13385581970214844, -0.12849807739257812, -0.12314033508300781, -0.1177825927734375, -0.11242485046386719, -0.10706710815429688, -0.10170936584472656, -0.09635162353515625, -0.09099388122558594, -0.08563613891601562, -0.08027839660644531, -0.074920654296875, -0.06956291198730469, -0.06420516967773438, -0.05884742736816406, -0.05348968505859375, -0.04813194274902344, -0.042774200439453125, -0.03741645812988281, -0.0320587158203125, -0.026700973510742188, -0.021343231201171875, -0.015985488891601562, -0.01062774658203125, -0.0052700042724609375, 8.7738037109375e-05, 0.0054454803466796875, 0.01080322265625, 0.016160964965820312, 0.021518707275390625, 0.026876449584960938, 0.03223419189453125, 0.03759193420410156, 0.042949676513671875, 0.04830741882324219, 0.0536651611328125, 0.05902290344238281, 0.06438064575195312, 0.06973838806152344, 0.07509613037109375, 0.08045387268066406, 0.08581161499023438, 0.09116935729980469, 0.096527099609375, 0.10188484191894531, 0.10724258422851562, 0.11260032653808594, 0.11795806884765625, 0.12331581115722656, 0.12867355346679688, 0.1340312957763672, 0.1393890380859375, 0.1447467803955078, 0.15010452270507812, 0.15546226501464844, 0.16082000732421875, 0.16617774963378906, 0.17153549194335938, 0.1768932342529297, 0.1822509765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 9.0, 11.0, 12.0, 18.0, 30.0, 31.0, 57.0, 85.0, 93.0, 110.0, 120.0, 113.0, 68.0, 56.0, 49.0, 26.0, 22.0, 13.0, 11.0, 8.0, 6.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-05, -4.1338615119457245e-05, -3.976188600063324e-05, -3.8185156881809235e-05, -3.660842776298523e-05, -3.5031698644161224e-05, -3.345496952533722e-05, -3.1878240406513214e-05, -3.030151128768921e-05, -2.8724782168865204e-05, -2.71480530500412e-05, -2.5571323931217194e-05, -2.399459481239319e-05, -2.2417865693569183e-05, -2.0841136574745178e-05, -1.9264407455921173e-05, -1.7687678337097168e-05, -1.6110949218273163e-05, -1.4534220099449158e-05, -1.2957490980625153e-05, -1.1380761861801147e-05, -9.804032742977142e-06, -8.227303624153137e-06, -6.650574505329132e-06, -5.073845386505127e-06, -3.497116267681122e-06, -1.9203871488571167e-06, -3.4365803003311157e-07, 1.2330710887908936e-06, 2.8098002076148987e-06, 4.386529326438904e-06, 5.963258445262909e-06, 7.539987564086914e-06, 9.11671668291092e-06, 1.0693445801734924e-05, 1.227017492055893e-05, 1.3846904039382935e-05, 1.542363315820694e-05, 1.7000362277030945e-05, 1.857709139585495e-05, 2.0153820514678955e-05, 2.173054963350296e-05, 2.3307278752326965e-05, 2.488400787115097e-05, 2.6460736989974976e-05, 2.803746610879898e-05, 2.9614195227622986e-05, 3.119092434644699e-05, 3.2767653465270996e-05, 3.4344382584095e-05, 3.5921111702919006e-05, 3.749784082174301e-05, 3.9074569940567017e-05, 4.065129905939102e-05, 4.222802817821503e-05, 4.380475729703903e-05, 4.538148641586304e-05, 4.695821553468704e-05, 4.853494465351105e-05, 5.011167377233505e-05, 5.168840289115906e-05, 5.326513200998306e-05, 5.484186112880707e-05, 5.641859024763107e-05, 5.799531936645508e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 5.0, 5.0, 7.0, 8.0, 23.0, 28.0, 28.0, 59.0, 85.0, 133.0, 264.0, 437.0, 652.0, 1131.0, 2037.0, 3816.0, 7843.0, 17406.0, 42965.0, 114867.0, 262731.0, 314471.0, 168278.0, 64287.0, 24749.0, 10900.0, 5120.0, 2635.0, 1491.0, 823.0, 472.0, 296.0, 169.0, 121.0, 66.0, 49.0, 34.0, 22.0, 9.0, 6.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14410018920898438, -0.14000701904296875, -0.13591384887695312, -0.1318206787109375, -0.12772750854492188, -0.12363433837890625, -0.11954116821289062, -0.115447998046875, -0.11135482788085938, -0.10726165771484375, -0.10316848754882812, -0.0990753173828125, -0.09498214721679688, -0.09088897705078125, -0.08679580688476562, -0.08270263671875, -0.07860946655273438, -0.07451629638671875, -0.07042312622070312, -0.0663299560546875, -0.062236785888671875, -0.05814361572265625, -0.054050445556640625, -0.049957275390625, -0.045864105224609375, -0.04177093505859375, -0.037677764892578125, -0.0335845947265625, -0.029491424560546875, -0.02539825439453125, -0.021305084228515625, -0.0172119140625, -0.013118743896484375, -0.00902557373046875, -0.004932403564453125, -0.0008392333984375, 0.003253936767578125, 0.00734710693359375, 0.011440277099609375, 0.015533447265625, 0.019626617431640625, 0.02371978759765625, 0.027812957763671875, 0.0319061279296875, 0.035999298095703125, 0.04009246826171875, 0.044185638427734375, 0.04827880859375, 0.052371978759765625, 0.05646514892578125, 0.060558319091796875, 0.0646514892578125, 0.06874465942382812, 0.07283782958984375, 0.07693099975585938, 0.081024169921875, 0.08511734008789062, 0.08921051025390625, 0.09330368041992188, 0.0973968505859375, 0.10149002075195312, 0.10558319091796875, 0.10967636108398438, 0.11376953125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 7.0, 19.0, 14.0, 16.0, 23.0, 21.0, 34.0, 43.0, 50.0, 64.0, 62.0, 86.0, 76.0, 73.0, 70.0, 62.0, 55.0, 54.0, 27.0, 29.0, 24.0, 7.0, 16.0, 10.0, 10.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.12979698181152344, -0.12495040893554688, -0.12010383605957031, -0.11525726318359375, -0.11041069030761719, -0.10556411743164062, -0.10071754455566406, -0.0958709716796875, -0.09102439880371094, -0.08617782592773438, -0.08133125305175781, -0.07648468017578125, -0.07163810729980469, -0.06679153442382812, -0.06194496154785156, -0.057098388671875, -0.05225181579589844, -0.047405242919921875, -0.04255867004394531, -0.03771209716796875, -0.03286552429199219, -0.028018951416015625, -0.023172378540039062, -0.0183258056640625, -0.013479232788085938, -0.008632659912109375, -0.0037860870361328125, 0.00106048583984375, 0.0059070587158203125, 0.010753631591796875, 0.015600204467773438, 0.02044677734375, 0.025293350219726562, 0.030139923095703125, 0.03498649597167969, 0.03983306884765625, 0.04467964172363281, 0.049526214599609375, 0.05437278747558594, 0.0592193603515625, 0.06406593322753906, 0.06891250610351562, 0.07375907897949219, 0.07860565185546875, 0.08345222473144531, 0.08829879760742188, 0.09314537048339844, 0.097991943359375, 0.10283851623535156, 0.10768508911132812, 0.11253166198730469, 0.11737823486328125, 0.12222480773925781, 0.12707138061523438, 0.13191795349121094, 0.1367645263671875, 0.14161109924316406, 0.14645767211914062, 0.1513042449951172, 0.15615081787109375, 0.1609973907470703, 0.16584396362304688, 0.17069053649902344, 0.175537109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 13.0, 39.0, 52.0, 85.0, 96.0, 162.0, 168.0, 136.0, 96.0, 46.0, 37.0, 7.0, 14.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8907663822174072, -2.803969621658325, -2.717172861099243, -2.630376100540161, -2.543579339981079, -2.456782579421997, -2.369985580444336, -2.283188819885254, -2.196392059326172, -2.10959529876709, -2.022798538208008, -1.9360017776489258, -1.8492050170898438, -1.7624082565307617, -1.6756113767623901, -1.588814616203308, -1.5020179748535156, -1.4152212142944336, -1.3284244537353516, -1.2416276931762695, -1.1548309326171875, -1.0680341720581055, -0.9812372922897339, -0.8944405317306519, -0.8076437711715698, -0.7208470106124878, -0.6340502500534058, -0.547253429889679, -0.4604566693305969, -0.3736599087715149, -0.2868630886077881, -0.20006632804870605, -0.11326932907104492, -0.026472553610801697, 0.06032422184944153, 0.14712101221084595, 0.23391777276992798, 0.32071453332901, 0.4075113534927368, 0.49430811405181885, 0.5811048746109009, 0.6679016351699829, 0.7546983957290649, 0.8414952158927917, 0.9282919764518738, 1.0150887966156006, 1.1018855571746826, 1.1886823177337646, 1.2754790782928467, 1.3622758388519287, 1.4490725994110107, 1.5358693599700928, 1.6226661205291748, 1.7094628810882568, 1.7962597608566284, 1.8830565214157104, 1.9698532819747925, 2.056650161743164, 2.143446922302246, 2.230243682861328, 2.31704044342041, 2.403837203979492, 2.490633964538574, 2.5774307250976562, 2.6642274856567383]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 8.0, 8.0, 13.0, 13.0, 13.0, 16.0, 14.0, 22.0, 36.0, 27.0, 29.0, 28.0, 34.0, 44.0, 55.0, 40.0, 43.0, 50.0, 43.0, 50.0, 43.0, 31.0, 41.0, 42.0, 33.0, 28.0, 28.0, 25.0, 24.0, 20.0, 20.0, 11.0, 9.0, 22.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.101801872253418, -2.039381265640259, -1.9769608974456787, -1.914540410041809, -1.8521199226379395, -1.7896993160247803, -1.7272788286209106, -1.664858341217041, -1.6024378538131714, -1.5400173664093018, -1.4775968790054321, -1.4151763916015625, -1.3527557849884033, -1.2903354167938232, -1.227914810180664, -1.1654943227767944, -1.1030738353729248, -1.0406533479690552, -0.9782328605651855, -0.9158123135566711, -0.8533918261528015, -0.7909713387489319, -0.7285507917404175, -0.6661303043365479, -0.6037098169326782, -0.5412893295288086, -0.4788688123226166, -0.41644829511642456, -0.35402780771255493, -0.2916073203086853, -0.2291868031024933, -0.16676628589630127, -0.10434579849243164, -0.04192529618740082, 0.020495206117630005, 0.08291570842266083, 0.14533621072769165, 0.20775669813156128, 0.2701772153377533, 0.3325977325439453, 0.39501821994781494, 0.45743870735168457, 0.5198591947555542, 0.5822797417640686, 0.6447002291679382, 0.7071207165718079, 0.7695412635803223, 0.8319617509841919, 0.8943822383880615, 0.9568027257919312, 1.0192232131958008, 1.0816437005996704, 1.14406418800354, 1.2064847946166992, 1.2689052820205688, 1.3313257694244385, 1.393746256828308, 1.4561667442321777, 1.5185872316360474, 1.581007719039917, 1.6434283256530762, 1.7058486938476562, 1.7682693004608154, 1.830689787864685, 1.8931102752685547]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 19.0, 22.0, 32.0, 58.0, 79.0, 131.0, 200.0, 288.0, 450.0, 672.0, 1216.0, 2035.0, 3778.0, 7158.0, 15979.0, 41714.0, 119178.0, 321567.0, 745603.0, 1165876.0, 972402.0, 492112.0, 189583.0, 68076.0, 24604.0, 10090.0, 4762.0, 2587.0, 1511.0, 871.0, 516.0, 350.0, 217.0, 175.0, 106.0, 66.0, 57.0, 33.0, 35.0, 15.0, 12.0, 8.0, 5.0, 6.0, 3.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2281494140625, -0.22072219848632812, -0.21329498291015625, -0.20586776733398438, -0.1984405517578125, -0.19101333618164062, -0.18358612060546875, -0.17615890502929688, -0.168731689453125, -0.16130447387695312, -0.15387725830078125, -0.14645004272460938, -0.1390228271484375, -0.13159561157226562, -0.12416839599609375, -0.11674118041992188, -0.10931396484375, -0.10188674926757812, -0.09445953369140625, -0.08703231811523438, -0.0796051025390625, -0.07217788696289062, -0.06475067138671875, -0.057323455810546875, -0.049896240234375, -0.042469024658203125, -0.03504180908203125, -0.027614593505859375, -0.0201873779296875, -0.012760162353515625, -0.00533294677734375, 0.002094268798828125, 0.009521484375, 0.016948699951171875, 0.02437591552734375, 0.031803131103515625, 0.0392303466796875, 0.046657562255859375, 0.05408477783203125, 0.061511993408203125, 0.068939208984375, 0.07636642456054688, 0.08379364013671875, 0.09122085571289062, 0.0986480712890625, 0.10607528686523438, 0.11350250244140625, 0.12092971801757812, 0.12835693359375, 0.13578414916992188, 0.14321136474609375, 0.15063858032226562, 0.1580657958984375, 0.16549301147460938, 0.17292022705078125, 0.18034744262695312, 0.187774658203125, 0.19520187377929688, 0.20262908935546875, 0.21005630493164062, 0.2174835205078125, 0.22491073608398438, 0.23233795166015625, 0.23976516723632812, 0.2471923828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 10.0, 17.0, 21.0, 12.0, 23.0, 18.0, 35.0, 29.0, 31.0, 31.0, 40.0, 40.0, 45.0, 40.0, 37.0, 55.0, 25.0, 45.0, 49.0, 49.0, 39.0, 42.0, 41.0, 36.0, 47.0, 18.0, 12.0, 17.0, 7.0, 13.0, 10.0, 10.0, 6.0, 8.0, 7.0, 7.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.2987060546875, -0.2890625, -0.2794189453125, -0.269775390625, -0.2601318359375, -0.25048828125, -0.2408447265625, -0.231201171875, -0.2215576171875, -0.2119140625, -0.2022705078125, -0.192626953125, -0.1829833984375, -0.17333984375, -0.1636962890625, -0.154052734375, -0.1444091796875, -0.134765625, -0.1251220703125, -0.115478515625, -0.1058349609375, -0.09619140625, -0.0865478515625, -0.076904296875, -0.0672607421875, -0.0576171875, -0.0479736328125, -0.038330078125, -0.0286865234375, -0.01904296875, -0.0093994140625, 0.000244140625, 0.0098876953125, 0.01953125, 0.0291748046875, 0.038818359375, 0.0484619140625, 0.05810546875, 0.0677490234375, 0.077392578125, 0.0870361328125, 0.0966796875, 0.1063232421875, 0.115966796875, 0.1256103515625, 0.13525390625, 0.1448974609375, 0.154541015625, 0.1641845703125, 0.173828125, 0.1834716796875, 0.193115234375, 0.2027587890625, 0.21240234375, 0.2220458984375, 0.231689453125, 0.2413330078125, 0.2509765625, 0.2606201171875, 0.270263671875, 0.2799072265625, 0.28955078125, 0.2991943359375, 0.308837890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 9.0, 2.0, 11.0, 7.0, 20.0, 35.0, 46.0, 86.0, 125.0, 238.0, 469.0, 839.0, 1710.0, 3973.0, 11087.0, 39547.0, 182887.0, 1474135.0, 2127416.0, 274759.0, 53432.0, 14321.0, 4944.0, 1977.0, 984.0, 517.0, 279.0, 152.0, 113.0, 54.0, 40.0, 33.0, 10.0, 13.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.484375, -0.46773529052734375, -0.4510955810546875, -0.43445587158203125, -0.417816162109375, -0.40117645263671875, -0.3845367431640625, -0.36789703369140625, -0.35125732421875, -0.33461761474609375, -0.3179779052734375, -0.30133819580078125, -0.284698486328125, -0.26805877685546875, -0.2514190673828125, -0.23477935791015625, -0.2181396484375, -0.20149993896484375, -0.1848602294921875, -0.16822052001953125, -0.151580810546875, -0.13494110107421875, -0.1183013916015625, -0.10166168212890625, -0.08502197265625, -0.06838226318359375, -0.0517425537109375, -0.03510284423828125, -0.018463134765625, -0.00182342529296875, 0.0148162841796875, 0.03145599365234375, 0.048095703125, 0.06473541259765625, 0.0813751220703125, 0.09801483154296875, 0.114654541015625, 0.13129425048828125, 0.1479339599609375, 0.16457366943359375, 0.18121337890625, 0.19785308837890625, 0.2144927978515625, 0.23113250732421875, 0.247772216796875, 0.26441192626953125, 0.2810516357421875, 0.29769134521484375, 0.3143310546875, 0.33097076416015625, 0.3476104736328125, 0.36425018310546875, 0.380889892578125, 0.39752960205078125, 0.4141693115234375, 0.43080902099609375, 0.44744873046875, 0.46408843994140625, 0.4807281494140625, 0.49736785888671875, 0.514007568359375, 0.5306472778320312, 0.5472869873046875, 0.5639266967773438, 0.58056640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 16.0, 20.0, 14.0, 33.0, 49.0, 74.0, 78.0, 123.0, 190.0, 280.0, 442.0, 548.0, 583.0, 514.0, 393.0, 226.0, 129.0, 75.0, 75.0, 54.0, 35.0, 25.0, 22.0, 19.0, 18.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5284042358398438, -0.5109100341796875, -0.49341583251953125, -0.475921630859375, -0.45842742919921875, -0.4409332275390625, -0.42343902587890625, -0.40594482421875, -0.38845062255859375, -0.3709564208984375, -0.35346221923828125, -0.335968017578125, -0.31847381591796875, -0.3009796142578125, -0.28348541259765625, -0.2659912109375, -0.24849700927734375, -0.2310028076171875, -0.21350860595703125, -0.196014404296875, -0.17852020263671875, -0.1610260009765625, -0.14353179931640625, -0.12603759765625, -0.10854339599609375, -0.0910491943359375, -0.07355499267578125, -0.056060791015625, -0.03856658935546875, -0.0210723876953125, -0.00357818603515625, 0.013916015625, 0.03141021728515625, 0.0489044189453125, 0.06639862060546875, 0.083892822265625, 0.10138702392578125, 0.1188812255859375, 0.13637542724609375, 0.15386962890625, 0.17136383056640625, 0.1888580322265625, 0.20635223388671875, 0.223846435546875, 0.24134063720703125, 0.2588348388671875, 0.27632904052734375, 0.2938232421875, 0.31131744384765625, 0.3288116455078125, 0.34630584716796875, 0.363800048828125, 0.38129425048828125, 0.3987884521484375, 0.41628265380859375, 0.43377685546875, 0.45127105712890625, 0.4687652587890625, 0.48625946044921875, 0.503753662109375, 0.5212478637695312, 0.5387420654296875, 0.5562362670898438, 0.57373046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 19.0, 56.0, 124.0, 225.0, 291.0, 177.0, 64.0, 20.0, 11.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624755382537842, -5.4380927085876465, -5.251430034637451, -5.064766883850098, -4.878104209899902, -4.691441535949707, -4.504778861999512, -4.318116188049316, -4.131453514099121, -3.944790840148926, -3.7581279277801514, -3.571465253829956, -3.3848023414611816, -3.1981396675109863, -3.011476993560791, -2.8248143196105957, -2.638151168823242, -2.451488494873047, -2.2648255825042725, -2.078162908554077, -1.8915001153945923, -1.7048373222351074, -1.518174648284912, -1.3315118551254272, -1.1448490619659424, -0.9581862688064575, -0.7715235352516174, -0.5848608016967773, -0.3981980085372925, -0.21153521537780762, -0.024872541427612305, 0.16179025173187256, 0.3484525680541992, 0.5351153612136841, 0.7217780947685242, 0.9084408283233643, 1.0951036214828491, 1.281766414642334, 1.4684290885925293, 1.6550918817520142, 1.841754674911499, 2.0284173488616943, 2.2150802612304688, 2.401742935180664, 2.5884056091308594, 2.775068521499634, 2.961731195449829, 3.1483941078186035, 3.335056781768799, 3.521719455718994, 3.7083823680877686, 3.895045042037964, 4.081707954406738, 4.268370628356934, 4.455033302307129, 4.641695976257324, 4.8283586502075195, 5.015021324157715, 5.20168399810791, 5.3883466720581055, 5.575009822845459, 5.761672496795654, 5.94833517074585, 6.134997844696045, 6.321660995483398]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 9.0, 11.0, 9.0, 14.0, 7.0, 13.0, 17.0, 20.0, 22.0, 28.0, 32.0, 34.0, 32.0, 42.0, 36.0, 34.0, 37.0, 45.0, 43.0, 59.0, 42.0, 45.0, 38.0, 45.0, 37.0, 31.0, 32.0, 25.0, 27.0, 16.0, 17.0, 18.0, 11.0, 12.0, 14.0, 13.0, 8.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6541695594787598, -1.6049076318740845, -1.5556457042694092, -1.5063837766647339, -1.4571218490600586, -1.4078598022460938, -1.3585978746414185, -1.3093359470367432, -1.2600740194320679, -1.2108120918273926, -1.1615501642227173, -1.112288236618042, -1.0630261898040771, -1.0137642621994019, -0.9645023345947266, -0.9152404069900513, -0.865978479385376, -0.8167165517807007, -0.7674546241760254, -0.7181926369667053, -0.66893070936203, -0.6196687817573547, -0.5704067945480347, -0.5211448669433594, -0.4718829393386841, -0.4226210117340088, -0.3733590543270111, -0.3240970969200134, -0.27483516931533813, -0.22557322680950165, -0.17631128430366516, -0.12704932689666748, -0.07778739929199219, -0.0285254567861557, 0.020736485719680786, 0.06999842822551727, 0.11926037073135376, 0.16852231323719025, 0.21778425574302673, 0.2670462131500244, 0.3163081407546997, 0.365570068359375, 0.4148320257663727, 0.46409398317337036, 0.5133559107780457, 0.562617838382721, 0.611879825592041, 0.6611417531967163, 0.7104036808013916, 0.7596656084060669, 0.8089275360107422, 0.8581895232200623, 0.9074514508247375, 0.9567133784294128, 1.005975365638733, 1.0552372932434082, 1.1044992208480835, 1.1537611484527588, 1.203023076057434, 1.2522850036621094, 1.3015470504760742, 1.3508089780807495, 1.4000709056854248, 1.4493328332901, 1.4985947608947754]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 8.0, 5.0, 13.0, 12.0, 27.0, 36.0, 35.0, 62.0, 85.0, 145.0, 223.0, 346.0, 549.0, 1013.0, 1905.0, 3557.0, 7245.0, 15749.0, 40318.0, 132443.0, 344294.0, 321166.0, 115194.0, 36071.0, 13960.0, 6578.0, 3307.0, 1717.0, 953.0, 514.0, 323.0, 221.0, 151.0, 100.0, 57.0, 54.0, 33.0, 22.0, 19.0, 11.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5078125, -0.49285125732421875, -0.4778900146484375, -0.46292877197265625, -0.447967529296875, -0.43300628662109375, -0.4180450439453125, -0.40308380126953125, -0.38812255859375, -0.37316131591796875, -0.3582000732421875, -0.34323883056640625, -0.328277587890625, -0.31331634521484375, -0.2983551025390625, -0.28339385986328125, -0.2684326171875, -0.25347137451171875, -0.2385101318359375, -0.22354888916015625, -0.208587646484375, -0.19362640380859375, -0.1786651611328125, -0.16370391845703125, -0.14874267578125, -0.13378143310546875, -0.1188201904296875, -0.10385894775390625, -0.088897705078125, -0.07393646240234375, -0.0589752197265625, -0.04401397705078125, -0.029052734375, -0.01409149169921875, 0.0008697509765625, 0.01583099365234375, 0.030792236328125, 0.04575347900390625, 0.0607147216796875, 0.07567596435546875, 0.09063720703125, 0.10559844970703125, 0.1205596923828125, 0.13552093505859375, 0.150482177734375, 0.16544342041015625, 0.1804046630859375, 0.19536590576171875, 0.2103271484375, 0.22528839111328125, 0.2402496337890625, 0.25521087646484375, 0.270172119140625, 0.28513336181640625, 0.3000946044921875, 0.31505584716796875, 0.33001708984375, 0.34497833251953125, 0.3599395751953125, 0.37490081787109375, 0.389862060546875, 0.40482330322265625, 0.4197845458984375, 0.43474578857421875, 0.44970703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 5.0, 6.0, 7.0, 11.0, 13.0, 20.0, 24.0, 15.0, 23.0, 24.0, 30.0, 36.0, 27.0, 32.0, 26.0, 49.0, 30.0, 42.0, 33.0, 45.0, 40.0, 36.0, 42.0, 42.0, 42.0, 29.0, 31.0, 25.0, 31.0, 18.0, 21.0, 26.0, 13.0, 17.0, 14.0, 13.0, 10.0, 9.0, 13.0, 4.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2327880859375, -0.2248516082763672, -0.21691513061523438, -0.20897865295410156, -0.20104217529296875, -0.19310569763183594, -0.18516921997070312, -0.1772327423095703, -0.1692962646484375, -0.1613597869873047, -0.15342330932617188, -0.14548683166503906, -0.13755035400390625, -0.12961387634277344, -0.12167739868164062, -0.11374092102050781, -0.105804443359375, -0.09786796569824219, -0.08993148803710938, -0.08199501037597656, -0.07405853271484375, -0.06612205505371094, -0.058185577392578125, -0.05024909973144531, -0.0423126220703125, -0.03437614440917969, -0.026439666748046875, -0.018503189086914062, -0.01056671142578125, -0.0026302337646484375, 0.005306243896484375, 0.013242721557617188, 0.02117919921875, 0.029115676879882812, 0.037052154541015625, 0.04498863220214844, 0.05292510986328125, 0.06086158752441406, 0.06879806518554688, 0.07673454284667969, 0.0846710205078125, 0.09260749816894531, 0.10054397583007812, 0.10848045349121094, 0.11641693115234375, 0.12435340881347656, 0.13228988647460938, 0.1402263641357422, 0.148162841796875, 0.1560993194580078, 0.16403579711914062, 0.17197227478027344, 0.17990875244140625, 0.18784523010253906, 0.19578170776367188, 0.2037181854248047, 0.2116546630859375, 0.2195911407470703, 0.22752761840820312, 0.23546409606933594, 0.24340057373046875, 0.25133705139160156, 0.2592735290527344, 0.2672100067138672, 0.275146484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 12.0, 8.0, 34.0, 35.0, 44.0, 88.0, 127.0, 192.0, 347.0, 633.0, 1535.0, 3511.0, 8541.0, 21370.0, 60609.0, 202455.0, 421513.0, 222104.0, 66204.0, 23109.0, 9077.0, 3753.0, 1536.0, 781.0, 355.0, 209.0, 132.0, 71.0, 51.0, 44.0, 16.0, 18.0, 11.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5523605346679688, -0.5353851318359375, -0.5184097290039062, -0.501434326171875, -0.48445892333984375, -0.4674835205078125, -0.45050811767578125, -0.43353271484375, -0.41655731201171875, -0.3995819091796875, -0.38260650634765625, -0.365631103515625, -0.34865570068359375, -0.3316802978515625, -0.31470489501953125, -0.2977294921875, -0.28075408935546875, -0.2637786865234375, -0.24680328369140625, -0.229827880859375, -0.21285247802734375, -0.1958770751953125, -0.17890167236328125, -0.16192626953125, -0.14495086669921875, -0.1279754638671875, -0.11100006103515625, -0.094024658203125, -0.07704925537109375, -0.0600738525390625, -0.04309844970703125, -0.026123046875, -0.00914764404296875, 0.0078277587890625, 0.02480316162109375, 0.041778564453125, 0.05875396728515625, 0.0757293701171875, 0.09270477294921875, 0.10968017578125, 0.12665557861328125, 0.1436309814453125, 0.16060638427734375, 0.177581787109375, 0.19455718994140625, 0.2115325927734375, 0.22850799560546875, 0.2454833984375, 0.26245880126953125, 0.2794342041015625, 0.29640960693359375, 0.313385009765625, 0.33036041259765625, 0.3473358154296875, 0.36431121826171875, 0.38128662109375, 0.39826202392578125, 0.4152374267578125, 0.43221282958984375, 0.449188232421875, 0.46616363525390625, 0.4831390380859375, 0.5001144409179688, 0.51708984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 8.0, 8.0, 8.0, 10.0, 14.0, 12.0, 21.0, 21.0, 13.0, 26.0, 28.0, 27.0, 27.0, 29.0, 43.0, 32.0, 28.0, 42.0, 38.0, 39.0, 34.0, 56.0, 37.0, 37.0, 37.0, 44.0, 38.0, 33.0, 33.0, 25.0, 16.0, 17.0, 17.0, 19.0, 14.0, 13.0, 9.0, 6.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.78369140625, -0.7600173950195312, -0.7363433837890625, -0.7126693725585938, -0.688995361328125, -0.6653213500976562, -0.6416473388671875, -0.6179733276367188, -0.59429931640625, -0.5706253051757812, -0.5469512939453125, -0.5232772827148438, -0.499603271484375, -0.47592926025390625, -0.4522552490234375, -0.42858123779296875, -0.4049072265625, -0.38123321533203125, -0.3575592041015625, -0.33388519287109375, -0.310211181640625, -0.28653717041015625, -0.2628631591796875, -0.23918914794921875, -0.21551513671875, -0.19184112548828125, -0.1681671142578125, -0.14449310302734375, -0.120819091796875, -0.09714508056640625, -0.0734710693359375, -0.04979705810546875, -0.026123046875, -0.00244903564453125, 0.0212249755859375, 0.04489898681640625, 0.068572998046875, 0.09224700927734375, 0.1159210205078125, 0.13959503173828125, 0.16326904296875, 0.18694305419921875, 0.2106170654296875, 0.23429107666015625, 0.257965087890625, 0.28163909912109375, 0.3053131103515625, 0.32898712158203125, 0.3526611328125, 0.37633514404296875, 0.4000091552734375, 0.42368316650390625, 0.447357177734375, 0.47103118896484375, 0.4947052001953125, 0.5183792114257812, 0.54205322265625, 0.5657272338867188, 0.5894012451171875, 0.6130752563476562, 0.636749267578125, 0.6604232788085938, 0.6840972900390625, 0.7077713012695312, 0.7314453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 11.0, 16.0, 22.0, 26.0, 39.0, 73.0, 124.0, 236.0, 555.0, 1132.0, 2627.0, 6199.0, 15353.0, 44747.0, 165261.0, 433400.0, 269249.0, 71674.0, 22288.0, 8721.0, 3661.0, 1649.0, 740.0, 305.0, 186.0, 99.0, 55.0, 38.0, 24.0, 9.0, 12.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1917724609375, -0.18552398681640625, -0.1792755126953125, -0.17302703857421875, -0.166778564453125, -0.16053009033203125, -0.1542816162109375, -0.14803314208984375, -0.14178466796875, -0.13553619384765625, -0.1292877197265625, -0.12303924560546875, -0.116790771484375, -0.11054229736328125, -0.1042938232421875, -0.09804534912109375, -0.091796875, -0.08554840087890625, -0.0792999267578125, -0.07305145263671875, -0.066802978515625, -0.06055450439453125, -0.0543060302734375, -0.04805755615234375, -0.04180908203125, -0.03556060791015625, -0.0293121337890625, -0.02306365966796875, -0.016815185546875, -0.01056671142578125, -0.0043182373046875, 0.00193023681640625, 0.0081787109375, 0.01442718505859375, 0.0206756591796875, 0.02692413330078125, 0.033172607421875, 0.03942108154296875, 0.0456695556640625, 0.05191802978515625, 0.05816650390625, 0.06441497802734375, 0.0706634521484375, 0.07691192626953125, 0.083160400390625, 0.08940887451171875, 0.0956573486328125, 0.10190582275390625, 0.108154296875, 0.11440277099609375, 0.1206512451171875, 0.12689971923828125, 0.133148193359375, 0.13939666748046875, 0.1456451416015625, 0.15189361572265625, 0.15814208984375, 0.16439056396484375, 0.1706390380859375, 0.17688751220703125, 0.183135986328125, 0.18938446044921875, 0.1956329345703125, 0.20188140869140625, 0.2081298828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 5.0, 1.0, 2.0, 6.0, 4.0, 8.0, 6.0, 7.0, 7.0, 20.0, 34.0, 45.0, 32.0, 80.0, 98.0, 111.0, 115.0, 115.0, 83.0, 63.0, 41.0, 33.0, 24.0, 9.0, 11.0, 7.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.924701690673828e-05, -5.734618753194809e-05, -5.54453581571579e-05, -5.3544528782367706e-05, -5.1643699407577515e-05, -4.974287003278732e-05, -4.784204065799713e-05, -4.594121128320694e-05, -4.404038190841675e-05, -4.2139552533626556e-05, -4.0238723158836365e-05, -3.833789378404617e-05, -3.643706440925598e-05, -3.453623503446579e-05, -3.26354056596756e-05, -3.0734576284885406e-05, -2.8833746910095215e-05, -2.6932917535305023e-05, -2.503208816051483e-05, -2.313125878572464e-05, -2.1230429410934448e-05, -1.9329600036144257e-05, -1.7428770661354065e-05, -1.5527941286563873e-05, -1.3627111911773682e-05, -1.172628253698349e-05, -9.825453162193298e-06, -7.924623787403107e-06, -6.023794412612915e-06, -4.122965037822723e-06, -2.2221356630325317e-06, -3.213062882423401e-07, 1.5795230865478516e-06, 3.4803524613380432e-06, 5.381181836128235e-06, 7.2820112109184265e-06, 9.182840585708618e-06, 1.108366996049881e-05, 1.2984499335289001e-05, 1.4885328710079193e-05, 1.6786158084869385e-05, 1.8686987459659576e-05, 2.0587816834449768e-05, 2.248864620923996e-05, 2.438947558403015e-05, 2.6290304958820343e-05, 2.8191134333610535e-05, 3.0091963708400726e-05, 3.199279308319092e-05, 3.389362245798111e-05, 3.57944518327713e-05, 3.769528120756149e-05, 3.9596110582351685e-05, 4.1496939957141876e-05, 4.339776933193207e-05, 4.529859870672226e-05, 4.719942808151245e-05, 4.910025745630264e-05, 5.1001086831092834e-05, 5.2901916205883026e-05, 5.480274558067322e-05, 5.670357495546341e-05, 5.86044043302536e-05, 6.050523370504379e-05, 6.240606307983398e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 13.0, 17.0, 26.0, 51.0, 57.0, 103.0, 140.0, 264.0, 467.0, 763.0, 1643.0, 3326.0, 7945.0, 19696.0, 55036.0, 163256.0, 339928.0, 282972.0, 110689.0, 37352.0, 13930.0, 5585.0, 2461.0, 1182.0, 655.0, 347.0, 215.0, 130.0, 107.0, 63.0, 40.0, 29.0, 15.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.133544921875, -0.12856483459472656, -0.12358474731445312, -0.11860466003417969, -0.11362457275390625, -0.10864448547363281, -0.10366439819335938, -0.09868431091308594, -0.0937042236328125, -0.08872413635253906, -0.08374404907226562, -0.07876396179199219, -0.07378387451171875, -0.06880378723144531, -0.06382369995117188, -0.05884361267089844, -0.053863525390625, -0.04888343811035156, -0.043903350830078125, -0.03892326354980469, -0.03394317626953125, -0.028963088989257812, -0.023983001708984375, -0.019002914428710938, -0.0140228271484375, -0.009042739868164062, -0.004062652587890625, 0.0009174346923828125, 0.00589752197265625, 0.010877609252929688, 0.015857696533203125, 0.020837783813476562, 0.02581787109375, 0.030797958374023438, 0.035778045654296875, 0.04075813293457031, 0.04573822021484375, 0.05071830749511719, 0.055698394775390625, 0.06067848205566406, 0.0656585693359375, 0.07063865661621094, 0.07561874389648438, 0.08059883117675781, 0.08557891845703125, 0.09055900573730469, 0.09553909301757812, 0.10051918029785156, 0.105499267578125, 0.11047935485839844, 0.11545944213867188, 0.12043952941894531, 0.12541961669921875, 0.1303997039794922, 0.13537979125976562, 0.14035987854003906, 0.1453399658203125, 0.15032005310058594, 0.15530014038085938, 0.1602802276611328, 0.16526031494140625, 0.1702404022216797, 0.17522048950195312, 0.18020057678222656, 0.1851806640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 12.0, 10.0, 21.0, 13.0, 24.0, 23.0, 28.0, 42.0, 49.0, 65.0, 62.0, 66.0, 60.0, 40.0, 57.0, 67.0, 46.0, 50.0, 41.0, 32.0, 31.0, 28.0, 21.0, 18.0, 16.0, 15.0, 9.0, 11.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13525390625, -0.1306133270263672, -0.12597274780273438, -0.12133216857910156, -0.11669158935546875, -0.11205101013183594, -0.10741043090820312, -0.10276985168457031, -0.0981292724609375, -0.09348869323730469, -0.08884811401367188, -0.08420753479003906, -0.07956695556640625, -0.07492637634277344, -0.07028579711914062, -0.06564521789550781, -0.061004638671875, -0.05636405944824219, -0.051723480224609375, -0.04708290100097656, -0.04244232177734375, -0.03780174255371094, -0.033161163330078125, -0.028520584106445312, -0.0238800048828125, -0.019239425659179688, -0.014598846435546875, -0.009958267211914062, -0.00531768798828125, -0.0006771087646484375, 0.003963470458984375, 0.008604049682617188, 0.01324462890625, 0.017885208129882812, 0.022525787353515625, 0.027166366577148438, 0.03180694580078125, 0.03644752502441406, 0.041088104248046875, 0.04572868347167969, 0.0503692626953125, 0.05500984191894531, 0.059650421142578125, 0.06429100036621094, 0.06893157958984375, 0.07357215881347656, 0.07821273803710938, 0.08285331726074219, 0.087493896484375, 0.09213447570800781, 0.09677505493164062, 0.10141563415527344, 0.10605621337890625, 0.11069679260253906, 0.11533737182617188, 0.11997795104980469, 0.1246185302734375, 0.1292591094970703, 0.13389968872070312, 0.13854026794433594, 0.14318084716796875, 0.14782142639160156, 0.15246200561523438, 0.1571025848388672, 0.1617431640625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 7.0, 11.0, 19.0, 55.0, 99.0, 155.0, 173.0, 195.0, 130.0, 78.0, 38.0, 12.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.05173659324646, -2.937774896621704, -2.823812961578369, -2.7098512649536133, -2.5958895683288574, -2.4819278717041016, -2.3679659366607666, -2.2540042400360107, -2.140042304992676, -2.02608060836792, -1.9121187925338745, -1.798156976699829, -1.6841952800750732, -1.5702334642410278, -1.4562716484069824, -1.3423099517822266, -1.2283482551574707, -1.1143864393234253, -1.0004247426986694, -0.886462926864624, -0.7725011706352234, -0.6585394144058228, -0.5445775985717773, -0.4306158423423767, -0.3166540861129761, -0.20269231498241425, -0.08873054385185242, 0.025231242179870605, 0.13919299840927124, 0.2531547546386719, 0.3671165704727173, 0.4810783267021179, 0.5950398445129395, 0.7090016007423401, 0.8229633569717407, 0.9369251728057861, 1.050886869430542, 1.1648486852645874, 1.2788105010986328, 1.3927721977233887, 1.506734013557434, 1.6206958293914795, 1.7346575260162354, 1.8486193418502808, 1.9625811576843262, 2.076542854309082, 2.190504550933838, 2.304466485977173, 2.4184281826019287, 2.5323898792266846, 2.6463518142700195, 2.7603135108947754, 2.8742752075195312, 2.988236904144287, 3.102198839187622, 3.216160535812378, 3.330122470855713, 3.4440841674804688, 3.5580461025238037, 3.6720077991485596, 3.7859694957733154, 3.8999314308166504, 4.013893127441406, 4.127854824066162, 4.241816520690918]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 9.0, 3.0, 11.0, 10.0, 12.0, 15.0, 19.0, 18.0, 17.0, 22.0, 26.0, 30.0, 40.0, 37.0, 30.0, 40.0, 43.0, 46.0, 42.0, 30.0, 38.0, 47.0, 38.0, 41.0, 33.0, 28.0, 44.0, 36.0, 35.0, 32.0, 15.0, 19.0, 15.0, 15.0, 15.0, 11.0, 12.0, 5.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7066266536712646, -1.649868130683899, -1.5931096076965332, -1.536351203918457, -1.4795926809310913, -1.4228341579437256, -1.3660756349563599, -1.3093171119689941, -1.252558708190918, -1.1958001852035522, -1.1390416622161865, -1.0822832584381104, -1.0255247354507446, -0.9687662124633789, -0.9120076894760132, -0.8552492260932922, -0.7984907031059265, -0.7417321801185608, -0.6849737167358398, -0.6282151937484741, -0.5714567303657532, -0.5146982073783875, -0.4579397141933441, -0.4011812210083008, -0.34442272782325745, -0.2876642346382141, -0.23090574145317078, -0.17414723336696625, -0.11738874018192291, -0.060630232095718384, -0.003871738910675049, 0.052886754274368286, 0.10964524745941162, 0.16640374064445496, 0.2231622338294983, 0.279920756816864, 0.33667922019958496, 0.3934377431869507, 0.450196236371994, 0.5069547295570374, 0.5637131929397583, 0.620471715927124, 0.677230179309845, 0.7339887022972107, 0.7907471656799316, 0.8475056886672974, 0.9042642116546631, 0.961022675037384, 1.0177812576293945, 1.0745397806167603, 1.131298303604126, 1.1880567073822021, 1.2448152303695679, 1.3015737533569336, 1.3583322763442993, 1.415090799331665, 1.4718492031097412, 1.528607726097107, 1.5853662490844727, 1.6421246528625488, 1.6988831758499146, 1.7556416988372803, 1.812400221824646, 1.8691587448120117, 1.925917148590088]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 14.0, 10.0, 10.0, 23.0, 30.0, 39.0, 64.0, 102.0, 136.0, 174.0, 280.0, 465.0, 791.0, 1467.0, 2637.0, 5397.0, 12752.0, 34736.0, 102077.0, 295589.0, 719977.0, 1176151.0, 1039198.0, 516366.0, 187083.0, 61120.0, 20665.0, 8008.0, 3875.0, 1943.0, 1119.0, 658.0, 412.0, 295.0, 191.0, 130.0, 89.0, 60.0, 39.0, 33.0, 20.0, 26.0, 13.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2491455078125, -0.24130821228027344, -0.23347091674804688, -0.2256336212158203, -0.21779632568359375, -0.2099590301513672, -0.20212173461914062, -0.19428443908691406, -0.1864471435546875, -0.17860984802246094, -0.17077255249023438, -0.1629352569580078, -0.15509796142578125, -0.1472606658935547, -0.13942337036132812, -0.13158607482910156, -0.123748779296875, -0.11591148376464844, -0.10807418823242188, -0.10023689270019531, -0.09239959716796875, -0.08456230163574219, -0.07672500610351562, -0.06888771057128906, -0.0610504150390625, -0.05321311950683594, -0.045375823974609375, -0.03753852844238281, -0.02970123291015625, -0.021863937377929688, -0.014026641845703125, -0.0061893463134765625, 0.00164794921875, 0.009485244750976562, 0.017322540283203125, 0.025159835815429688, 0.03299713134765625, 0.04083442687988281, 0.048671722412109375, 0.05650901794433594, 0.0643463134765625, 0.07218360900878906, 0.08002090454101562, 0.08785820007324219, 0.09569549560546875, 0.10353279113769531, 0.11137008666992188, 0.11920738220214844, 0.127044677734375, 0.13488197326660156, 0.14271926879882812, 0.1505565643310547, 0.15839385986328125, 0.1662311553955078, 0.17406845092773438, 0.18190574645996094, 0.1897430419921875, 0.19758033752441406, 0.20541763305664062, 0.2132549285888672, 0.22109222412109375, 0.2289295196533203, 0.23676681518554688, 0.24460411071777344, 0.25244140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 3.0, 4.0, 3.0, 7.0, 8.0, 11.0, 10.0, 16.0, 22.0, 17.0, 24.0, 33.0, 31.0, 29.0, 45.0, 42.0, 39.0, 40.0, 30.0, 43.0, 43.0, 41.0, 44.0, 42.0, 37.0, 28.0, 31.0, 41.0, 37.0, 35.0, 21.0, 23.0, 20.0, 17.0, 11.0, 13.0, 9.0, 8.0, 6.0, 7.0, 8.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2301025390625, -0.22183799743652344, -0.21357345581054688, -0.2053089141845703, -0.19704437255859375, -0.1887798309326172, -0.18051528930664062, -0.17225074768066406, -0.1639862060546875, -0.15572166442871094, -0.14745712280273438, -0.1391925811767578, -0.13092803955078125, -0.12266349792480469, -0.11439895629882812, -0.10613441467285156, -0.097869873046875, -0.08960533142089844, -0.08134078979492188, -0.07307624816894531, -0.06481170654296875, -0.05654716491699219, -0.048282623291015625, -0.04001808166503906, -0.0317535400390625, -0.023488998413085938, -0.015224456787109375, -0.0069599151611328125, 0.00130462646484375, 0.009569168090820312, 0.017833709716796875, 0.026098251342773438, 0.03436279296875, 0.04262733459472656, 0.050891876220703125, 0.05915641784667969, 0.06742095947265625, 0.07568550109863281, 0.08395004272460938, 0.09221458435058594, 0.1004791259765625, 0.10874366760253906, 0.11700820922851562, 0.1252727508544922, 0.13353729248046875, 0.1418018341064453, 0.15006637573242188, 0.15833091735839844, 0.166595458984375, 0.17486000061035156, 0.18312454223632812, 0.1913890838623047, 0.19965362548828125, 0.2079181671142578, 0.21618270874023438, 0.22444725036621094, 0.2327117919921875, 0.24097633361816406, 0.24924087524414062, 0.2575054168701172, 0.26576995849609375, 0.2740345001220703, 0.2822990417480469, 0.29056358337402344, 0.298828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 8.0, 4.0, 7.0, 10.0, 7.0, 22.0, 38.0, 49.0, 85.0, 170.0, 284.0, 652.0, 1324.0, 3003.0, 7789.0, 23098.0, 80186.0, 357966.0, 1816877.0, 1521644.0, 283661.0, 66206.0, 19212.0, 6918.0, 2654.0, 1160.0, 605.0, 288.0, 160.0, 75.0, 47.0, 32.0, 18.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343505859375, -0.33074951171875, -0.3179931640625, -0.30523681640625, -0.29248046875, -0.27972412109375, -0.2669677734375, -0.25421142578125, -0.241455078125, -0.22869873046875, -0.2159423828125, -0.20318603515625, -0.1904296875, -0.17767333984375, -0.1649169921875, -0.15216064453125, -0.139404296875, -0.12664794921875, -0.1138916015625, -0.10113525390625, -0.08837890625, -0.07562255859375, -0.0628662109375, -0.05010986328125, -0.037353515625, -0.02459716796875, -0.0118408203125, 0.00091552734375, 0.013671875, 0.02642822265625, 0.0391845703125, 0.05194091796875, 0.064697265625, 0.07745361328125, 0.0902099609375, 0.10296630859375, 0.11572265625, 0.12847900390625, 0.1412353515625, 0.15399169921875, 0.166748046875, 0.17950439453125, 0.1922607421875, 0.20501708984375, 0.2177734375, 0.23052978515625, 0.2432861328125, 0.25604248046875, 0.268798828125, 0.28155517578125, 0.2943115234375, 0.30706787109375, 0.31982421875, 0.33258056640625, 0.3453369140625, 0.35809326171875, 0.370849609375, 0.38360595703125, 0.3963623046875, 0.40911865234375, 0.421875, 0.43463134765625, 0.4473876953125, 0.46014404296875, 0.472900390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 6.0, 11.0, 18.0, 23.0, 27.0, 27.0, 42.0, 43.0, 71.0, 80.0, 112.0, 172.0, 206.0, 291.0, 347.0, 413.0, 418.0, 355.0, 325.0, 252.0, 196.0, 139.0, 120.0, 86.0, 71.0, 47.0, 28.0, 21.0, 23.0, 18.0, 15.0, 10.0, 8.0, 12.0, 3.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3261756896972656, -0.31421661376953125, -0.3022575378417969, -0.2902984619140625, -0.2783393859863281, -0.26638031005859375, -0.2544212341308594, -0.242462158203125, -0.23050308227539062, -0.21854400634765625, -0.20658493041992188, -0.1946258544921875, -0.18266677856445312, -0.17070770263671875, -0.15874862670898438, -0.14678955078125, -0.13483047485351562, -0.12287139892578125, -0.11091232299804688, -0.0989532470703125, -0.08699417114257812, -0.07503509521484375, -0.06307601928710938, -0.051116943359375, -0.039157867431640625, -0.02719879150390625, -0.015239715576171875, -0.0032806396484375, 0.008678436279296875, 0.02063751220703125, 0.032596588134765625, 0.0445556640625, 0.056514739990234375, 0.06847381591796875, 0.08043289184570312, 0.0923919677734375, 0.10435104370117188, 0.11631011962890625, 0.12826919555664062, 0.140228271484375, 0.15218734741210938, 0.16414642333984375, 0.17610549926757812, 0.1880645751953125, 0.20002365112304688, 0.21198272705078125, 0.22394180297851562, 0.23590087890625, 0.24785995483398438, 0.25981903076171875, 0.2717781066894531, 0.2837371826171875, 0.2956962585449219, 0.30765533447265625, 0.3196144104003906, 0.331573486328125, 0.3435325622558594, 0.35549163818359375, 0.3674507141113281, 0.3794097900390625, 0.3913688659667969, 0.40332794189453125, 0.4152870178222656, 0.42724609375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 15.0, 36.0, 63.0, 151.0, 175.0, 229.0, 152.0, 91.0, 43.0, 24.0, 5.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.954829692840576, -4.821051597595215, -4.687273979187012, -4.55349588394165, -4.419718265533447, -4.285940170288086, -4.152162551879883, -4.0183844566345215, -3.8846065998077393, -3.750828742980957, -3.617050886154175, -3.4832730293273926, -3.3494949340820312, -3.215717315673828, -3.081939220428467, -2.9481613636016846, -2.8143835067749023, -2.68060564994812, -2.546827793121338, -2.4130499362945557, -2.2792720794677734, -2.145493984222412, -2.01171612739563, -1.8779382705688477, -1.7441604137420654, -1.6103825569152832, -1.476604700088501, -1.3428267240524292, -1.209048867225647, -1.0752710103988647, -0.9414930939674377, -0.8077151775360107, -0.6739375591278076, -0.5401597023010254, -0.4063817858695984, -0.2726038992404938, -0.13882601261138916, -0.005048155784606934, 0.12872976064682007, 0.26250767707824707, 0.3962855339050293, 0.5300633907318115, 0.6638413071632385, 0.7976192235946655, 0.9313970804214478, 1.06517493724823, 1.1989529132843018, 1.332730770111084, 1.4665086269378662, 1.6002864837646484, 1.7340643405914307, 1.8678423166275024, 2.001620292663574, 2.1353979110717773, 2.2691760063171387, 2.402953863143921, 2.536731719970703, 2.6705095767974854, 2.8042874336242676, 2.93806529045105, 3.071843147277832, 3.2056212425231934, 3.3393990993499756, 3.473176956176758, 3.60695481300354]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 11.0, 7.0, 11.0, 12.0, 18.0, 19.0, 22.0, 28.0, 27.0, 42.0, 30.0, 34.0, 39.0, 31.0, 25.0, 33.0, 38.0, 30.0, 33.0, 51.0, 41.0, 37.0, 51.0, 44.0, 36.0, 27.0, 29.0, 45.0, 24.0, 12.0, 18.0, 17.0, 14.0, 18.0, 9.0, 10.0, 12.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3525772094726562, -1.3114572763442993, -1.2703372240066528, -1.229217290878296, -1.1880972385406494, -1.1469773054122925, -1.1058573722839355, -1.064737319946289, -1.0236173868179321, -0.9824973940849304, -0.9413774013519287, -0.9002574682235718, -0.8591374754905701, -0.8180174827575684, -0.7768974900245667, -0.7357774972915649, -0.6946575045585632, -0.6535375118255615, -0.6124175190925598, -0.5712975263595581, -0.5301775932312012, -0.48905760049819946, -0.44793760776519775, -0.40681764483451843, -0.3656976521015167, -0.324577659368515, -0.2834576964378357, -0.24233770370483398, -0.20121772587299347, -0.16009774804115295, -0.11897775530815125, -0.07785779237747192, -0.036737799644470215, 0.004382181912660599, 0.04550216346979141, 0.08662214875221252, 0.12774212658405304, 0.16886210441589355, 0.20998209714889526, 0.2511020600795746, 0.2922220528125763, 0.333342045545578, 0.3744620084762573, 0.41558200120925903, 0.45670199394226074, 0.49782195687294006, 0.5389419794082642, 0.5800619125366211, 0.6211819052696228, 0.6623018980026245, 0.7034218907356262, 0.7445418834686279, 0.7856618165969849, 0.8267818093299866, 0.8679018020629883, 0.9090217351913452, 0.9501417875289917, 0.9912617802619934, 1.0323817729949951, 1.073501706123352, 1.1146217584609985, 1.1557416915893555, 1.196861743927002, 1.2379816770553589, 1.2791016101837158]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 3.0, 7.0, 9.0, 11.0, 14.0, 30.0, 36.0, 50.0, 69.0, 89.0, 117.0, 190.0, 250.0, 424.0, 677.0, 979.0, 1567.0, 2578.0, 4329.0, 7934.0, 16209.0, 38184.0, 100409.0, 225208.0, 301535.0, 200139.0, 83931.0, 32414.0, 13852.0, 6954.0, 3882.0, 2256.0, 1436.0, 880.0, 601.0, 407.0, 254.0, 180.0, 127.0, 91.0, 57.0, 40.0, 35.0, 31.0, 26.0, 16.0, 3.0, 9.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2864036560058594, -0.27666473388671875, -0.2669258117675781, -0.2571868896484375, -0.24744796752929688, -0.23770904541015625, -0.22797012329101562, -0.218231201171875, -0.20849227905273438, -0.19875335693359375, -0.18901443481445312, -0.1792755126953125, -0.16953659057617188, -0.15979766845703125, -0.15005874633789062, -0.14031982421875, -0.13058090209960938, -0.12084197998046875, -0.11110305786132812, -0.1013641357421875, -0.09162521362304688, -0.08188629150390625, -0.07214736938476562, -0.062408447265625, -0.052669525146484375, -0.04293060302734375, -0.033191680908203125, -0.0234527587890625, -0.013713836669921875, -0.00397491455078125, 0.005764007568359375, 0.0155029296875, 0.025241851806640625, 0.03498077392578125, 0.044719696044921875, 0.0544586181640625, 0.06419754028320312, 0.07393646240234375, 0.08367538452148438, 0.093414306640625, 0.10315322875976562, 0.11289215087890625, 0.12263107299804688, 0.1323699951171875, 0.14210891723632812, 0.15184783935546875, 0.16158676147460938, 0.17132568359375, 0.18106460571289062, 0.19080352783203125, 0.20054244995117188, 0.2102813720703125, 0.22002029418945312, 0.22975921630859375, 0.23949813842773438, 0.249237060546875, 0.2589759826660156, 0.26871490478515625, 0.2784538269042969, 0.2881927490234375, 0.2979316711425781, 0.30767059326171875, 0.3174095153808594, 0.3271484375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 7.0, 10.0, 8.0, 10.0, 12.0, 23.0, 14.0, 27.0, 30.0, 32.0, 36.0, 39.0, 59.0, 41.0, 40.0, 44.0, 48.0, 43.0, 49.0, 32.0, 53.0, 47.0, 34.0, 34.0, 24.0, 29.0, 29.0, 23.0, 21.0, 17.0, 23.0, 11.0, 7.0, 9.0, 3.0, 7.0, 2.0, 0.0, 8.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.278564453125, -0.2690086364746094, -0.25945281982421875, -0.24989700317382812, -0.2403411865234375, -0.23078536987304688, -0.22122955322265625, -0.21167373657226562, -0.202117919921875, -0.19256210327148438, -0.18300628662109375, -0.17345046997070312, -0.1638946533203125, -0.15433883666992188, -0.14478302001953125, -0.13522720336914062, -0.12567138671875, -0.11611557006835938, -0.10655975341796875, -0.09700393676757812, -0.0874481201171875, -0.07789230346679688, -0.06833648681640625, -0.058780670166015625, -0.049224853515625, -0.039669036865234375, -0.03011322021484375, -0.020557403564453125, -0.0110015869140625, -0.001445770263671875, 0.00811004638671875, 0.017665863037109375, 0.0272216796875, 0.036777496337890625, 0.04633331298828125, 0.055889129638671875, 0.0654449462890625, 0.07500076293945312, 0.08455657958984375, 0.09411239624023438, 0.103668212890625, 0.11322402954101562, 0.12277984619140625, 0.13233566284179688, 0.1418914794921875, 0.15144729614257812, 0.16100311279296875, 0.17055892944335938, 0.18011474609375, 0.18967056274414062, 0.19922637939453125, 0.20878219604492188, 0.2183380126953125, 0.22789382934570312, 0.23744964599609375, 0.24700546264648438, 0.256561279296875, 0.2661170959472656, 0.27567291259765625, 0.2852287292480469, 0.2947845458984375, 0.3043403625488281, 0.31389617919921875, 0.3234519958496094, 0.3330078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 0.0, 5.0, 6.0, 12.0, 20.0, 12.0, 28.0, 45.0, 46.0, 70.0, 122.0, 178.0, 271.0, 489.0, 778.0, 1281.0, 2070.0, 3699.0, 6301.0, 11495.0, 21367.0, 42301.0, 90135.0, 184870.0, 264879.0, 207200.0, 106278.0, 49971.0, 24226.0, 12997.0, 7086.0, 4181.0, 2427.0, 1442.0, 821.0, 495.0, 351.0, 212.0, 136.0, 78.0, 53.0, 30.0, 20.0, 19.0, 13.0, 15.0, 9.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.25641632080078125, -0.2474517822265625, -0.23848724365234375, -0.229522705078125, -0.22055816650390625, -0.2115936279296875, -0.20262908935546875, -0.19366455078125, -0.18470001220703125, -0.1757354736328125, -0.16677093505859375, -0.157806396484375, -0.14884185791015625, -0.1398773193359375, -0.13091278076171875, -0.1219482421875, -0.11298370361328125, -0.1040191650390625, -0.09505462646484375, -0.086090087890625, -0.07712554931640625, -0.0681610107421875, -0.05919647216796875, -0.05023193359375, -0.04126739501953125, -0.0323028564453125, -0.02333831787109375, -0.014373779296875, -0.00540924072265625, 0.0035552978515625, 0.01251983642578125, 0.021484375, 0.03044891357421875, 0.0394134521484375, 0.04837799072265625, 0.057342529296875, 0.06630706787109375, 0.0752716064453125, 0.08423614501953125, 0.09320068359375, 0.10216522216796875, 0.1111297607421875, 0.12009429931640625, 0.129058837890625, 0.13802337646484375, 0.1469879150390625, 0.15595245361328125, 0.1649169921875, 0.17388153076171875, 0.1828460693359375, 0.19181060791015625, 0.200775146484375, 0.20973968505859375, 0.2187042236328125, 0.22766876220703125, 0.23663330078125, 0.24559783935546875, 0.2545623779296875, 0.26352691650390625, 0.272491455078125, 0.28145599365234375, 0.2904205322265625, 0.29938507080078125, 0.308349609375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 14.0, 11.0, 15.0, 25.0, 19.0, 22.0, 31.0, 30.0, 31.0, 35.0, 46.0, 51.0, 53.0, 47.0, 55.0, 40.0, 50.0, 46.0, 36.0, 39.0, 36.0, 33.0, 32.0, 39.0, 25.0, 20.0, 15.0, 23.0, 13.0, 17.0, 8.0, 6.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8938140869140625, -0.866729736328125, -0.8396453857421875, -0.81256103515625, -0.7854766845703125, -0.758392333984375, -0.7313079833984375, -0.7042236328125, -0.6771392822265625, -0.650054931640625, -0.6229705810546875, -0.59588623046875, -0.5688018798828125, -0.541717529296875, -0.5146331787109375, -0.487548828125, -0.4604644775390625, -0.433380126953125, -0.4062957763671875, -0.37921142578125, -0.3521270751953125, -0.325042724609375, -0.2979583740234375, -0.2708740234375, -0.2437896728515625, -0.216705322265625, -0.1896209716796875, -0.16253662109375, -0.1354522705078125, -0.108367919921875, -0.0812835693359375, -0.05419921875, -0.0271148681640625, -3.0517578125e-05, 0.0270538330078125, 0.05413818359375, 0.0812225341796875, 0.108306884765625, 0.1353912353515625, 0.1624755859375, 0.1895599365234375, 0.216644287109375, 0.2437286376953125, 0.27081298828125, 0.2978973388671875, 0.324981689453125, 0.3520660400390625, 0.379150390625, 0.4062347412109375, 0.433319091796875, 0.4604034423828125, 0.48748779296875, 0.5145721435546875, 0.541656494140625, 0.5687408447265625, 0.5958251953125, 0.6229095458984375, 0.649993896484375, 0.6770782470703125, 0.70416259765625, 0.7312469482421875, 0.758331298828125, 0.7854156494140625, 0.8125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 13.0, 11.0, 27.0, 30.0, 42.0, 57.0, 78.0, 125.0, 217.0, 365.0, 596.0, 1044.0, 1755.0, 3294.0, 6049.0, 12175.0, 25576.0, 59865.0, 144823.0, 278580.0, 270509.0, 137809.0, 56305.0, 24189.0, 11626.0, 5899.0, 3187.0, 1775.0, 1014.0, 557.0, 326.0, 212.0, 153.0, 90.0, 51.0, 38.0, 24.0, 21.0, 11.0, 6.0, 9.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10174560546875, -0.09865951538085938, -0.09557342529296875, -0.09248733520507812, -0.0894012451171875, -0.08631515502929688, -0.08322906494140625, -0.08014297485351562, -0.077056884765625, -0.07397079467773438, -0.07088470458984375, -0.06779861450195312, -0.0647125244140625, -0.061626434326171875, -0.05854034423828125, -0.055454254150390625, -0.0523681640625, -0.049282073974609375, -0.04619598388671875, -0.043109893798828125, -0.0400238037109375, -0.036937713623046875, -0.03385162353515625, -0.030765533447265625, -0.027679443359375, -0.024593353271484375, -0.02150726318359375, -0.018421173095703125, -0.0153350830078125, -0.012248992919921875, -0.00916290283203125, -0.006076812744140625, -0.00299072265625, 9.5367431640625e-05, 0.00318145751953125, 0.006267547607421875, 0.0093536376953125, 0.012439727783203125, 0.01552581787109375, 0.018611907958984375, 0.021697998046875, 0.024784088134765625, 0.02787017822265625, 0.030956268310546875, 0.0340423583984375, 0.037128448486328125, 0.04021453857421875, 0.043300628662109375, 0.04638671875, 0.049472808837890625, 0.05255889892578125, 0.055644989013671875, 0.0587310791015625, 0.061817169189453125, 0.06490325927734375, 0.06798934936523438, 0.071075439453125, 0.07416152954101562, 0.07724761962890625, 0.08033370971679688, 0.0834197998046875, 0.08650588989257812, 0.08959197998046875, 0.09267807006835938, 0.09576416015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 6.0, 5.0, 5.0, 7.0, 13.0, 15.0, 28.0, 34.0, 57.0, 76.0, 86.0, 124.0, 127.0, 124.0, 82.0, 65.0, 48.0, 21.0, 17.0, 13.0, 10.0, 6.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.729364395141602e-05, -6.538163870573044e-05, -6.346963346004486e-05, -6.155762821435928e-05, -5.9645622968673706e-05, -5.773361772298813e-05, -5.582161247730255e-05, -5.3909607231616974e-05, -5.1997601985931396e-05, -5.008559674024582e-05, -4.817359149456024e-05, -4.6261586248874664e-05, -4.434958100318909e-05, -4.243757575750351e-05, -4.052557051181793e-05, -3.8613565266132355e-05, -3.670156002044678e-05, -3.47895547747612e-05, -3.287754952907562e-05, -3.0965544283390045e-05, -2.9053539037704468e-05, -2.714153379201889e-05, -2.5229528546333313e-05, -2.3317523300647736e-05, -2.1405518054962158e-05, -1.949351280927658e-05, -1.7581507563591003e-05, -1.5669502317905426e-05, -1.3757497072219849e-05, -1.1845491826534271e-05, -9.933486580848694e-06, -8.021481335163116e-06, -6.109476089477539e-06, -4.197470843791962e-06, -2.2854655981063843e-06, -3.734603524208069e-07, 1.5385448932647705e-06, 3.450550138950348e-06, 5.362555384635925e-06, 7.274560630321503e-06, 9.18656587600708e-06, 1.1098571121692657e-05, 1.3010576367378235e-05, 1.4922581613063812e-05, 1.683458685874939e-05, 1.8746592104434967e-05, 2.0658597350120544e-05, 2.2570602595806122e-05, 2.44826078414917e-05, 2.6394613087177277e-05, 2.8306618332862854e-05, 3.021862357854843e-05, 3.213062882423401e-05, 3.4042634069919586e-05, 3.5954639315605164e-05, 3.786664456129074e-05, 3.977864980697632e-05, 4.1690655052661896e-05, 4.360266029834747e-05, 4.551466554403305e-05, 4.742667078971863e-05, 4.9338676035404205e-05, 5.125068128108978e-05, 5.316268652677536e-05, 5.507469177246094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 9.0, 11.0, 19.0, 20.0, 45.0, 80.0, 99.0, 174.0, 268.0, 418.0, 773.0, 1388.0, 2428.0, 4370.0, 8355.0, 15887.0, 30669.0, 60764.0, 115495.0, 188790.0, 225019.0, 176813.0, 104386.0, 54192.0, 27456.0, 14147.0, 7454.0, 3973.0, 2163.0, 1164.0, 677.0, 413.0, 236.0, 144.0, 84.0, 54.0, 36.0, 24.0, 16.0, 9.0, 10.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07379150390625, -0.0714426040649414, -0.06909370422363281, -0.06674480438232422, -0.06439590454101562, -0.06204700469970703, -0.05969810485839844, -0.057349205017089844, -0.05500030517578125, -0.052651405334472656, -0.05030250549316406, -0.04795360565185547, -0.045604705810546875, -0.04325580596923828, -0.04090690612792969, -0.038558006286621094, -0.0362091064453125, -0.033860206604003906, -0.03151130676269531, -0.02916240692138672, -0.026813507080078125, -0.02446460723876953, -0.022115707397460938, -0.019766807556152344, -0.01741790771484375, -0.015069007873535156, -0.012720108032226562, -0.010371208190917969, -0.008022308349609375, -0.005673408508300781, -0.0033245086669921875, -0.0009756088256835938, 0.001373291015625, 0.0037221908569335938, 0.0060710906982421875, 0.008419990539550781, 0.010768890380859375, 0.013117790222167969, 0.015466690063476562, 0.017815589904785156, 0.02016448974609375, 0.022513389587402344, 0.024862289428710938, 0.02721118927001953, 0.029560089111328125, 0.03190898895263672, 0.03425788879394531, 0.036606788635253906, 0.0389556884765625, 0.041304588317871094, 0.04365348815917969, 0.04600238800048828, 0.048351287841796875, 0.05070018768310547, 0.05304908752441406, 0.055397987365722656, 0.05774688720703125, 0.060095787048339844, 0.06244468688964844, 0.06479358673095703, 0.06714248657226562, 0.06949138641357422, 0.07184028625488281, 0.0741891860961914, 0.0765380859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 8.0, 6.0, 9.0, 17.0, 11.0, 24.0, 25.0, 26.0, 26.0, 35.0, 37.0, 45.0, 47.0, 61.0, 49.0, 53.0, 51.0, 45.0, 50.0, 53.0, 43.0, 44.0, 38.0, 32.0, 26.0, 20.0, 17.0, 17.0, 11.0, 10.0, 11.0, 9.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10626220703125, -0.10299015045166016, -0.09971809387207031, -0.09644603729248047, -0.09317398071289062, -0.08990192413330078, -0.08662986755371094, -0.0833578109741211, -0.08008575439453125, -0.0768136978149414, -0.07354164123535156, -0.07026958465576172, -0.06699752807617188, -0.06372547149658203, -0.06045341491699219, -0.057181358337402344, -0.0539093017578125, -0.050637245178222656, -0.04736518859863281, -0.04409313201904297, -0.040821075439453125, -0.03754901885986328, -0.03427696228027344, -0.031004905700683594, -0.02773284912109375, -0.024460792541503906, -0.021188735961914062, -0.01791667938232422, -0.014644622802734375, -0.011372566223144531, -0.008100509643554688, -0.004828453063964844, -0.001556396484375, 0.0017156600952148438, 0.0049877166748046875, 0.008259773254394531, 0.011531829833984375, 0.014803886413574219, 0.018075942993164062, 0.021347999572753906, 0.02462005615234375, 0.027892112731933594, 0.031164169311523438, 0.03443622589111328, 0.037708282470703125, 0.04098033905029297, 0.04425239562988281, 0.047524452209472656, 0.0507965087890625, 0.054068565368652344, 0.05734062194824219, 0.06061267852783203, 0.06388473510742188, 0.06715679168701172, 0.07042884826660156, 0.0737009048461914, 0.07697296142578125, 0.0802450180053711, 0.08351707458496094, 0.08678913116455078, 0.09006118774414062, 0.09333324432373047, 0.09660530090332031, 0.09987735748291016, 0.1031494140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 9.0, 21.0, 34.0, 70.0, 115.0, 176.0, 203.0, 164.0, 91.0, 61.0, 20.0, 15.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7886669635772705, -2.6865320205688477, -2.584397315979004, -2.482262372970581, -2.380127429962158, -2.2779927253723145, -2.1758577823638916, -2.0737228393554688, -1.971588134765625, -1.8694533109664917, -1.7673183679580688, -1.6651835441589355, -1.5630487203598022, -1.460913896560669, -1.358778953552246, -1.2566441297531128, -1.15450918674469, -1.0523743629455566, -0.9502394795417786, -0.8481045961380005, -0.7459697723388672, -0.6438348889350891, -0.541700005531311, -0.43956518173217773, -0.33743029832839966, -0.23529544472694397, -0.1331605762243271, -0.031025707721710205, 0.07110914587974548, 0.17324399948120117, 0.27537888288497925, 0.37751370668411255, 0.4796485900878906, 0.5817834734916687, 0.683918297290802, 0.7860531806945801, 0.8881880044937134, 0.9903228878974915, 1.0924577713012695, 1.1945925951004028, 1.2967274188995361, 1.3988622426986694, 1.5009971857070923, 1.6031320095062256, 1.7052668333053589, 1.8074016571044922, 1.909536600112915, 2.011671543121338, 2.1138062477111816, 2.2159411907196045, 2.3180758953094482, 2.420210838317871, 2.522345781326294, 2.6244804859161377, 2.7266154289245605, 2.8287501335144043, 2.9308853149414062, 3.033020257949829, 3.135154962539673, 3.2372899055480957, 3.3394248485565186, 3.4415595531463623, 3.543694496154785, 3.645829200744629, 3.7479641437530518]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 10.0, 5.0, 11.0, 7.0, 9.0, 10.0, 10.0, 19.0, 13.0, 17.0, 24.0, 36.0, 37.0, 33.0, 37.0, 42.0, 46.0, 45.0, 49.0, 51.0, 28.0, 36.0, 48.0, 30.0, 30.0, 41.0, 41.0, 41.0, 25.0, 24.0, 26.0, 25.0, 17.0, 18.0, 15.0, 12.0, 6.0, 5.0, 4.0, 3.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.823325514793396, -1.7693320512771606, -1.7153385877609253, -1.6613450050354004, -1.607351541519165, -1.5533580780029297, -1.4993646144866943, -1.445371150970459, -1.3913776874542236, -1.3373842239379883, -1.283390760421753, -1.2293972969055176, -1.1754037141799927, -1.1214102506637573, -1.067416787147522, -1.0134233236312866, -0.9594298005104065, -0.9054363369941711, -0.851442813873291, -0.7974493503570557, -0.7434558868408203, -0.689462423324585, -0.6354689002037048, -0.5814754366874695, -0.5274819135665894, -0.4734884202480316, -0.41949495673179626, -0.3655014634132385, -0.3115079998970032, -0.25751450657844543, -0.2035210132598877, -0.14952754974365234, -0.09553408622741699, -0.04154060408473015, 0.012452878057956696, 0.06644636392593384, 0.12043984234333038, 0.17443332076072693, 0.22842681407928467, 0.28242027759552, 0.33641377091407776, 0.3904072642326355, 0.44440072774887085, 0.4983942210674286, 0.5523877143859863, 0.6063811779022217, 0.660374641418457, 0.7143681049346924, 0.7683616280555725, 0.8223550915718079, 0.876348614692688, 0.9303420782089233, 0.9843355417251587, 1.038329005241394, 1.092322587966919, 1.1463160514831543, 1.2003095149993896, 1.254302978515625, 1.3082964420318604, 1.3622899055480957, 1.4162834882736206, 1.470276951789856, 1.5242704153060913, 1.5782638788223267, 1.632257342338562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 2.0, 3.0, 4.0, 11.0, 12.0, 14.0, 18.0, 29.0, 36.0, 43.0, 76.0, 106.0, 161.0, 257.0, 406.0, 547.0, 896.0, 1548.0, 2760.0, 5549.0, 11987.0, 29749.0, 80210.0, 219251.0, 510157.0, 908676.0, 1059718.0, 752647.0, 367445.0, 148213.0, 55345.0, 20604.0, 8384.0, 4046.0, 2108.0, 1197.0, 726.0, 448.0, 279.0, 194.0, 126.0, 90.0, 54.0, 42.0, 36.0, 23.0, 16.0, 13.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2005615234375, -0.1937122344970703, -0.18686294555664062, -0.18001365661621094, -0.17316436767578125, -0.16631507873535156, -0.15946578979492188, -0.1526165008544922, -0.1457672119140625, -0.1389179229736328, -0.13206863403320312, -0.12521934509277344, -0.11837005615234375, -0.11152076721191406, -0.10467147827148438, -0.09782218933105469, -0.090972900390625, -0.08412361145019531, -0.07727432250976562, -0.07042503356933594, -0.06357574462890625, -0.05672645568847656, -0.049877166748046875, -0.04302787780761719, -0.0361785888671875, -0.029329299926757812, -0.022480010986328125, -0.015630722045898438, -0.00878143310546875, -0.0019321441650390625, 0.004917144775390625, 0.011766433715820312, 0.01861572265625, 0.025465011596679688, 0.032314300537109375, 0.03916358947753906, 0.04601287841796875, 0.05286216735839844, 0.059711456298828125, 0.06656074523925781, 0.0734100341796875, 0.08025932312011719, 0.08710861206054688, 0.09395790100097656, 0.10080718994140625, 0.10765647888183594, 0.11450576782226562, 0.12135505676269531, 0.128204345703125, 0.1350536346435547, 0.14190292358398438, 0.14875221252441406, 0.15560150146484375, 0.16245079040527344, 0.16930007934570312, 0.1761493682861328, 0.1829986572265625, 0.1898479461669922, 0.19669723510742188, 0.20354652404785156, 0.21039581298828125, 0.21724510192871094, 0.22409439086914062, 0.2309436798095703, 0.23779296875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 6.0, 6.0, 2.0, 4.0, 14.0, 9.0, 17.0, 13.0, 19.0, 20.0, 40.0, 41.0, 28.0, 37.0, 42.0, 30.0, 42.0, 42.0, 47.0, 62.0, 31.0, 44.0, 43.0, 48.0, 33.0, 35.0, 38.0, 31.0, 23.0, 22.0, 27.0, 24.0, 15.0, 8.0, 16.0, 10.0, 8.0, 5.0, 2.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2392578125, -0.23063278198242188, -0.22200775146484375, -0.21338272094726562, -0.2047576904296875, -0.19613265991210938, -0.18750762939453125, -0.17888259887695312, -0.170257568359375, -0.16163253784179688, -0.15300750732421875, -0.14438247680664062, -0.1357574462890625, -0.12713241577148438, -0.11850738525390625, -0.10988235473632812, -0.10125732421875, -0.09263229370117188, -0.08400726318359375, -0.07538223266601562, -0.0667572021484375, -0.058132171630859375, -0.04950714111328125, -0.040882110595703125, -0.032257080078125, -0.023632049560546875, -0.01500701904296875, -0.006381988525390625, 0.0022430419921875, 0.010868072509765625, 0.01949310302734375, 0.028118133544921875, 0.0367431640625, 0.045368194580078125, 0.05399322509765625, 0.06261825561523438, 0.0712432861328125, 0.07986831665039062, 0.08849334716796875, 0.09711837768554688, 0.105743408203125, 0.11436843872070312, 0.12299346923828125, 0.13161849975585938, 0.1402435302734375, 0.14886856079101562, 0.15749359130859375, 0.16611862182617188, 0.17474365234375, 0.18336868286132812, 0.19199371337890625, 0.20061874389648438, 0.2092437744140625, 0.21786880493164062, 0.22649383544921875, 0.23511886596679688, 0.243743896484375, 0.2523689270019531, 0.26099395751953125, 0.2696189880371094, 0.2782440185546875, 0.2868690490722656, 0.29549407958984375, 0.3041191101074219, 0.312744140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 15.0, 24.0, 23.0, 36.0, 77.0, 110.0, 178.0, 333.0, 575.0, 1037.0, 2029.0, 4082.0, 9277.0, 23244.0, 66790.0, 238126.0, 1098997.0, 1980054.0, 565565.0, 133933.0, 41503.0, 15473.0, 6449.0, 2973.0, 1556.0, 782.0, 418.0, 224.0, 135.0, 79.0, 57.0, 41.0, 34.0, 21.0, 7.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31689453125, -0.3070793151855469, -0.29726409912109375, -0.2874488830566406, -0.2776336669921875, -0.2678184509277344, -0.25800323486328125, -0.24818801879882812, -0.238372802734375, -0.22855758666992188, -0.21874237060546875, -0.20892715454101562, -0.1991119384765625, -0.18929672241210938, -0.17948150634765625, -0.16966629028320312, -0.15985107421875, -0.15003585815429688, -0.14022064208984375, -0.13040542602539062, -0.1205902099609375, -0.11077499389648438, -0.10095977783203125, -0.09114456176757812, -0.081329345703125, -0.07151412963867188, -0.06169891357421875, -0.051883697509765625, -0.0420684814453125, -0.032253265380859375, -0.02243804931640625, -0.012622833251953125, -0.0028076171875, 0.007007598876953125, 0.01682281494140625, 0.026638031005859375, 0.0364532470703125, 0.046268463134765625, 0.05608367919921875, 0.06589889526367188, 0.075714111328125, 0.08552932739257812, 0.09534454345703125, 0.10515975952148438, 0.1149749755859375, 0.12479019165039062, 0.13460540771484375, 0.14442062377929688, 0.15423583984375, 0.16405105590820312, 0.17386627197265625, 0.18368148803710938, 0.1934967041015625, 0.20331192016601562, 0.21312713623046875, 0.22294235229492188, 0.232757568359375, 0.24257278442382812, 0.25238800048828125, 0.2622032165527344, 0.2720184326171875, 0.2818336486816406, 0.29164886474609375, 0.3014640808105469, 0.311279296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 7.0, 15.0, 19.0, 13.0, 25.0, 30.0, 33.0, 67.0, 63.0, 120.0, 146.0, 232.0, 307.0, 426.0, 480.0, 452.0, 453.0, 326.0, 241.0, 150.0, 137.0, 78.0, 65.0, 53.0, 25.0, 36.0, 16.0, 17.0, 7.0, 8.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41650390625, -0.4035377502441406, -0.39057159423828125, -0.3776054382324219, -0.3646392822265625, -0.3516731262207031, -0.33870697021484375, -0.3257408142089844, -0.312774658203125, -0.2998085021972656, -0.28684234619140625, -0.2738761901855469, -0.2609100341796875, -0.24794387817382812, -0.23497772216796875, -0.22201156616210938, -0.20904541015625, -0.19607925415039062, -0.18311309814453125, -0.17014694213867188, -0.1571807861328125, -0.14421463012695312, -0.13124847412109375, -0.11828231811523438, -0.105316162109375, -0.09235000610351562, -0.07938385009765625, -0.06641769409179688, -0.0534515380859375, -0.040485382080078125, -0.02751922607421875, -0.014553070068359375, -0.0015869140625, 0.011379241943359375, 0.02434539794921875, 0.037311553955078125, 0.0502777099609375, 0.06324386596679688, 0.07621002197265625, 0.08917617797851562, 0.102142333984375, 0.11510848999023438, 0.12807464599609375, 0.14104080200195312, 0.1540069580078125, 0.16697311401367188, 0.17993927001953125, 0.19290542602539062, 0.20587158203125, 0.21883773803710938, 0.23180389404296875, 0.24477005004882812, 0.2577362060546875, 0.2707023620605469, 0.28366851806640625, 0.2966346740722656, 0.309600830078125, 0.3225669860839844, 0.33553314208984375, 0.3484992980957031, 0.3614654541015625, 0.3744316101074219, 0.38739776611328125, 0.4003639221191406, 0.413330078125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 7.0, 17.0, 62.0, 224.0, 375.0, 207.0, 82.0, 15.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.769885301589966, -3.5406415462493896, -3.3113975524902344, -3.082153797149658, -2.852910041809082, -2.623666286468506, -2.3944222927093506, -2.1651785373687744, -1.9359346628189087, -1.706690788269043, -1.4774470329284668, -1.248203158378601, -1.0189592838287354, -0.7897155284881592, -0.5604716539382935, -0.3312278985977173, -0.10198402404785156, 0.12725980579853058, 0.3565036356449127, 0.585747480392456, 0.814991295337677, 1.044235110282898, 1.2734789848327637, 1.5027227401733398, 1.7319666147232056, 1.9612104892730713, 2.1904542446136475, 2.4196982383728027, 2.648941993713379, 2.878185749053955, 3.1074295043945312, 3.3366732597351074, 3.565917491912842, 3.795161247253418, 4.024405002593994, 4.25364875793457, 4.482892990112305, 4.712136745452881, 4.941380500793457, 5.170624256134033, 5.399868011474609, 5.6291117668151855, 5.858355522155762, 6.087599754333496, 6.316843509674072, 6.546087265014648, 6.775331020355225, 7.004574775695801, 7.233819007873535, 7.463062763214111, 7.6923065185546875, 7.921550750732422, 8.15079402923584, 8.380038261413574, 8.609281539916992, 8.838525772094727, 9.067769050598145, 9.297013282775879, 9.526256561279297, 9.755500793457031, 9.98474407196045, 10.213988304138184, 10.443231582641602, 10.672475814819336, 10.90172004699707]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 6.0, 11.0, 8.0, 13.0, 22.0, 23.0, 23.0, 19.0, 43.0, 29.0, 32.0, 24.0, 33.0, 28.0, 39.0, 46.0, 27.0, 27.0, 41.0, 35.0, 36.0, 45.0, 31.0, 39.0, 31.0, 34.0, 33.0, 34.0, 18.0, 24.0, 17.0, 23.0, 15.0, 16.0, 12.0, 8.0, 6.0, 8.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.261836290359497, -1.2233893871307373, -1.1849424839019775, -1.1464955806732178, -1.1080487966537476, -1.0696018934249878, -1.031154990196228, -0.9927080869674683, -0.9542611837387085, -0.9158142805099487, -0.8773674368858337, -0.838920533657074, -0.8004736304283142, -0.7620267868041992, -0.7235798835754395, -0.6851329803466797, -0.6466861367225647, -0.6082392334938049, -0.5697923898696899, -0.5313454866409302, -0.4928985834121704, -0.45445170998573303, -0.41600483655929565, -0.3775579333305359, -0.3391110599040985, -0.30066418647766113, -0.26221728324890137, -0.223770409822464, -0.18532352149486542, -0.14687663316726685, -0.10842975974082947, -0.0699828565120697, -0.031535983085632324, 0.006910901516675949, 0.04535778611898422, 0.0838046669960022, 0.12225155532360077, 0.16069844365119934, 0.19914531707763672, 0.23759222030639648, 0.27603909373283386, 0.31448596715927124, 0.352932870388031, 0.3913797438144684, 0.42982661724090576, 0.4682735204696655, 0.5067204236984253, 0.5451673269271851, 0.5836141705513, 0.6220610737800598, 0.6605079174041748, 0.6989548206329346, 0.7374017238616943, 0.7758486270904541, 0.8142954707145691, 0.8527423739433289, 0.8911892175674438, 0.9296361207962036, 0.9680829644203186, 1.0065298080444336, 1.0449767112731934, 1.0834236145019531, 1.121870517730713, 1.1603174209594727, 1.1987643241882324]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 21.0, 18.0, 24.0, 37.0, 36.0, 79.0, 110.0, 180.0, 244.0, 362.0, 558.0, 925.0, 1468.0, 2461.0, 4134.0, 7161.0, 12651.0, 22435.0, 39787.0, 68863.0, 112748.0, 162576.0, 184410.0, 159582.0, 110348.0, 67175.0, 38677.0, 21485.0, 12275.0, 7215.0, 4195.0, 2367.0, 1416.0, 843.0, 586.0, 354.0, 239.0, 153.0, 107.0, 64.0, 56.0, 28.0, 30.0, 20.0, 14.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.192138671875, -0.18622207641601562, -0.18030548095703125, -0.17438888549804688, -0.1684722900390625, -0.16255569458007812, -0.15663909912109375, -0.15072250366210938, -0.144805908203125, -0.13888931274414062, -0.13297271728515625, -0.12705612182617188, -0.1211395263671875, -0.11522293090820312, -0.10930633544921875, -0.10338973999023438, -0.09747314453125, -0.09155654907226562, -0.08563995361328125, -0.07972335815429688, -0.0738067626953125, -0.06789016723632812, -0.06197357177734375, -0.056056976318359375, -0.050140380859375, -0.044223785400390625, -0.03830718994140625, -0.032390594482421875, -0.0264739990234375, -0.020557403564453125, -0.01464080810546875, -0.008724212646484375, -0.0028076171875, 0.003108978271484375, 0.00902557373046875, 0.014942169189453125, 0.0208587646484375, 0.026775360107421875, 0.03269195556640625, 0.038608551025390625, 0.044525146484375, 0.050441741943359375, 0.05635833740234375, 0.062274932861328125, 0.0681915283203125, 0.07410812377929688, 0.08002471923828125, 0.08594131469726562, 0.09185791015625, 0.09777450561523438, 0.10369110107421875, 0.10960769653320312, 0.1155242919921875, 0.12144088745117188, 0.12735748291015625, 0.13327407836914062, 0.139190673828125, 0.14510726928710938, 0.15102386474609375, 0.15694046020507812, 0.1628570556640625, 0.16877365112304688, 0.17469024658203125, 0.18060684204101562, 0.1865234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 8.0, 7.0, 2.0, 8.0, 18.0, 23.0, 19.0, 29.0, 35.0, 20.0, 30.0, 42.0, 35.0, 57.0, 43.0, 65.0, 39.0, 55.0, 45.0, 48.0, 46.0, 38.0, 49.0, 34.0, 24.0, 28.0, 32.0, 17.0, 26.0, 22.0, 10.0, 11.0, 7.0, 10.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0], "bins": [-0.366455078125, -0.3566856384277344, -0.34691619873046875, -0.3371467590332031, -0.3273773193359375, -0.3176078796386719, -0.30783843994140625, -0.2980690002441406, -0.288299560546875, -0.2785301208496094, -0.26876068115234375, -0.2589912414550781, -0.2492218017578125, -0.23945236206054688, -0.22968292236328125, -0.21991348266601562, -0.21014404296875, -0.20037460327148438, -0.19060516357421875, -0.18083572387695312, -0.1710662841796875, -0.16129684448242188, -0.15152740478515625, -0.14175796508789062, -0.131988525390625, -0.12221908569335938, -0.11244964599609375, -0.10268020629882812, -0.0929107666015625, -0.08314132690429688, -0.07337188720703125, -0.06360244750976562, -0.0538330078125, -0.044063568115234375, -0.03429412841796875, -0.024524688720703125, -0.0147552490234375, -0.004985809326171875, 0.00478363037109375, 0.014553070068359375, 0.024322509765625, 0.034091949462890625, 0.04386138916015625, 0.053630828857421875, 0.0634002685546875, 0.07316970825195312, 0.08293914794921875, 0.09270858764648438, 0.10247802734375, 0.11224746704101562, 0.12201690673828125, 0.13178634643554688, 0.1415557861328125, 0.15132522583007812, 0.16109466552734375, 0.17086410522460938, 0.180633544921875, 0.19040298461914062, 0.20017242431640625, 0.20994186401367188, 0.2197113037109375, 0.22948074340820312, 0.23925018310546875, 0.24901962280273438, 0.2587890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 18.0, 11.0, 23.0, 33.0, 48.0, 78.0, 127.0, 173.0, 305.0, 502.0, 823.0, 1455.0, 2396.0, 4287.0, 7716.0, 13966.0, 26038.0, 48517.0, 87299.0, 147910.0, 226908.0, 193282.0, 127083.0, 72853.0, 39185.0, 21291.0, 11467.0, 6179.0, 3504.0, 1984.0, 1195.0, 683.0, 439.0, 273.0, 167.0, 122.0, 63.0, 52.0, 30.0, 20.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205810546875, -0.19913673400878906, -0.19246292114257812, -0.1857891082763672, -0.17911529541015625, -0.1724414825439453, -0.16576766967773438, -0.15909385681152344, -0.1524200439453125, -0.14574623107910156, -0.13907241821289062, -0.1323986053466797, -0.12572479248046875, -0.11905097961425781, -0.11237716674804688, -0.10570335388183594, -0.099029541015625, -0.09235572814941406, -0.08568191528320312, -0.07900810241699219, -0.07233428955078125, -0.06566047668457031, -0.058986663818359375, -0.05231285095214844, -0.0456390380859375, -0.03896522521972656, -0.032291412353515625, -0.025617599487304688, -0.01894378662109375, -0.012269973754882812, -0.005596160888671875, 0.0010776519775390625, 0.00775146484375, 0.014425277709960938, 0.021099090576171875, 0.027772903442382812, 0.03444671630859375, 0.04112052917480469, 0.047794342041015625, 0.05446815490722656, 0.0611419677734375, 0.06781578063964844, 0.07448959350585938, 0.08116340637207031, 0.08783721923828125, 0.09451103210449219, 0.10118484497070312, 0.10785865783691406, 0.114532470703125, 0.12120628356933594, 0.12788009643554688, 0.1345539093017578, 0.14122772216796875, 0.1479015350341797, 0.15457534790039062, 0.16124916076660156, 0.1679229736328125, 0.17459678649902344, 0.18127059936523438, 0.1879444122314453, 0.19461822509765625, 0.2012920379638672, 0.20796585083007812, 0.21463966369628906, 0.2213134765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 7.0, 11.0, 10.0, 8.0, 7.0, 17.0, 18.0, 23.0, 31.0, 32.0, 40.0, 30.0, 40.0, 30.0, 47.0, 41.0, 39.0, 43.0, 36.0, 44.0, 48.0, 35.0, 39.0, 33.0, 40.0, 29.0, 30.0, 30.0, 18.0, 20.0, 18.0, 26.0, 11.0, 9.0, 11.0, 13.0, 14.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.62103271484375, -0.5994873046875, -0.57794189453125, -0.556396484375, -0.53485107421875, -0.5133056640625, -0.49176025390625, -0.47021484375, -0.44866943359375, -0.4271240234375, -0.40557861328125, -0.384033203125, -0.36248779296875, -0.3409423828125, -0.31939697265625, -0.2978515625, -0.27630615234375, -0.2547607421875, -0.23321533203125, -0.211669921875, -0.19012451171875, -0.1685791015625, -0.14703369140625, -0.12548828125, -0.10394287109375, -0.0823974609375, -0.06085205078125, -0.039306640625, -0.01776123046875, 0.0037841796875, 0.02532958984375, 0.046875, 0.06842041015625, 0.0899658203125, 0.11151123046875, 0.133056640625, 0.15460205078125, 0.1761474609375, 0.19769287109375, 0.21923828125, 0.24078369140625, 0.2623291015625, 0.28387451171875, 0.305419921875, 0.32696533203125, 0.3485107421875, 0.37005615234375, 0.3916015625, 0.41314697265625, 0.4346923828125, 0.45623779296875, 0.477783203125, 0.49932861328125, 0.5208740234375, 0.54241943359375, 0.56396484375, 0.58551025390625, 0.6070556640625, 0.62860107421875, 0.650146484375, 0.67169189453125, 0.6932373046875, 0.71478271484375, 0.736328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 12.0, 24.0, 16.0, 33.0, 56.0, 73.0, 129.0, 184.0, 282.0, 437.0, 652.0, 1007.0, 1664.0, 2733.0, 4524.0, 7573.0, 12831.0, 21620.0, 36334.0, 59423.0, 92340.0, 135123.0, 195526.0, 161807.0, 115703.0, 77316.0, 48521.0, 29133.0, 17565.0, 10215.0, 6071.0, 3632.0, 2197.0, 1390.0, 855.0, 551.0, 319.0, 230.0, 128.0, 97.0, 80.0, 49.0, 36.0, 16.0, 13.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.041259765625, -0.0400385856628418, -0.038817405700683594, -0.03759622573852539, -0.03637504577636719, -0.035153865814208984, -0.03393268585205078, -0.03271150588989258, -0.031490325927734375, -0.030269145965576172, -0.02904796600341797, -0.027826786041259766, -0.026605606079101562, -0.02538442611694336, -0.024163246154785156, -0.022942066192626953, -0.02172088623046875, -0.020499706268310547, -0.019278526306152344, -0.01805734634399414, -0.016836166381835938, -0.015614986419677734, -0.014393806457519531, -0.013172626495361328, -0.011951446533203125, -0.010730266571044922, -0.009509086608886719, -0.008287906646728516, -0.0070667266845703125, -0.005845546722412109, -0.004624366760253906, -0.003403186798095703, -0.0021820068359375, -0.0009608268737792969, 0.00026035308837890625, 0.0014815330505371094, 0.0027027130126953125, 0.003923892974853516, 0.005145072937011719, 0.006366252899169922, 0.007587432861328125, 0.008808612823486328, 0.010029792785644531, 0.011250972747802734, 0.012472152709960938, 0.01369333267211914, 0.014914512634277344, 0.016135692596435547, 0.01735687255859375, 0.018578052520751953, 0.019799232482910156, 0.02102041244506836, 0.022241592407226562, 0.023462772369384766, 0.02468395233154297, 0.025905132293701172, 0.027126312255859375, 0.028347492218017578, 0.02956867218017578, 0.030789852142333984, 0.03201103210449219, 0.03323221206665039, 0.034453392028808594, 0.0356745719909668, 0.036895751953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 7.0, 8.0, 6.0, 8.0, 12.0, 25.0, 18.0, 26.0, 25.0, 42.0, 35.0, 55.0, 66.0, 69.0, 73.0, 73.0, 73.0, 62.0, 54.0, 40.0, 43.0, 30.0, 29.0, 20.0, 20.0, 15.0, 11.0, 11.0, 11.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.562999725341797e-05, -2.477876842021942e-05, -2.3927539587020874e-05, -2.3076310753822327e-05, -2.222508192062378e-05, -2.1373853087425232e-05, -2.0522624254226685e-05, -1.9671395421028137e-05, -1.882016658782959e-05, -1.7968937754631042e-05, -1.7117708921432495e-05, -1.6266480088233948e-05, -1.54152512550354e-05, -1.4564022421836853e-05, -1.3712793588638306e-05, -1.2861564755439758e-05, -1.2010335922241211e-05, -1.1159107089042664e-05, -1.0307878255844116e-05, -9.456649422645569e-06, -8.605420589447021e-06, -7.754191756248474e-06, -6.902962923049927e-06, -6.051734089851379e-06, -5.200505256652832e-06, -4.349276423454285e-06, -3.4980475902557373e-06, -2.64681875705719e-06, -1.7955899238586426e-06, -9.443610906600952e-07, -9.313225746154785e-08, 7.580965757369995e-07, 1.6093254089355469e-06, 2.4605542421340942e-06, 3.3117830753326416e-06, 4.163011908531189e-06, 5.014240741729736e-06, 5.865469574928284e-06, 6.716698408126831e-06, 7.567927241325378e-06, 8.419156074523926e-06, 9.270384907722473e-06, 1.012161374092102e-05, 1.0972842574119568e-05, 1.1824071407318115e-05, 1.2675300240516663e-05, 1.352652907371521e-05, 1.4377757906913757e-05, 1.5228986740112305e-05, 1.6080215573310852e-05, 1.69314444065094e-05, 1.7782673239707947e-05, 1.8633902072906494e-05, 1.948513090610504e-05, 2.033635973930359e-05, 2.1187588572502136e-05, 2.2038817405700684e-05, 2.289004623889923e-05, 2.374127507209778e-05, 2.4592503905296326e-05, 2.5443732738494873e-05, 2.629496157169342e-05, 2.7146190404891968e-05, 2.7997419238090515e-05, 2.8848648071289062e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 4.0, 20.0, 28.0, 36.0, 49.0, 92.0, 177.0, 264.0, 441.0, 766.0, 1376.0, 2480.0, 4918.0, 9264.0, 18701.0, 37727.0, 73532.0, 130226.0, 198903.0, 234392.0, 150860.0, 89269.0, 47097.0, 23369.0, 11615.0, 5879.0, 3133.0, 1683.0, 857.0, 554.0, 343.0, 182.0, 114.0, 72.0, 48.0, 25.0, 27.0, 16.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0589599609375, -0.05728292465209961, -0.05560588836669922, -0.05392885208129883, -0.05225181579589844, -0.05057477951049805, -0.048897743225097656, -0.047220706939697266, -0.045543670654296875, -0.043866634368896484, -0.042189598083496094, -0.0405125617980957, -0.03883552551269531, -0.03715848922729492, -0.03548145294189453, -0.03380441665649414, -0.03212738037109375, -0.03045034408569336, -0.02877330780029297, -0.027096271514892578, -0.025419235229492188, -0.023742198944091797, -0.022065162658691406, -0.020388126373291016, -0.018711090087890625, -0.017034053802490234, -0.015357017517089844, -0.013679981231689453, -0.012002944946289062, -0.010325908660888672, -0.008648872375488281, -0.006971836090087891, -0.0052947998046875, -0.0036177635192871094, -0.0019407272338867188, -0.0002636909484863281, 0.0014133453369140625, 0.003090381622314453, 0.004767417907714844, 0.006444454193115234, 0.008121490478515625, 0.009798526763916016, 0.011475563049316406, 0.013152599334716797, 0.014829635620117188, 0.016506671905517578, 0.01818370819091797, 0.01986074447631836, 0.02153778076171875, 0.02321481704711914, 0.02489185333251953, 0.026568889617919922, 0.028245925903320312, 0.029922962188720703, 0.031599998474121094, 0.033277034759521484, 0.034954071044921875, 0.036631107330322266, 0.038308143615722656, 0.03998517990112305, 0.04166221618652344, 0.04333925247192383, 0.04501628875732422, 0.04669332504272461, 0.048370361328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 20.0, 18.0, 22.0, 27.0, 28.0, 42.0, 33.0, 35.0, 48.0, 58.0, 50.0, 46.0, 58.0, 63.0, 60.0, 45.0, 46.0, 47.0, 37.0, 34.0, 37.0, 25.0, 25.0, 12.0, 13.0, 4.0, 12.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.09722900390625, -0.09464168548583984, -0.09205436706542969, -0.08946704864501953, -0.08687973022460938, -0.08429241180419922, -0.08170509338378906, -0.0791177749633789, -0.07653045654296875, -0.0739431381225586, -0.07135581970214844, -0.06876850128173828, -0.06618118286132812, -0.06359386444091797, -0.06100654602050781, -0.058419227600097656, -0.0558319091796875, -0.053244590759277344, -0.05065727233886719, -0.04806995391845703, -0.045482635498046875, -0.04289531707763672, -0.04030799865722656, -0.037720680236816406, -0.03513336181640625, -0.032546043395996094, -0.029958724975585938, -0.02737140655517578, -0.024784088134765625, -0.02219676971435547, -0.019609451293945312, -0.017022132873535156, -0.014434814453125, -0.011847496032714844, -0.009260177612304688, -0.006672859191894531, -0.004085540771484375, -0.0014982223510742188, 0.0010890960693359375, 0.0036764144897460938, 0.00626373291015625, 0.008851051330566406, 0.011438369750976562, 0.014025688171386719, 0.016613006591796875, 0.01920032501220703, 0.021787643432617188, 0.024374961853027344, 0.0269622802734375, 0.029549598693847656, 0.03213691711425781, 0.03472423553466797, 0.037311553955078125, 0.03989887237548828, 0.04248619079589844, 0.045073509216308594, 0.04766082763671875, 0.050248146057128906, 0.05283546447753906, 0.05542278289794922, 0.058010101318359375, 0.06059741973876953, 0.06318473815917969, 0.06577205657958984, 0.068359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 12.0, 22.0, 59.0, 77.0, 133.0, 202.0, 194.0, 121.0, 87.0, 38.0, 25.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.788917064666748, -2.7024102210998535, -2.615903377532959, -2.5293965339660645, -2.44288969039917, -2.3563828468322754, -2.269876003265381, -2.1833691596984863, -2.096862316131592, -2.0103554725646973, -1.9238486289978027, -1.8373417854309082, -1.7508349418640137, -1.6643280982971191, -1.5778212547302246, -1.49131441116333, -1.404807686805725, -1.3183008432388306, -1.231793999671936, -1.1452871561050415, -1.058780312538147, -0.9722734689712524, -0.8857666850090027, -0.7992598414421082, -0.7127529978752136, -0.6262461543083191, -0.5397393107414246, -0.4532324969768524, -0.3667256534099579, -0.28021880984306335, -0.1937119960784912, -0.10720515251159668, -0.02069830894470215, 0.06580852717161179, 0.15231536328792572, 0.23882219195365906, 0.3253290355205536, 0.4118358790874481, 0.49834269285202026, 0.5848495364189148, 0.6713563799858093, 0.7578632235527039, 0.8443700671195984, 0.9308768510818481, 1.0173836946487427, 1.1038905382156372, 1.1903973817825317, 1.2769042253494263, 1.3634110689163208, 1.4499179124832153, 1.5364247560501099, 1.6229315996170044, 1.709438443183899, 1.7959452867507935, 1.8824520111083984, 1.968958854675293, 2.0554656982421875, 2.141972541809082, 2.2284793853759766, 2.314986228942871, 2.4014930725097656, 2.48799991607666, 2.5745067596435547, 2.661013603210449, 2.7475204467773438]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 5.0, 2.0, 5.0, 9.0, 6.0, 5.0, 9.0, 16.0, 14.0, 8.0, 20.0, 21.0, 23.0, 18.0, 30.0, 39.0, 47.0, 39.0, 39.0, 46.0, 47.0, 37.0, 48.0, 40.0, 44.0, 41.0, 42.0, 24.0, 44.0, 26.0, 31.0, 23.0, 25.0, 25.0, 18.0, 13.0, 17.0, 12.0, 10.0, 8.0, 6.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.289499044418335, -1.240760326385498, -1.1920214891433716, -1.1432827711105347, -1.0945439338684082, -1.0458052158355713, -0.9970664381980896, -0.9483276605606079, -0.8995888829231262, -0.8508501052856445, -0.8021113276481628, -0.7533725500106812, -0.7046338319778442, -0.6558949947357178, -0.6071562767028809, -0.5584174990653992, -0.5096787214279175, -0.4609399437904358, -0.4122011661529541, -0.3634624183177948, -0.3147236406803131, -0.2659848630428314, -0.21724611520767212, -0.16850733757019043, -0.11976855993270874, -0.07102978974580765, -0.022291019558906555, 0.02644774317741394, 0.07518652081489563, 0.12392529845237732, 0.17266404628753662, 0.2214028239250183, 0.2701416015625, 0.3188803791999817, 0.3676191568374634, 0.4163579046726227, 0.46509668231010437, 0.5138354301452637, 0.5625742077827454, 0.611312985420227, 0.6600517630577087, 0.7087905406951904, 0.7575293183326721, 0.8062680959701538, 0.8550068140029907, 0.9037456512451172, 0.9524843692779541, 1.001223087310791, 1.0499619245529175, 1.0987006425857544, 1.1474394798278809, 1.1961781978607178, 1.2449170351028442, 1.2936557531356812, 1.3423945903778076, 1.3911333084106445, 1.4398720264434814, 1.4886107444763184, 1.5373495817184448, 1.5860882997512817, 1.6348271369934082, 1.6835658550262451, 1.732304573059082, 1.7810434103012085, 1.829782247543335]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 11.0, 14.0, 17.0, 18.0, 26.0, 30.0, 45.0, 68.0, 83.0, 120.0, 210.0, 331.0, 622.0, 1420.0, 3458.0, 11835.0, 52495.0, 243142.0, 788580.0, 1370899.0, 1139210.0, 446571.0, 103123.0, 21912.0, 5775.0, 2147.0, 893.0, 434.0, 234.0, 181.0, 121.0, 73.0, 57.0, 31.0, 30.0, 16.0, 10.0, 10.0, 5.0, 14.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2538032531738281, -0.24393463134765625, -0.23406600952148438, -0.2241973876953125, -0.21432876586914062, -0.20446014404296875, -0.19459152221679688, -0.184722900390625, -0.17485427856445312, -0.16498565673828125, -0.15511703491210938, -0.1452484130859375, -0.13537979125976562, -0.12551116943359375, -0.11564254760742188, -0.10577392578125, -0.09590530395507812, -0.08603668212890625, -0.07616806030273438, -0.0662994384765625, -0.056430816650390625, -0.04656219482421875, -0.036693572998046875, -0.026824951171875, -0.016956329345703125, -0.00708770751953125, 0.002780914306640625, 0.0126495361328125, 0.022518157958984375, 0.03238677978515625, 0.042255401611328125, 0.0521240234375, 0.061992645263671875, 0.07186126708984375, 0.08172988891601562, 0.0915985107421875, 0.10146713256835938, 0.11133575439453125, 0.12120437622070312, 0.131072998046875, 0.14094161987304688, 0.15081024169921875, 0.16067886352539062, 0.1705474853515625, 0.18041610717773438, 0.19028472900390625, 0.20015335083007812, 0.21002197265625, 0.21989059448242188, 0.22975921630859375, 0.23962783813476562, 0.2494964599609375, 0.2593650817871094, 0.26923370361328125, 0.2791023254394531, 0.288970947265625, 0.2988395690917969, 0.30870819091796875, 0.3185768127441406, 0.3284454345703125, 0.3383140563964844, 0.34818267822265625, 0.3580513000488281, 0.367919921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 9.0, 7.0, 13.0, 16.0, 26.0, 26.0, 27.0, 28.0, 29.0, 28.0, 42.0, 34.0, 44.0, 33.0, 43.0, 40.0, 46.0, 35.0, 37.0, 46.0, 35.0, 37.0, 31.0, 26.0, 31.0, 26.0, 26.0, 15.0, 26.0, 21.0, 18.0, 14.0, 10.0, 9.0, 13.0, 6.0, 4.0, 5.0, 9.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221435546875, -0.21432113647460938, -0.20720672607421875, -0.20009231567382812, -0.1929779052734375, -0.18586349487304688, -0.17874908447265625, -0.17163467407226562, -0.164520263671875, -0.15740585327148438, -0.15029144287109375, -0.14317703247070312, -0.1360626220703125, -0.12894821166992188, -0.12183380126953125, -0.11471939086914062, -0.10760498046875, -0.10049057006835938, -0.09337615966796875, -0.08626174926757812, -0.0791473388671875, -0.07203292846679688, -0.06491851806640625, -0.057804107666015625, -0.050689697265625, -0.043575286865234375, -0.03646087646484375, -0.029346466064453125, -0.0222320556640625, -0.015117645263671875, -0.00800323486328125, -0.000888824462890625, 0.0062255859375, 0.013339996337890625, 0.02045440673828125, 0.027568817138671875, 0.0346832275390625, 0.041797637939453125, 0.04891204833984375, 0.056026458740234375, 0.063140869140625, 0.07025527954101562, 0.07736968994140625, 0.08448410034179688, 0.0915985107421875, 0.09871292114257812, 0.10582733154296875, 0.11294174194335938, 0.12005615234375, 0.12717056274414062, 0.13428497314453125, 0.14139938354492188, 0.1485137939453125, 0.15562820434570312, 0.16274261474609375, 0.16985702514648438, 0.176971435546875, 0.18408584594726562, 0.19120025634765625, 0.19831466674804688, 0.2054290771484375, 0.21254348754882812, 0.21965789794921875, 0.22677230834960938, 0.23388671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 8.0, 7.0, 16.0, 14.0, 19.0, 44.0, 61.0, 75.0, 93.0, 181.0, 256.0, 475.0, 800.0, 1555.0, 3746.0, 11353.0, 58726.0, 578238.0, 2956565.0, 511140.0, 53207.0, 10734.0, 3498.0, 1447.0, 759.0, 417.0, 264.0, 165.0, 118.0, 86.0, 46.0, 45.0, 25.0, 21.0, 18.0, 12.0, 15.0, 5.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5078125, -0.4921760559082031, -0.47653961181640625, -0.4609031677246094, -0.4452667236328125, -0.4296302795410156, -0.41399383544921875, -0.3983573913574219, -0.382720947265625, -0.3670845031738281, -0.35144805908203125, -0.3358116149902344, -0.3201751708984375, -0.3045387268066406, -0.28890228271484375, -0.2732658386230469, -0.25762939453125, -0.24199295043945312, -0.22635650634765625, -0.21072006225585938, -0.1950836181640625, -0.17944717407226562, -0.16381072998046875, -0.14817428588867188, -0.132537841796875, -0.11690139770507812, -0.10126495361328125, -0.08562850952148438, -0.0699920654296875, -0.054355621337890625, -0.03871917724609375, -0.023082733154296875, -0.0074462890625, 0.008190155029296875, 0.02382659912109375, 0.039463043212890625, 0.0550994873046875, 0.07073593139648438, 0.08637237548828125, 0.10200881958007812, 0.117645263671875, 0.13328170776367188, 0.14891815185546875, 0.16455459594726562, 0.1801910400390625, 0.19582748413085938, 0.21146392822265625, 0.22710037231445312, 0.24273681640625, 0.2583732604980469, 0.27400970458984375, 0.2896461486816406, 0.3052825927734375, 0.3209190368652344, 0.33655548095703125, 0.3521919250488281, 0.367828369140625, 0.3834648132324219, 0.39910125732421875, 0.4147377014160156, 0.4303741455078125, 0.4460105895996094, 0.46164703369140625, 0.4772834777832031, 0.492919921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 10.0, 12.0, 9.0, 23.0, 29.0, 39.0, 58.0, 72.0, 126.0, 166.0, 243.0, 300.0, 401.0, 458.0, 423.0, 449.0, 351.0, 249.0, 216.0, 137.0, 77.0, 71.0, 49.0, 35.0, 21.0, 12.0, 11.0, 3.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4521484375, -0.435455322265625, -0.41876220703125, -0.402069091796875, -0.3853759765625, -0.368682861328125, -0.35198974609375, -0.335296630859375, -0.318603515625, -0.301910400390625, -0.28521728515625, -0.268524169921875, -0.2518310546875, -0.235137939453125, -0.21844482421875, -0.201751708984375, -0.18505859375, -0.168365478515625, -0.15167236328125, -0.134979248046875, -0.1182861328125, -0.101593017578125, -0.08489990234375, -0.068206787109375, -0.051513671875, -0.034820556640625, -0.01812744140625, -0.001434326171875, 0.0152587890625, 0.031951904296875, 0.04864501953125, 0.065338134765625, 0.08203125, 0.098724365234375, 0.11541748046875, 0.132110595703125, 0.1488037109375, 0.165496826171875, 0.18218994140625, 0.198883056640625, 0.215576171875, 0.232269287109375, 0.24896240234375, 0.265655517578125, 0.2823486328125, 0.299041748046875, 0.31573486328125, 0.332427978515625, 0.34912109375, 0.365814208984375, 0.38250732421875, 0.399200439453125, 0.4158935546875, 0.432586669921875, 0.44927978515625, 0.465972900390625, 0.482666015625, 0.499359130859375, 0.51605224609375, 0.532745361328125, 0.5494384765625, 0.566131591796875, 0.58282470703125, 0.599517822265625, 0.6162109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 5.0, 9.0, 16.0, 24.0, 41.0, 52.0, 67.0, 95.0, 93.0, 120.0, 106.0, 99.0, 74.0, 63.0, 26.0, 34.0, 17.0, 13.0, 9.0, 4.0, 2.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669386625289917, -2.5404624938964844, -2.4115383625030518, -2.282614231109619, -2.1536898612976074, -2.024765729904175, -1.8958415985107422, -1.7669174671173096, -1.6379932165145874, -1.5090690851211548, -1.3801448345184326, -1.251220703125, -1.1222965717315674, -0.9933723211288452, -0.8644481897354126, -0.7355239987373352, -0.6065998077392578, -0.4776756167411804, -0.3487514555454254, -0.2198272943496704, -0.09090310335159302, 0.038021087646484375, 0.166945219039917, 0.2958694100379944, 0.4247936010360718, 0.5537177920341492, 0.6826419830322266, 0.8115661144256592, 0.9404903054237366, 1.069414496421814, 1.1983386278152466, 1.3272628784179688, 1.4561867713928223, 1.5851109027862549, 1.714035153388977, 1.8429592847824097, 1.9718835353851318, 2.1008076667785645, 2.229731798171997, 2.3586559295654297, 2.4875802993774414, 2.616504430770874, 2.7454285621643066, 2.8743529319763184, 3.003277063369751, 3.1322011947631836, 3.261125326156616, 3.390049457550049, 3.5189735889434814, 3.647897720336914, 3.7768218517303467, 3.9057459831237793, 4.034670352935791, 4.1635942459106445, 4.292518615722656, 4.421442985534668, 4.5503668785095215, 4.679291248321533, 4.808215141296387, 4.937139511108398, 5.066063404083252, 5.194987773895264, 5.323911666870117, 5.452836036682129, 5.581760406494141]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 7.0, 5.0, 8.0, 12.0, 10.0, 19.0, 22.0, 13.0, 16.0, 34.0, 24.0, 15.0, 35.0, 30.0, 29.0, 40.0, 45.0, 37.0, 30.0, 43.0, 41.0, 46.0, 32.0, 41.0, 31.0, 41.0, 33.0, 31.0, 24.0, 25.0, 34.0, 20.0, 19.0, 13.0, 8.0, 11.0, 14.0, 5.0, 9.0, 5.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.658757209777832, -1.6051093339920044, -1.5514614582061768, -1.4978135824203491, -1.4441657066345215, -1.3905178308486938, -1.3368699550628662, -1.283221960067749, -1.229574203491211, -1.1759263277053833, -1.1222784519195557, -1.068630576133728, -1.0149827003479004, -0.9613348245620728, -0.9076868891716003, -0.8540390133857727, -0.8003910779953003, -0.7467432022094727, -0.693095326423645, -0.6394474506378174, -0.5857995748519897, -0.5321516990661621, -0.4785037636756897, -0.42485588788986206, -0.3712080121040344, -0.3175601363182068, -0.26391226053237915, -0.21026435494422913, -0.1566164791584015, -0.10296860337257385, -0.04932069778442383, 0.004327178001403809, 0.057974934577941895, 0.11162281781435013, 0.16527070105075836, 0.2189185917377472, 0.27256646752357483, 0.32621434330940247, 0.3798622488975525, 0.4335101246833801, 0.48715800046920776, 0.5408058762550354, 0.594453752040863, 0.6481016874313354, 0.7017495632171631, 0.7553974390029907, 0.8090453147888184, 0.862693190574646, 0.9163410663604736, 0.9699889421463013, 1.023636817932129, 1.0772846937179565, 1.1309325695037842, 1.1845804452896118, 1.2382283210754395, 1.2918763160705566, 1.3455240726470947, 1.3991719484329224, 1.45281982421875, 1.5064677000045776, 1.5601155757904053, 1.613763451576233, 1.6674113273620605, 1.7210593223571777, 1.7747071981430054]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 12.0, 14.0, 13.0, 28.0, 29.0, 47.0, 59.0, 86.0, 138.0, 207.0, 345.0, 548.0, 1013.0, 1982.0, 4242.0, 10786.0, 32019.0, 121242.0, 420981.0, 330555.0, 84791.0, 23596.0, 8411.0, 3521.0, 1638.0, 888.0, 473.0, 297.0, 200.0, 111.0, 91.0, 51.0, 32.0, 28.0, 23.0, 15.0, 14.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.363037109375, -0.3519935607910156, -0.34095001220703125, -0.3299064636230469, -0.3188629150390625, -0.3078193664550781, -0.29677581787109375, -0.2857322692871094, -0.274688720703125, -0.2636451721191406, -0.25260162353515625, -0.24155807495117188, -0.2305145263671875, -0.21947097778320312, -0.20842742919921875, -0.19738388061523438, -0.18634033203125, -0.17529678344726562, -0.16425323486328125, -0.15320968627929688, -0.1421661376953125, -0.13112258911132812, -0.12007904052734375, -0.10903549194335938, -0.097991943359375, -0.08694839477539062, -0.07590484619140625, -0.06486129760742188, -0.0538177490234375, -0.042774200439453125, -0.03173065185546875, -0.020687103271484375, -0.0096435546875, 0.001399993896484375, 0.01244354248046875, 0.023487091064453125, 0.0345306396484375, 0.045574188232421875, 0.05661773681640625, 0.06766128540039062, 0.078704833984375, 0.08974838256835938, 0.10079193115234375, 0.11183547973632812, 0.1228790283203125, 0.13392257690429688, 0.14496612548828125, 0.15600967407226562, 0.16705322265625, 0.17809677124023438, 0.18914031982421875, 0.20018386840820312, 0.2112274169921875, 0.22227096557617188, 0.23331451416015625, 0.24435806274414062, 0.255401611328125, 0.2664451599121094, 0.27748870849609375, 0.2885322570800781, 0.2995758056640625, 0.3106193542480469, 0.32166290283203125, 0.3327064514160156, 0.34375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 4.0, 8.0, 8.0, 6.0, 17.0, 16.0, 22.0, 27.0, 35.0, 27.0, 41.0, 49.0, 40.0, 43.0, 57.0, 58.0, 60.0, 44.0, 43.0, 41.0, 45.0, 40.0, 44.0, 33.0, 46.0, 25.0, 25.0, 18.0, 19.0, 14.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37109375, -0.3598365783691406, -0.34857940673828125, -0.3373222351074219, -0.3260650634765625, -0.3148078918457031, -0.30355072021484375, -0.2922935485839844, -0.281036376953125, -0.2697792053222656, -0.25852203369140625, -0.24726486206054688, -0.2360076904296875, -0.22475051879882812, -0.21349334716796875, -0.20223617553710938, -0.19097900390625, -0.17972183227539062, -0.16846466064453125, -0.15720748901367188, -0.1459503173828125, -0.13469314575195312, -0.12343597412109375, -0.11217880249023438, -0.100921630859375, -0.08966445922851562, -0.07840728759765625, -0.06715011596679688, -0.0558929443359375, -0.044635772705078125, -0.03337860107421875, -0.022121429443359375, -0.0108642578125, 0.000392913818359375, 0.01165008544921875, 0.022907257080078125, 0.0341644287109375, 0.045421600341796875, 0.05667877197265625, 0.06793594360351562, 0.079193115234375, 0.09045028686523438, 0.10170745849609375, 0.11296463012695312, 0.1242218017578125, 0.13547897338867188, 0.14673614501953125, 0.15799331665039062, 0.16925048828125, 0.18050765991210938, 0.19176483154296875, 0.20302200317382812, 0.2142791748046875, 0.22553634643554688, 0.23679351806640625, 0.24805068969726562, 0.259307861328125, 0.2705650329589844, 0.28182220458984375, 0.2930793762207031, 0.3043365478515625, 0.3155937194824219, 0.32685089111328125, 0.3381080627441406, 0.349365234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 14.0, 10.0, 11.0, 11.0, 25.0, 25.0, 27.0, 54.0, 73.0, 134.0, 237.0, 412.0, 892.0, 2141.0, 5829.0, 20260.0, 99125.0, 600190.0, 259193.0, 42999.0, 10690.0, 3531.0, 1312.0, 582.0, 300.0, 156.0, 97.0, 66.0, 39.0, 30.0, 26.0, 17.0, 12.0, 8.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.292205810546875, -0.28167724609375, -0.271148681640625, -0.2606201171875, -0.250091552734375, -0.23956298828125, -0.229034423828125, -0.218505859375, -0.207977294921875, -0.19744873046875, -0.186920166015625, -0.1763916015625, -0.165863037109375, -0.15533447265625, -0.144805908203125, -0.13427734375, -0.123748779296875, -0.11322021484375, -0.102691650390625, -0.0921630859375, -0.081634521484375, -0.07110595703125, -0.060577392578125, -0.050048828125, -0.039520263671875, -0.02899169921875, -0.018463134765625, -0.0079345703125, 0.002593994140625, 0.01312255859375, 0.023651123046875, 0.0341796875, 0.044708251953125, 0.05523681640625, 0.065765380859375, 0.0762939453125, 0.086822509765625, 0.09735107421875, 0.107879638671875, 0.118408203125, 0.128936767578125, 0.13946533203125, 0.149993896484375, 0.1605224609375, 0.171051025390625, 0.18157958984375, 0.192108154296875, 0.20263671875, 0.213165283203125, 0.22369384765625, 0.234222412109375, 0.2447509765625, 0.255279541015625, 0.26580810546875, 0.276336669921875, 0.286865234375, 0.297393798828125, 0.30792236328125, 0.318450927734375, 0.3289794921875, 0.339508056640625, 0.35003662109375, 0.360565185546875, 0.37109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 7.0, 16.0, 13.0, 24.0, 21.0, 13.0, 27.0, 41.0, 55.0, 62.0, 65.0, 67.0, 75.0, 66.0, 64.0, 69.0, 47.0, 47.0, 44.0, 34.0, 27.0, 14.0, 15.0, 13.0, 17.0, 6.0, 7.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.791015625, -0.7649612426757812, -0.7389068603515625, -0.7128524780273438, -0.686798095703125, -0.6607437133789062, -0.6346893310546875, -0.6086349487304688, -0.58258056640625, -0.5565261840820312, -0.5304718017578125, -0.5044174194335938, -0.478363037109375, -0.45230865478515625, -0.4262542724609375, -0.40019989013671875, -0.3741455078125, -0.34809112548828125, -0.3220367431640625, -0.29598236083984375, -0.269927978515625, -0.24387359619140625, -0.2178192138671875, -0.19176483154296875, -0.16571044921875, -0.13965606689453125, -0.1136016845703125, -0.08754730224609375, -0.061492919921875, -0.03543853759765625, -0.0093841552734375, 0.01667022705078125, 0.042724609375, 0.06877899169921875, 0.0948333740234375, 0.12088775634765625, 0.146942138671875, 0.17299652099609375, 0.1990509033203125, 0.22510528564453125, 0.25115966796875, 0.27721405029296875, 0.3032684326171875, 0.32932281494140625, 0.355377197265625, 0.38143157958984375, 0.4074859619140625, 0.43354034423828125, 0.4595947265625, 0.48564910888671875, 0.5117034912109375, 0.5377578735351562, 0.563812255859375, 0.5898666381835938, 0.6159210205078125, 0.6419754028320312, 0.66802978515625, 0.6940841674804688, 0.7201385498046875, 0.7461929321289062, 0.772247314453125, 0.7983016967773438, 0.8243560791015625, 0.8504104614257812, 0.87646484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 29.0, 38.0, 102.0, 255.0, 1520.0, 209311.0, 834250.0, 2429.0, 367.0, 115.0, 55.0, 31.0, 15.0, 7.0, 10.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.3642616271972656, -0.35254669189453125, -0.3408317565917969, -0.3291168212890625, -0.3174018859863281, -0.30568695068359375, -0.2939720153808594, -0.282257080078125, -0.2705421447753906, -0.25882720947265625, -0.24711227416992188, -0.2353973388671875, -0.22368240356445312, -0.21196746826171875, -0.20025253295898438, -0.18853759765625, -0.17682266235351562, -0.16510772705078125, -0.15339279174804688, -0.1416778564453125, -0.12996292114257812, -0.11824798583984375, -0.10653305053710938, -0.094818115234375, -0.08310317993164062, -0.07138824462890625, -0.059673309326171875, -0.0479583740234375, -0.036243438720703125, -0.02452850341796875, -0.012813568115234375, -0.0010986328125, 0.010616302490234375, 0.02233123779296875, 0.034046173095703125, 0.0457611083984375, 0.057476043701171875, 0.06919097900390625, 0.08090591430664062, 0.092620849609375, 0.10433578491210938, 0.11605072021484375, 0.12776565551757812, 0.1394805908203125, 0.15119552612304688, 0.16291046142578125, 0.17462539672851562, 0.18634033203125, 0.19805526733398438, 0.20977020263671875, 0.22148513793945312, 0.2332000732421875, 0.24491500854492188, 0.25662994384765625, 0.2683448791503906, 0.280059814453125, 0.2917747497558594, 0.30348968505859375, 0.3152046203613281, 0.3269195556640625, 0.3386344909667969, 0.35034942626953125, 0.3620643615722656, 0.373779296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 10.0, 16.0, 23.0, 33.0, 67.0, 65.0, 77.0, 91.0, 92.0, 121.0, 87.0, 86.0, 57.0, 48.0, 31.0, 21.0, 22.0, 4.0, 11.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-05, -2.413243055343628e-05, -2.3230910301208496e-05, -2.2329390048980713e-05, -2.142786979675293e-05, -2.0526349544525146e-05, -1.9624829292297363e-05, -1.872330904006958e-05, -1.7821788787841797e-05, -1.6920268535614014e-05, -1.601874828338623e-05, -1.5117228031158447e-05, -1.4215707778930664e-05, -1.3314187526702881e-05, -1.2412667274475098e-05, -1.1511147022247314e-05, -1.0609626770019531e-05, -9.708106517791748e-06, -8.806586265563965e-06, -7.905066013336182e-06, -7.0035457611083984e-06, -6.102025508880615e-06, -5.200505256652832e-06, -4.298985004425049e-06, -3.3974647521972656e-06, -2.4959444999694824e-06, -1.5944242477416992e-06, -6.92903995513916e-07, 2.086162567138672e-07, 1.1101365089416504e-06, 2.0116567611694336e-06, 2.913177013397217e-06, 3.814697265625e-06, 4.716217517852783e-06, 5.617737770080566e-06, 6.51925802230835e-06, 7.420778274536133e-06, 8.322298526763916e-06, 9.2238187789917e-06, 1.0125339031219482e-05, 1.1026859283447266e-05, 1.1928379535675049e-05, 1.2829899787902832e-05, 1.3731420040130615e-05, 1.4632940292358398e-05, 1.553446054458618e-05, 1.6435980796813965e-05, 1.7337501049041748e-05, 1.823902130126953e-05, 1.9140541553497314e-05, 2.0042061805725098e-05, 2.094358205795288e-05, 2.1845102310180664e-05, 2.2746622562408447e-05, 2.364814281463623e-05, 2.4549663066864014e-05, 2.5451183319091797e-05, 2.635270357131958e-05, 2.7254223823547363e-05, 2.8155744075775146e-05, 2.905726432800293e-05, 2.9958784580230713e-05, 3.0860304832458496e-05, 3.176182508468628e-05, 3.266334533691406e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 4.0, 6.0, 2.0, 9.0, 12.0, 12.0, 18.0, 42.0, 69.0, 118.0, 208.0, 458.0, 1453.0, 8036.0, 146500.0, 847357.0, 38727.0, 3743.0, 976.0, 412.0, 193.0, 88.0, 46.0, 28.0, 14.0, 11.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.1835193634033203, -0.17746353149414062, -0.17140769958496094, -0.16535186767578125, -0.15929603576660156, -0.15324020385742188, -0.1471843719482422, -0.1411285400390625, -0.1350727081298828, -0.12901687622070312, -0.12296104431152344, -0.11690521240234375, -0.11084938049316406, -0.10479354858398438, -0.09873771667480469, -0.092681884765625, -0.08662605285644531, -0.08057022094726562, -0.07451438903808594, -0.06845855712890625, -0.06240272521972656, -0.056346893310546875, -0.05029106140136719, -0.0442352294921875, -0.03817939758300781, -0.032123565673828125, -0.026067733764648438, -0.02001190185546875, -0.013956069946289062, -0.007900238037109375, -0.0018444061279296875, 0.00421142578125, 0.010267257690429688, 0.016323089599609375, 0.022378921508789062, 0.02843475341796875, 0.03449058532714844, 0.040546417236328125, 0.04660224914550781, 0.0526580810546875, 0.05871391296386719, 0.06476974487304688, 0.07082557678222656, 0.07688140869140625, 0.08293724060058594, 0.08899307250976562, 0.09504890441894531, 0.101104736328125, 0.10716056823730469, 0.11321640014648438, 0.11927223205566406, 0.12532806396484375, 0.13138389587402344, 0.13743972778320312, 0.1434955596923828, 0.1495513916015625, 0.1556072235107422, 0.16166305541992188, 0.16771888732910156, 0.17377471923828125, 0.17983055114746094, 0.18588638305664062, 0.1919422149658203, 0.197998046875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 7.0, 9.0, 14.0, 32.0, 50.0, 88.0, 169.0, 212.0, 184.0, 110.0, 46.0, 40.0, 15.0, 7.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.31673622131347656, -0.3085212707519531, -0.3003063201904297, -0.29209136962890625, -0.2838764190673828, -0.2756614685058594, -0.26744651794433594, -0.2592315673828125, -0.25101661682128906, -0.24280166625976562, -0.2345867156982422, -0.22637176513671875, -0.2181568145751953, -0.20994186401367188, -0.20172691345214844, -0.193511962890625, -0.18529701232910156, -0.17708206176757812, -0.1688671112060547, -0.16065216064453125, -0.1524372100830078, -0.14422225952148438, -0.13600730895996094, -0.1277923583984375, -0.11957740783691406, -0.11136245727539062, -0.10314750671386719, -0.09493255615234375, -0.08671760559082031, -0.07850265502929688, -0.07028770446777344, -0.06207275390625, -0.05385780334472656, -0.045642852783203125, -0.03742790222167969, -0.02921295166015625, -0.020998001098632812, -0.012783050537109375, -0.0045680999755859375, 0.0036468505859375, 0.011861801147460938, 0.020076751708984375, 0.028291702270507812, 0.03650665283203125, 0.04472160339355469, 0.052936553955078125, 0.06115150451660156, 0.069366455078125, 0.07758140563964844, 0.08579635620117188, 0.09401130676269531, 0.10222625732421875, 0.11044120788574219, 0.11865615844726562, 0.12687110900878906, 0.1350860595703125, 0.14330101013183594, 0.15151596069335938, 0.1597309112548828, 0.16794586181640625, 0.1761608123779297, 0.18437576293945312, 0.19259071350097656, 0.2008056640625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 3.0, 5.0, 9.0, 10.0, 22.0, 38.0, 63.0, 130.0, 158.0, 242.0, 156.0, 72.0, 53.0, 20.0, 9.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309689044952393, -4.213437080383301, -4.117184638977051, -4.020932674407959, -3.924680233001709, -3.828428030014038, -3.732175827026367, -3.6359238624572754, -3.5396714210510254, -3.4434192180633545, -3.3471670150756836, -3.2509148120880127, -3.154662609100342, -3.058410406112671, -2.962158203125, -2.865906238555908, -2.7696540355682373, -2.6734018325805664, -2.5771496295928955, -2.4808974266052246, -2.3846452236175537, -2.288393020629883, -2.192141056060791, -2.095888614654541, -1.9996365308761597, -1.9033843278884888, -1.8071321249008179, -1.7108800411224365, -1.6146278381347656, -1.5183756351470947, -1.4221234321594238, -1.325871229171753, -1.2296192646026611, -1.1333670616149902, -1.0371148586273193, -0.9408627152442932, -0.8446105122566223, -0.7483583092689514, -0.6521061658859253, -0.5558539628982544, -0.4596017599105835, -0.3633495569229126, -0.2670973837375641, -0.17084521055221558, -0.07459300756454468, 0.02165919542312622, 0.11791133880615234, 0.21416354179382324, 0.31041574478149414, 0.40666794776916504, 0.5029201507568359, 0.5991722941398621, 0.695424497127533, 0.7916767001152039, 0.88792884349823, 0.9841810464859009, 1.0804332494735718, 1.1766854524612427, 1.2729376554489136, 1.369189739227295, 1.4654419422149658, 1.5616941452026367, 1.6579463481903076, 1.7541985511779785, 1.8504507541656494]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 5.0, 9.0, 10.0, 13.0, 19.0, 21.0, 26.0, 33.0, 24.0, 30.0, 49.0, 55.0, 58.0, 76.0, 115.0, 87.0, 63.0, 63.0, 43.0, 53.0, 26.0, 20.0, 19.0, 19.0, 11.0, 14.0, 10.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4957046508789062, -2.4190940856933594, -2.3424835205078125, -2.2658727169036865, -2.1892621517181396, -2.1126515865325928, -2.036040782928467, -1.95943021774292, -1.882819652557373, -1.8062090873718262, -1.7295984029769897, -1.6529877185821533, -1.5763771533966064, -1.4997665882110596, -1.4231559038162231, -1.3465452194213867, -1.2699346542358398, -1.193324089050293, -1.1167134046554565, -1.0401027202606201, -0.9634921550750732, -0.8868815302848816, -0.8102709054946899, -0.7336602807044983, -0.6570496559143066, -0.580439031124115, -0.5038284063339233, -0.4272177815437317, -0.35060715675354004, -0.2739965319633484, -0.19738590717315674, -0.12077528238296509, -0.04416489601135254, 0.03244572877883911, 0.10905635356903076, 0.1856669783592224, 0.26227760314941406, 0.3388882279396057, 0.41549885272979736, 0.492109477519989, 0.5687201023101807, 0.6453307271003723, 0.721941351890564, 0.7985519766807556, 0.8751626014709473, 0.9517732262611389, 1.0283838510513306, 1.104994535446167, 1.1816051006317139, 1.2582156658172607, 1.3348263502120972, 1.4114370346069336, 1.4880475997924805, 1.5646581649780273, 1.6412688493728638, 1.7178795337677002, 1.794490098953247, 1.871100664138794, 1.9477113485336304, 2.024322032928467, 2.1009325981140137, 2.1775431632995605, 2.2541537284851074, 2.3307645320892334, 2.4073750972747803]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 13.0, 12.0, 12.0, 15.0, 15.0, 23.0, 36.0, 33.0, 36.0, 48.0, 105.0, 225.0, 147.0, 45.0, 40.0, 25.0, 24.0, 25.0, 21.0, 11.0, 20.0, 11.0, 12.0, 10.0, 5.0, 3.0, 1.0, 4.0, 2.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.4025993347167969, -0.39064788818359375, -0.3786964416503906, -0.3667449951171875, -0.3547935485839844, -0.34284210205078125, -0.3308906555175781, -0.318939208984375, -0.3069877624511719, -0.29503631591796875, -0.2830848693847656, -0.2711334228515625, -0.2591819763183594, -0.24723052978515625, -0.23527908325195312, -0.22332763671875, -0.21137619018554688, -0.19942474365234375, -0.18747329711914062, -0.1755218505859375, -0.16357040405273438, -0.15161895751953125, -0.13966751098632812, -0.127716064453125, -0.11576461791992188, -0.10381317138671875, -0.09186172485351562, -0.0799102783203125, -0.06795883178710938, -0.05600738525390625, -0.044055938720703125, -0.0321044921875, -0.020153045654296875, -0.00820159912109375, 0.003749847412109375, 0.0157012939453125, 0.027652740478515625, 0.03960418701171875, 0.051555633544921875, 0.063507080078125, 0.07545852661132812, 0.08740997314453125, 0.09936141967773438, 0.1113128662109375, 0.12326431274414062, 0.13521575927734375, 0.14716720581054688, 0.15911865234375, 0.17107009887695312, 0.18302154541015625, 0.19497299194335938, 0.2069244384765625, 0.21887588500976562, 0.23082733154296875, 0.24277877807617188, 0.254730224609375, 0.2666816711425781, 0.27863311767578125, 0.2905845642089844, 0.3025360107421875, 0.3144874572753906, 0.32643890380859375, 0.3383903503417969, 0.350341796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 1.0, 8.0, 14.0, 19.0, 29.0, 30.0, 25.0, 48.0, 75.0, 120.0, 187.0, 303.0, 559.0, 1179.0, 2781.0, 8999.0, 63488.0, 8274418.0, 25929.0, 6136.0, 2084.0, 965.0, 437.0, 246.0, 174.0, 99.0, 64.0, 46.0, 25.0, 35.0, 19.0, 13.0, 12.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1407769918441772, -1.1084915399551392, -1.076206088066101, -1.043920636177063, -1.011635184288025, -0.9793497323989868, -0.9470642805099487, -0.9147788286209106, -0.8824933767318726, -0.8502079248428345, -0.8179224729537964, -0.7856370210647583, -0.7533515691757202, -0.7210661172866821, -0.688780665397644, -0.656495213508606, -0.6242097616195679, -0.5919243097305298, -0.5596388578414917, -0.5273534059524536, -0.4950679540634155, -0.46278250217437744, -0.43049705028533936, -0.39821159839630127, -0.3659261465072632, -0.3336406946182251, -0.301355242729187, -0.2690697908401489, -0.23678433895111084, -0.20449888706207275, -0.17221343517303467, -0.13992798328399658, -0.1076425313949585, -0.07535707950592041, -0.043071627616882324, -0.010786175727844238, 0.021499276161193848, 0.053784728050231934, 0.08607017993927002, 0.1183556318283081, 0.1506410837173462, 0.18292653560638428, 0.21521198749542236, 0.24749743938446045, 0.27978289127349854, 0.3120683431625366, 0.3443537950515747, 0.3766392469406128, 0.4089246988296509, 0.44121015071868896, 0.47349560260772705, 0.5057810544967651, 0.5380665063858032, 0.5703519582748413, 0.6026374101638794, 0.6349228620529175, 0.6672083139419556, 0.6994937658309937, 0.7317792177200317, 0.7640646696090698, 0.7963501214981079, 0.828635573387146, 0.8609210252761841, 0.8932064771652222, 0.9254919290542603]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.468613624572754, -1.4089070558547974, -1.3492003679275513, -1.2894937992095947, -1.2297871112823486, -1.170080542564392, -1.1103739738464355, -1.0506672859191895, -0.9909606575965881, -0.9312540292739868, -0.8715474009513855, -0.8118407726287842, -0.7521342039108276, -0.6924275159835815, -0.632720947265625, -0.5730143189430237, -0.5133076906204224, -0.45360106229782104, -0.3938944339752197, -0.3341878354549408, -0.2744812071323395, -0.21477457880973816, -0.15506798028945923, -0.09536135196685791, -0.03565472364425659, 0.02405189722776413, 0.08375851809978485, 0.14346513152122498, 0.2031717598438263, 0.2628783881664276, 0.32258498668670654, 0.38229161500930786, 0.4419982433319092, 0.5017048716545105, 0.5614114999771118, 0.6211180686950684, 0.6808247566223145, 0.740531325340271, 0.8002379536628723, 0.8599445819854736, 0.919651210308075, 0.9793578386306763, 1.0390644073486328, 1.098771095275879, 1.1584776639938354, 1.2181843519210815, 1.277890920639038, 1.3375976085662842, 1.3973041772842407, 1.4570107460021973, 1.5167174339294434, 1.5764240026474, 1.636130690574646, 1.6958372592926025, 1.7555439472198486, 1.8152505159378052, 1.8749570846557617, 1.9346636533737183, 1.9943703413009644, 2.054076910018921, 2.113783597946167, 2.173490285873413, 2.23319673538208, 2.292903423309326, 2.3526101112365723]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 7.0, 6.0, 8.0, 16.0, 22.0, 25.0, 26.0, 25.0, 38.0, 30.0, 43.0, 51.0, 45.0, 44.0, 54.0, 43.0, 58.0, 49.0, 52.0, 37.0, 47.0, 38.0, 42.0, 38.0, 24.0, 22.0, 21.0, 16.0, 13.0, 8.0, 7.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1998291015625, -0.19393348693847656, -0.18803787231445312, -0.1821422576904297, -0.17624664306640625, -0.1703510284423828, -0.16445541381835938, -0.15855979919433594, -0.1526641845703125, -0.14676856994628906, -0.14087295532226562, -0.1349773406982422, -0.12908172607421875, -0.12318611145019531, -0.11729049682617188, -0.11139488220214844, -0.105499267578125, -0.09960365295410156, -0.09370803833007812, -0.08781242370605469, -0.08191680908203125, -0.07602119445800781, -0.07012557983398438, -0.06422996520996094, -0.0583343505859375, -0.05243873596191406, -0.046543121337890625, -0.04064750671386719, -0.03475189208984375, -0.028856277465820312, -0.022960662841796875, -0.017065048217773438, -0.01116943359375, -0.0052738189697265625, 0.000621795654296875, 0.0065174102783203125, 0.01241302490234375, 0.018308639526367188, 0.024204254150390625, 0.030099868774414062, 0.0359954833984375, 0.04189109802246094, 0.047786712646484375, 0.05368232727050781, 0.05957794189453125, 0.06547355651855469, 0.07136917114257812, 0.07726478576660156, 0.083160400390625, 0.08905601501464844, 0.09495162963867188, 0.10084724426269531, 0.10674285888671875, 0.11263847351074219, 0.11853408813476562, 0.12442970275878906, 0.1303253173828125, 0.13622093200683594, 0.14211654663085938, 0.1480121612548828, 0.15390777587890625, 0.1598033905029297, 0.16569900512695312, 0.17159461975097656, 0.177490234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 5.0, 12.0, 22.0, 23.0, 31.0, 40.0, 56.0, 84.0, 122.0, 187.0, 244.0, 409.0, 512.0, 878.0, 1482.0, 2400.0, 4250.0, 7752.0, 15453.0, 33267.0, 91990.0, 192110.0, 100786.0, 36554.0, 16185.0, 8196.0, 4312.0, 2519.0, 1486.0, 943.0, 571.0, 405.0, 289.0, 195.0, 142.0, 100.0, 64.0, 56.0, 32.0, 31.0, 18.0, 12.0, 3.0, 9.0, 9.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.572265625, -2.485198974609375, -2.39813232421875, -2.311065673828125, -2.2239990234375, -2.136932373046875, -2.04986572265625, -1.962799072265625, -1.875732421875, -1.788665771484375, -1.70159912109375, -1.614532470703125, -1.5274658203125, -1.440399169921875, -1.35333251953125, -1.266265869140625, -1.17919921875, -1.092132568359375, -1.00506591796875, -0.917999267578125, -0.8309326171875, -0.743865966796875, -0.65679931640625, -0.569732666015625, -0.482666015625, -0.395599365234375, -0.30853271484375, -0.221466064453125, -0.1343994140625, -0.047332763671875, 0.03973388671875, 0.126800537109375, 0.2138671875, 0.300933837890625, 0.38800048828125, 0.475067138671875, 0.5621337890625, 0.649200439453125, 0.73626708984375, 0.823333740234375, 0.910400390625, 0.997467041015625, 1.08453369140625, 1.171600341796875, 1.2586669921875, 1.345733642578125, 1.43280029296875, 1.519866943359375, 1.60693359375, 1.694000244140625, 1.78106689453125, 1.868133544921875, 1.9552001953125, 2.042266845703125, 2.12933349609375, 2.216400146484375, 2.303466796875, 2.390533447265625, 2.47760009765625, 2.564666748046875, 2.6517333984375, 2.738800048828125, 2.82586669921875, 2.912933349609375, 3.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 3.0, 12.0, 13.0, 18.0, 16.0, 22.0, 19.0, 31.0, 39.0, 38.0, 44.0, 55.0, 60.0, 61.0, 61.0, 65.0, 64.0, 66.0, 35.0, 39.0, 33.0, 33.0, 30.0, 30.0, 27.0, 10.0, 20.0, 11.0, 10.0, 8.0, 4.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3403358459472656, -0.32862091064453125, -0.3169059753417969, -0.3051910400390625, -0.2934761047363281, -0.28176116943359375, -0.2700462341308594, -0.258331298828125, -0.24661636352539062, -0.23490142822265625, -0.22318649291992188, -0.2114715576171875, -0.19975662231445312, -0.18804168701171875, -0.17632675170898438, -0.16461181640625, -0.15289688110351562, -0.14118194580078125, -0.12946701049804688, -0.1177520751953125, -0.10603713989257812, -0.09432220458984375, -0.08260726928710938, -0.070892333984375, -0.059177398681640625, -0.04746246337890625, -0.035747528076171875, -0.0240325927734375, -0.012317657470703125, -0.00060272216796875, 0.011112213134765625, 0.0228271484375, 0.034542083740234375, 0.04625701904296875, 0.057971954345703125, 0.0696868896484375, 0.08140182495117188, 0.09311676025390625, 0.10483169555664062, 0.116546630859375, 0.12826156616210938, 0.13997650146484375, 0.15169143676757812, 0.1634063720703125, 0.17512130737304688, 0.18683624267578125, 0.19855117797851562, 0.21026611328125, 0.22198104858398438, 0.23369598388671875, 0.24541091918945312, 0.2571258544921875, 0.2688407897949219, 0.28055572509765625, 0.2922706604003906, 0.303985595703125, 0.3157005310058594, 0.32741546630859375, 0.3391304016113281, 0.3508453369140625, 0.3625602722167969, 0.37427520751953125, 0.3859901428222656, 0.397705078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 12.0, 9.0, 14.0, 35.0, 50.0, 71.0, 67.0, 64.0, 40.0, 19.0, 21.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3290114402770996, -1.2948863506317139, -1.2607612609863281, -1.2266360521316528, -1.192510962486267, -1.1583858728408813, -1.1242607831954956, -1.0901356935501099, -1.0560104846954346, -1.0218853950500488, -0.9877602458000183, -0.9536351561546326, -0.919510006904602, -0.8853849172592163, -0.8512598276138306, -0.8171347379684448, -0.7830096483230591, -0.7488845586776733, -0.7147594094276428, -0.6806343197822571, -0.6465091705322266, -0.6123840808868408, -0.5782589912414551, -0.5441339015960693, -0.5100087523460388, -0.4758836328983307, -0.44175851345062256, -0.4076334238052368, -0.3735083043575287, -0.33938318490982056, -0.3052580952644348, -0.2711329758167267, -0.237007737159729, -0.20288261771202087, -0.16875751316547394, -0.134632408618927, -0.10050728917121887, -0.06638216972351074, -0.032257065176963806, 0.0018680393695831299, 0.03599315881729126, 0.07011827081441879, 0.10424338281154633, 0.13836848735809326, 0.1724936068058014, 0.20661872625350952, 0.24074383080005646, 0.2748689353466034, 0.3089940547943115, 0.34311917424201965, 0.3772442936897278, 0.4113693833351135, 0.44549450278282166, 0.4796196222305298, 0.5137447118759155, 0.5478698015213013, 0.5819949507713318, 0.6161200404167175, 0.650245189666748, 0.6843702793121338, 0.7184953689575195, 0.75262051820755, 0.7867456078529358, 0.8208707571029663, 0.854995846748352]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 11.0, 3.0, 5.0, 13.0, 9.0, 7.0, 24.0, 58.0, 94.0, 76.0, 42.0, 30.0, 16.0, 15.0, 11.0, 11.0, 8.0, 7.0, 9.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.507197380065918, -1.4653044939041138, -1.4234116077423096, -1.3815187215805054, -1.3396258354187012, -1.297732949256897, -1.2558400630950928, -1.2139471769332886, -1.1720542907714844, -1.1301614046096802, -1.088268518447876, -1.0463756322860718, -1.0044827461242676, -0.9625898599624634, -0.9206969738006592, -0.878804087638855, -0.8369112014770508, -0.7950183153152466, -0.7531254291534424, -0.7112325429916382, -0.669339656829834, -0.6274467706680298, -0.5855538845062256, -0.5436609983444214, -0.5017681121826172, -0.459875226020813, -0.4179823398590088, -0.3760894536972046, -0.3341965675354004, -0.2923036813735962, -0.250410795211792, -0.2085179090499878, -0.16662490367889404, -0.12473201751708984, -0.08283913135528564, -0.040946245193481445, 0.0009466409683227539, 0.04283952713012695, 0.08473241329193115, 0.12662529945373535, 0.16851818561553955, 0.21041107177734375, 0.25230395793914795, 0.29419684410095215, 0.33608973026275635, 0.37798261642456055, 0.41987550258636475, 0.46176838874816895, 0.5036612749099731, 0.5455541610717773, 0.5874470472335815, 0.6293399333953857, 0.6712328195571899, 0.7131257057189941, 0.7550185918807983, 0.7969114780426025, 0.8388043642044067, 0.8806972503662109, 0.9225901365280151, 0.9644830226898193, 1.0063759088516235, 1.0482687950134277, 1.090161681175232, 1.1320545673370361, 1.1739474534988403]}, "eval/loss": 2.135566473007202, "eval/bleu": 1.0140224330923163e-13, "eval/runtime": 2535.9584, "eval/samples_per_second": 5.82, "eval/steps_per_second": 0.728, "train/train_runtime": 68135.2194, "train/train_samples_per_second": 9.131, "train/train_steps_per_second": 0.071, "train/total_flos": 0.0, "train/train_loss": 2.8622734340865916} \ No newline at end of file